{
    "codes": {
        "7e59c5d99907c76cf6b5598a": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the minimum monthly number of patients who had bacteremia - gram negative rod?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT COUNT( DISTINCT diagnosis.patientunitstayid ) AS C1 FROM diagnosis WHERE diagnosis.diagnosisname = 'bacteremia - gram negative rod' GROUP BY strftime('%Y-%m',diagnosis.diagnosistime) ) AS T1",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.diagnosisname LIKE '%bacteremia - gram negative rod%' AND diagnosis.diagnosisname LIKE '%colitis%' AND vitalperiodic.observationtime > patient.hospitaladmittime AND vitalperiodic.observationtime < date(patient.hospitaladmittime, '+1 MONTH')",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the logic by joining unrelated tables (vitalperiodic), adding extra filters on diagnosisname (including an irrelevant 'colitis' condition), and applying a time window on observationtime\u2014none of which align with the intended monthly aggregation of distinct diagnosis records. This is not a fixable syntax or single-clause mistake but a fundamental restructuring error that alters the query\u2019s purpose.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "b2647d82e56896db485d4407": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the prescription drug that patient 030-12393 was prescribed within the same hospital visit after being diagnosed with hyperglycemia in 11/this year?",
            "gold_sql": "SELECT T2.drugname FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-12393' ) AND diagnosis.diagnosisname = 'hyperglycemia' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',diagnosis.diagnosistime) = '11' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-12393' ) AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '11' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid INNER JOIN diagnosis ON diagnosis.patientunitstayid = patient.patientunitstayid INNER JOIN vitalperiodic ON vitalperiodic.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.icd9code = '401.9' AND strftime('%m',vitalperiodic.observationtime) = '11' AND patient.uniquepid = '030-12393'",
            "gold_answer": "[['aspirin'], ['diltiazem hcl'], ['diltiazem hcl'], ['diltiazem hcl'], ['diltiazem hcl'], ['diltiazem hcl'], ['diphenhydramine hcl'], ['furosemide'], ['furosemide'], ['insulin lispro'], ['lisinopril'], ['metoprolol tartrate'], ['metoprolol tartrate'], ['metoprolol tartrate'], ['metoprolol tartrate'], ['pantoprazole'], ['simvastatin']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the query logic by:\n1. Joining an unrelated vitalperiodic table, which is not part of the question about prescriptions after a hyperglycemia diagnosis.\n2. Filtering diagnosis by icd9code = '401.9' (hypertension) instead of diagnosisname = 'hyperglycemia'.\n3. Filtering on vitalperiodic.observationtime rather than medication.drugstarttime.\n4. Failing to enforce the temporal condition (diagnosis before prescription) and restricting to the same hospital visit.\nThese errors span multiple joins and clauses and fundamentally alter the query\u2019s intended structure and meaning. This is a Global error.",
            "error_type": "Global: join-error"
        },
        "57e889bf3fe08a0c30249fce": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 006-1016 experience the first instance where their heart rate was greater than 135.0?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-1016' ) ) AND vitalperiodic.heartrate > 135.0 AND vitalperiodic.heartrate IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1",
            "pred_sql": "SELECT observationtime FROM vitalperiodic WHERE patientunitstayid = 241360 AND heartrate > 135 ORDER BY observationtime LIMIT 1",
            "gold_answer": "[['2100-01-16 02:20:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query hard-codes patientunitstayid = 241360 instead of deriving the correct patientunitstayid(s) for uniquepid '006-1016' via the patient table joins. This is not a simple syntax or column-name mistake but a flawed filtering strategy that breaks the intended relationship between patient and vitalperiodic. It alters which records are considered and thus the overall logic of fetching the first high heart rate event for the specified patient.",
            "error_type": "Global: incorrect join/filter relationship"
        },
        "91fbea49b336f86cd67dbbda": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many days have elapsed since the last time patient 006-106259 got a platelets x 1000 lab test on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',lab.labresulttime) ) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106259' AND patient.hospitaldischargetime IS NULL ) ) AND lab.labname = 'platelets x 1000' ORDER BY lab.labresulttime DESC LIMIT 1",
            "pred_sql": "SELECT 2100 - strftime('%Y', lab.labresulttime) - strftime('%m', lab.labresulttime) + strftime('%d', lab.labresulttime) AS num FROM patient INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE patient.uniquepid = '006-106259' AND lab.labname = 'platelets x 1000'",
            "gold_answer": "[['1.52']]",
            "pred_answer": "[['15.0'], ['16.0'], ['17.0'], ['18.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict the lab results to the current hospital visit (no filter on hospitaldischargetime) and does not pick the most recent lab (no ORDER BY/LIMIT). It also uses an incorrect formula for date difference (2100 - year - month + day), rather than computing the Julian day difference relative to the fixed current time. These issues span multiple clauses (JOIN, WHERE, SELECT) and alter the overall logic, making the query fundamentally unable to answer the intended question.",
            "error_type": "Global: flawed structure and date calculation"
        },
        "ea593b30374a160e1a7febd4": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Is patient 002-12056's alt (sgpt) last measured on the first hospital visit greater than the first value measured on the first hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-12056' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'alt (sgpt)' ORDER BY lab.labresulttime DESC LIMIT 1 ) > ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-12056' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'alt (sgpt)' ORDER BY lab.labresulttime ASC LIMIT 1 )",
            "pred_sql": "SELECT DISTINCT CASE WHEN iif(sum(CASE WHEN vitalperiodic.observationlabel = 'ALT (SGPT)' THEN 1 ELSE 0 END) - sum(CASE WHEN vitalperiodic.observationlabel = 'ALT (SGPT)' THEN 0 ELSE 1 END) > 0, 1, 0) THEN 'YES' ELSE 'NO' END FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-12056' AND patient.hospitaldischargeoffset = 0",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: vitalperiodic.observationlabel",
            "is_correct": false,
            "reasoning": "The predicted SQL references vitalperiodic.observationlabel, but the vitalperiodic table does not have an observationlabel column. This is a straightforward column reference error and does not require restructuring the entire query logic.",
            "error_type": "Local: table/column reference error"
        },
        "fd36b7748e8aadbcb2963358": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What's the respiratory rate change of patient 027-101654 second measured on the first icu visit compared to the first value measured on the first icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.respiration FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101654' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 OFFSET 1 ) - ( SELECT vitalperiodic.respiration FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101654' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 )",
            "pred_sql": "SELECT vitalperiodic.respiration - ( SELECT vitalperiodic.respiration FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-101654' ORDER BY vitalperiodic.observationtime ASC LIMIT 1 ) AS resp_change FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid ORDER BY vitalperiodic.observationtime ASC LIMIT 1",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict to the first ICU visit and does not correctly select the second respiration measurement. Instead, it joins all vitalperiodic records for the patient, uses ORDER BY and LIMIT 1 in the outer query (which yields the first measurement, not the second), and lacks the subquery logic to identify the first ICU stay. These mistakes alter the overall query structure and logic rather than a single clause, so this is a global error.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "cd490e6dc2219e3ae3f771d1": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Could you tell me the name of the drug that was prescribed two times to patient 006-101311?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, COUNT( medication.drugstarttime ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-101311' ) ) GROUP BY medication.drugname ) AS T1 WHERE T1.C1 = 2",
            "pred_sql": "SELECT medication.drugname FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.uniquepid = '006-101311' GROUP BY medication.drugname ORDER BY count(patient.patientunitstayid) = 2 LIMIT 1",
            "gold_answer": "[['magnesium sulfate 2 gm/50 ml ivpb']]",
            "pred_answer": "[['aspirin 325mg tab']]",
            "is_correct": false,
            "reasoning": "The predicted query correctly joins patient to medication and groups by drugname but mistakenly uses ORDER BY count(...) = 2 and LIMIT 1 instead of filtering with a WHERE or HAVING count = 2. This misuse of ORDER BY is confined to a specific clause and does not require restructuring the joins or overall query logic. It can be fixed locally by replacing the ORDER BY/ LIMIT logic with a HAVING count = 2 filter.",
            "error_type": "Local: incorrect filtering in ORDER BY clause"
        },
        "09866a4f032da7b5f0cf5fef": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What's the cost of a drug known as buffered lidocaine 1%?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'medication' AND cost.eventid IN ( SELECT medication.medicationid FROM medication WHERE medication.drugname = 'buffered lidocaine 1%' )",
            "pred_sql": "SELECT DISTINCT cost.cost FROM medication INNER JOIN cost ON medication.patientunitstayid = cost.patientunitstayid WHERE medication.drugname = 'buffered lidocaine 1%'",
            "gold_answer": "[['14.04']]",
            "pred_answer": "[['10.03'], ['10.04'], ['10.06'], ['10.19'], ['10.42'], ['10.5'], ['10.57'], ['10.61'], ['10.62'], ['10.79'], ['10.82'], ['10.98'], ['11.14'], ['11.5'], ['11.62'], ['11.66'], ['12.14'], ['12.33'], ['12.35'], ['12.68'], ['12.75'], ['12.76'], ['12.78'], ['12.9'], ['12.99'], ['13.17'], ['13.21'], ['13.31'], ['13.42'], ['13.46'], ['13.47'], ['13.5'], ['13.52'], ['13.6'], ['13.65'], ['13.68'], ['13.69'], ['13.79'], ['13.86'], ['13.88'], ['13.91'], ['13.94'], ['13.95'], ['13.97'], ['13.99'], ['14.04'], ['14.05'], ['14.13'], ['14.2'], ['14.27'], ['14.33'], ['14.35'], ['14.39'], ['14.41'], ['14.44'], ['14.62'], ['14.67'], ['14.74'], ['14.83'], ['14.94'], ['14.96'], ['15.0'], ['15.18'], ['15.26'], ['15.3'], ['15.4'], ['15.53'], ['15.74'], ['15.77'], ['15.79'], ['15.85'], ['16.66'], ['6.15'], ['6.23'], ['6.61'], ['6.81'], ['6.91'], ['7.07'], ['7.2'], ['7.51'], ['7.7'], ['7.77'], ['7.82'], ['7.9'], ['7.98'], ['8.13'], ['8.25'], ['8.46'], ['8.52'], ['8.59'], ['8.61'], ['8.63'], ['8.65'], ['8.75'], ['8.78'], ['8.86'], ['8.97'], ['9.01'], ['9.11'], ['9.22']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins medication to cost on patientunitstayid rather than linking cost.eventid to medication.medicationid and filtering cost.eventtype = 'medication'. This incorrect join key pulls in all cost records for patients who received the drug, rather than the cost of that specific drug event. Fixing it requires restructuring the JOIN and WHERE clauses (using cost.eventid and eventtype), which is a change to the overall query logic rather than a minor local fix.",
            "error_type": "Global: incorrect join key"
        },
        "0ebd60232cb32fabbf55b709": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many prescriptions for 10 ml vial : calcium chloride 10 % iv soln were made?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.drugname = '10 ml vial : calcium chloride 10 % iv soln'",
            "pred_sql": "SELECT sum(CASE WHEN medication.drugname = 'Calcium Chloride 10 % IV Soln' THEN 1 ELSE 0 END) FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname LIKE 'Calcium Chloride 10 % IV Soln'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query incorrectly filters on the drug name 'Calcium Chloride 10 % IV Soln' using LIKE, instead of the exact value '10 ml vial : calcium chloride 10 % iv soln'. This mismatch in the literal value causes no rows to match, yielding NULL. The error is confined to the WHERE clause\u2019s filter value and does not alter the overall query structure or table relationships.",
            "error_type": "Local: value parsing error"
        },
        "d339235d5a63ad8b045e5ffc": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Can you retrieve the time of patient 031-10198's hospital admission since 1 year ago?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '031-10198' AND datetime(patient.hospitaladmittime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT patient.hospitaladmittime FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '031-10198' AND datetime(vitalperiodic.observationtime) >= datetime('2100-12-31', '1 year')",
            "gold_answer": "[['2100-08-12 23:40:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an unnecessary INNER JOIN to vitalperiodic and filters on vitalperiodic.observationtime instead of patient.hospitaladmittime, and also misuses the datetime offset (uses '1 year' instead of '-1 year'). These mistakes alter the fundamental logic and structure of the query, joining an unrelated table and applying the wrong filter column, so the error cannot be fixed by a small tweak in a single clause.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "f85c9633e450cf4188a98ce3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Get me the top three most common diagnoses.",
            "gold_sql": "SELECT T1.diagnosisname FROM ( SELECT diagnosis.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM diagnosis GROUP BY diagnosis.diagnosisname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT diagnosis.diagnosisname FROM diagnosis INNER JOIN ( SELECT patientunitstayid, count(diagnosisname) AS num FROM diagnosis GROUP BY patientunitstayid ORDER BY num DESC LIMIT 3 ) AS t3 ON diagnosis.patientunitstayid = t3.patientunitstayid",
            "gold_answer": "[['acute renal failure'], ['acute respiratory failure'], ['pneumonia']]",
            "pred_answer": "[['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['abdominal pain / tenderness'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute pyelonephritis'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - acute tubular necrosis'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to hypovolemia/decreased circulating volume'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis'], ['acute renal failure - due to sepsis']]",
            "is_correct": false,
            "reasoning": "The predicted SQL finds the top three patients by number of diagnoses (GROUP BY patientunitstayid) and then joins back to list that patients\u2019 diagnoses, rather than finding the top three diagnoses by frequency (GROUP BY diagnosisname). This mistake spans the aggregation, join, and overall query logic, requiring restructuring the query to group by diagnosis and apply ranking. It is not a simple typo or localized clause fix.",
            "error_type": "Global: join logic error"
        },
        "920217f577771de7e12ed857": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the organism found in patient 031-10329's last urine, catheter specimen microbiology test?",
            "gold_sql": "SELECT microlab.organism FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10329' ) ) AND microlab.culturesite = 'urine, catheter specimen' ORDER BY microlab.culturetakentime DESC LIMIT 1",
            "pred_sql": "SELECT organism FROM microlab WHERE patientunitstayid = 3110329 AND culturesite = 'urine, catheter specimen' AND culturetakentime = ( SELECT culturetakentime FROM microlab WHERE patientunitstayid = 3110329 AND culturesite = 'urine, catheter specimen' ORDER BY culturetakentime DESC LIMIT 1 )",
            "gold_answer": "[['klebsiella pneumoniae']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL hardcodes patientunitstayid = 3110329 instead of looking up the correct patientunitstayid via the patient.uniquepid field. This is a column/reference mapping error in the WHERE clause and does not require reworking the overall query structure\u2014just correcting the patient identifier join. Therefore, it\u2019s a local error.",
            "error_type": "Local: column reference error"
        },
        "3369b594f521d600670ecb74": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Compute the number of times patient 018-101040 was prescribed naloxone hcl since 1 year ago.",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '018-101040' ) ) AND medication.drugname = 'naloxone hcl' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT count(DISTINCT medication.patientunitstayid) FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'naloxone hcl' AND strftime('%Y', medication.drugstarttime) < strftime('%Y', 'now', '-1 year')",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL not only fails to filter on the specific patient (missing any condition on patient.uniquepid), it also uses COUNT(DISTINCT patientunitstayid) instead of counting events, applies the wrong date comparison with strftime('%Y') against 'now' (instead of datetime('2100-12-31 23:59:00','-1 year')), and even inverts the date logic (< instead of \u2265). These mistakes span multiple clauses (JOIN, WHERE, aggregation) and fundamentally alter the query\u2019s intent, so it\u2019s a global error.",
            "error_type": "Global: incorrect filter and aggregation logic"
        },
        "1538db043c5c441dc0f2d160": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was patient 031-10302's first tested specimen in 04/this year?",
            "gold_sql": "SELECT microlab.culturesite FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10302' ) ) AND datetime(microlab.culturetakentime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',microlab.culturetakentime) = '04' ORDER BY microlab.culturetakentime ASC LIMIT 1",
            "pred_sql": "SELECT lab.labname FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE strftime('%Y %m', lab.labresulttime) = '2100 04' AND patient.uniquepid = '031-10302' LIMIT 1",
            "gold_answer": "[['blood, venipuncture']]",
            "pred_answer": "[['anion gap']]",
            "is_correct": false,
            "reasoning": "The predicted SQL pulls from the lab table and selects lab.labname, whereas the question asks for the first tested specimen (microlab.culturesite). This is not a minor column or alias fix but a fundamental choice of the wrong table and field, altering the entire query logic. Therefore it is a Global error.",
            "error_type": "Global: wrong table used"
        },
        "f96e1a80f60671c7b7c3d8a3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many prescriptions were prescribed in 2100 for dextrose 50% vial?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.drugname = 'dextrose 50% vial' AND strftime('%Y',medication.drugstarttime) = '2100'",
            "pred_sql": "SELECT count(DISTINCT medication.medicationid) FROM medication INNER JOIN allergy ON medication.patientunitstayid = allergy.patientunitstayid INNER JOIN vitalperiodic ON medication.patientunitstayid = vitalperiodic.patientunitstayid WHERE allergy.drugname = 'dextrose 50% vial' AND medication.drugname = 'dextrose 50% vial'",
            "gold_answer": "[['9.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces INNER JOINs to the allergy and vitalperiodic tables, filtering by allergy.drugname, which is unrelated to the question about counting prescriptions. This fundamentally alters query logic and table relationships, requiring restructuring the entire query rather than fixing a small clause. Therefore, this is a global error in the join strategy.",
            "error_type": "Global: join error"
        },
        "3a4a57393220eaed3080ce41": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What did patient 030-10040 receive on the last icu visit as their last input?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-10040' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.cellpath FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.patientunitstayid = 3010040 ORDER BY intakeoutput.intakeoutputoffset DESC LIMIT 1",
            "gold_answer": "[['ns']]",
            "pred_answer": "no such column: intakeoutput.intakeoutputoffset",
            "is_correct": false,
            "reasoning": "The predicted query fails to execute because it orders by intakeoutput.intakeoutputoffset, a column that doesn\u2019t exist in the intakeoutput table. That is a simple table/column reference error localized to the ORDER BY clause and can be fixed by using the correct column (e.g., intakeoutputtime). This does not require restructuring the overall logic into subqueries or JOIN conditions, so it is a Local error.",
            "error_type": "Local: table/column reference error"
        },
        "01adde799ca93fbb843aea48": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Is the fio2 value second measured on the last hospital visit in patient 031-10622 greater than the value from the first measurement on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10622' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'fio2' ORDER BY lab.labresulttime ASC LIMIT 1 OFFSET 1 ) > ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10622' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'fio2' ORDER BY lab.labresulttime ASC LIMIT 1 )",
            "pred_sql": "SELECT CASE WHEN max(CASE WHEN patient.patientunitstayid = 369273 THEN vitalperiodic.fio2 ELSE NULL END) > max(CASE WHEN patient.patientunitstayid = 1224149 THEN vitalperiodic.fio2 ELSE NULL END) THEN 'YES' ELSE 'NO' END FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.patientunitstayid IN (369273, 1224149)",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: vitalperiodic.fio2",
            "is_correct": false,
            "reasoning": "The predicted SQL references a column vitalperiodic.fio2 that does not exist in the vitalperiodic table. This is a simple column reference error, and correcting or changing that reference would not require restructuring the overall query logic (though the logic is also incorrect). This falls under the category of a localized table/column reference error.",
            "error_type": "Local: table/column reference error"
        },
        "a0cf8ef52f1f759a0bad1de7": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Since 1 year ago, what are the top three most frequent drugs prescribed to patients within 2 months after the prescription of ondansetron 4mg/2ml inj?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ondansetron 4mg/2ml inj' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.drugstarttime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.drugstarttime) AND datetime(T1.drugstarttime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugstarttime >= ( SELECT medication.drugstarttime FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ondansetron 4mg/2ml inj' ) AND medication.drugstarttime < ( SELECT medication.drugstarttime FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ondansetron 4mg/2ml inj' ) + 2 * 30 * 24 * 60 * 60 GROUP BY medication.drugname ORDER BY count(medication.drugname) DESC LIMIT 3",
            "gold_answer": "[['dextrose 50% vial'], ['ondansetron 4mg/2ml inj'], ['sodium chloride 0.9% 1000 ml']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to implement the core logic of the question: it does not restrict to the past year, it does not correlate each patient\u2019s ondansetron prescription to their subsequent prescriptions, and it uses uncorrelated subqueries for the ondansetron drugstarttime rather than a per-patient join/window. These issues span multiple clauses (WHERE, JOIN, subqueries) and require a complete restructure of the query logic, not just a minor fix in a single clause.",
            "error_type": "Global: incorrect join logic"
        },
        "cd9635be7ce342f3e0c3219b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the cost of sodium phosphate 30 mmol/250ml ns?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'medication' AND cost.eventid IN ( SELECT medication.medicationid FROM medication WHERE medication.drugname = 'sodium phosphate 30 mmol/250ml ns' )",
            "pred_sql": "SELECT cost.cost FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid WHERE cost.eventtype = 'medication' AND cost.costid = 13",
            "gold_answer": "[['12.63']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL does not filter costs by the medication event ID nor reference the medication table to identify the correct event. Instead, it hardcodes cost.costid = 13 and introduces an unnecessary join to patient, altering the core logic of linking cost entries to the specified drug. This misjoins tables and changes the intended filtering, requiring restructuring of the query beyond a simple clause fix.",
            "error_type": "Global: join error"
        },
        "4808850ccfbd9313e08bc1e3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "On the first hospital visit, what is the age of patient 006-100663?",
            "gold_sql": "SELECT patient.age FROM patient WHERE patient.uniquepid = '006-100663' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT patient.age FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.patientunitstayid = 143870",
            "gold_answer": "[['74.0']]",
            "pred_answer": "[['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0'], ['76.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic by joining the vitalperiodic table and filtering on a specific patientunitstayid rather than selecting the first hospital visit for uniquepid '006-100663' with hospitaldischargetime IS NOT NULL. It ignores the required ORDER BY and LIMIT, uses the wrong table and key, and returns repeated values. This is not a localized syntax or column mistake but a structural error that alters the intended meaning of the query.",
            "error_type": "Global: incorrect join"
        },
        "2d95eaed3db09e820ba3514d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the yearly average respiratory rate for patient 031-10598 since 164 days ago?",
            "gold_sql": "SELECT AVG(vitalperiodic.respiration) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10598' ) ) AND vitalperiodic.respiration IS NOT NULL AND datetime(vitalperiodic.observationtime) >= datetime('2100-12-31 23:59:00','-164 day') GROUP BY strftime('%Y',vitalperiodic.observationtime)",
            "pred_sql": "SELECT avg(vitalperiodic.respiration) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '031-10598' AND vitalperiodic.observationtime > (CURRENT_TIMESTAMP - INTERVAL '164' DAY)",
            "gold_answer": "[['17.138']]",
            "pred_answer": "near \"'164'\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to a syntax error in the WHERE clause when using \u201cCURRENT_TIMESTAMP - INTERVAL \u2018164\u2019 DAY\u201d, which is invalid in SQLite. This misuse of a temporal expression is localized to the date calculation and does not require restructuring the overall query logic. The rest of the query (JOIN, filters) remains intact, so it\u2019s a specific temporal syntax/local error.",
            "error_type": "Local: other-temporal error"
        },
        "f26a89e87c532d575cf44788": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much is a ethanol lab test?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'lab' AND cost.eventid IN ( SELECT lab.labid FROM lab WHERE lab.labname = 'ethanol' )",
            "pred_sql": "SELECT labresult FROM lab WHERE labname = 'ethanol'",
            "gold_answer": "[['8.3']]",
            "pred_answer": "[['0.0'], ['0.027'], ['1.0'], ['108.0'], ['114.0'], ['126.0'], ['138.0'], ['141.0'], ['145.0'], ['148.0'], ['15.0'], ['155.0'], ['168.0'], ['183.0'], ['184.0'], ['188.0'], ['193.0'], ['197.4'], ['198.0'], ['209.0'], ['22.0'], ['222.5'], ['223.0'], ['228.0'], ['231.0'], ['234.0'], ['244.0'], ['246.0'], ['247.0'], ['248.0'], ['250.0'], ['264.0'], ['266.0'], ['271.0'], ['284.0'], ['30.0'], ['309.0'], ['313.0'], ['316.3'], ['324.0'], ['338.0'], ['349.0'], ['35.0'], ['353.0'], ['355.0'], ['372.0'], ['383.0'], ['39.0'], ['41.0'], ['422.0'], ['447.0'], ['55.0'], ['60.0'], ['67.0'], ['68.0'], ['72.0'], ['75.0'], ['86.0'], ['89.0'], ['97.0'], ['98.0'], ['99.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries lab.labresult instead of retrieving the cost from the cost table. It ignores the cost.eventtype = 'lab' filter and the cost.eventid join, selecting the wrong column and table. Fixing this requires changing the SELECT source to cost.cost and adding the appropriate WHERE conditions, without altering the overall query structure.",
            "error_type": "Local: column reference error"
        },
        "926163a5316b8d10e3e66e0d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the total stool output in patient 006-106828 yesterday?",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106828' ) ) AND intakeoutput.celllabel = 'stool' AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day')",
            "pred_sql": "SELECT sum(CASE WHEN intakeoutput.intakeoutputtime = ( SELECT max(intakeoutput.intakeoutputtime) FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '006-106828' ) THEN intakeoutput.cellvaluenumeric ELSE 0 END) FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '006-106828' AND intakeoutput.cellpath = 'Cumulative output (ml)'",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the intended logic: instead of summing stool outputs from yesterday, it sums only the latest cumulative output value regardless of date and uses the wrong cellpath. It omits the date filter and the stool label filter, and restructures the query to use a max timestamp subquery. These are not isolated syntax or reference mistakes but a fundamental misinterpretation of the requirement, requiring a major rewrite of the query logic.",
            "error_type": "Global: incorrect overall logic"
        },
        "8b553152e14bffb35726fff3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 022-100769 have their first urine catheter output on 10/21/this year?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-100769' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine catheter' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '10-21' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '022-100769' AND strftime('%Y %m %d', intakeoutput.intakeoutputtime) = '2100 10 21'",
            "gold_answer": "[['2100-10-21 00:00:00']]",
            "pred_answer": "[['2100-10-21 00:00:00'], ['2100-10-21 01:08:00'], ['2100-10-21 01:58:00'], ['2100-10-21 03:03:00'], ['2100-10-21 04:53:00'], ['2100-10-21 06:58:00'], ['2100-10-21 09:00:00'], ['2100-10-21 11:00:00'], ['2100-10-21 12:04:00'], ['2100-10-21 13:00:00'], ['2100-10-21 14:00:00'], ['2100-10-21 15:00:00'], ['2100-10-21 16:00:00'], ['2100-10-21 17:00:00'], ['2100-10-21 18:00:00'], ['2100-10-21 19:00:00'], ['2100-10-21 20:00:00'], ['2100-10-21 21:30:00'], ['2100-10-21 22:00:00'], ['2100-10-21 23:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the required filters for intakeoutput.cellpath LIKE '%output%' and intakeoutput.celllabel = 'urine catheter', and it omits the ORDER BY ... LIMIT 1 to return only the first event. Instead it returns all intakeoutput events for that patient on the given date. These are errors confined to the WHERE clause and result-ranking clause, and can be fixed by adding the missing filter conditions and ordering/limit without altering the overall query structure.",
            "error_type": "Local: missing filter and limit conditions"
        },
        "3371b2f9debfbbaecaf88aaa": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Show me the top five most common input events this year.",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT intakeoutput.cellpath FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE intakeoutput.cellpath LIKE '%input%' AND strftime('%Y', intakeoutput.intakeoutputtime) = '2100' GROUP BY intakeoutput.cellpath ORDER BY count(intakeoutput.cellpath) DESC LIMIT 5",
            "gold_answer": "[['continuous infusion meds'], ['ns'], ['ns ivf'], ['oral'], ['p.o.']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query selects and filters on the wrong column (cellpath instead of celllabel), uses LIKE '%input%' instead of LIKE '%intake%', and applies an incorrect year filter with strftime rather than the required datetime start-of-year condition. These mistakes are confined to the SELECT and WHERE clauses and do not alter the overall join structure or logical flow, so they are localized reference and filtering errors.",
            "error_type": "Local: column reference error"
        },
        "ecc45c5ab8349e2cebba606b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What are the top three most commonly prescribed medicines this year?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM medication WHERE datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY medication.drugname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN cost ON medication.patientunitstayid = cost.patientunitstayid WHERE cost.eventtype = 'medication' AND strftime('%Y', medication.drugstarttime) = strftime('%Y', 'now') GROUP BY medication.drugname ORDER BY count(medication.drugname) DESC LIMIT 3",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['potassium chloride'], ['tylenol']]",
            "pred_answer": "[['aspart insulin'], ['nacl 0.9% mbp'], ['potassium chloride']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the intended logic in several ways. It introduces an unnecessary INNER JOIN with the cost table (linking medications to cost records) which alters which medication counts are considered, rather than simply counting prescriptions. It also misuses strftime('now') instead of the fixed current date ('2100-12-31 23:59:00') as required by the assumptions. These changes affect the overall structure and meaning of the query rather than a local clause, so this is a global logic/join error.",
            "error_type": "Global: incorrect join/logic error"
        },
        "e196d71a57da821d3fea4ffc": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Is the respiratory rate level of patient 032-10123 second measured on the last icu visit less than the first measurement on the last icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.respiration FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '032-10123' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 OFFSET 1 ) < ( SELECT vitalperiodic.respiration FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '032-10123' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 )",
            "pred_sql": "SELECT vitalperiodic.respiration < ( SELECT min(respiration) FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient ORDER BY hospitaldischargetime DESC LIMIT 1 ) ) FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient ORDER BY hospitaldischargetime DESC LIMIT 1 )",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0'], ['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally alters the intended logic: it fails to filter by the specific patient '032-10123', uses hospitaldischargetime instead of unitdischargetime to identify the last ICU visit, and compares every respiration reading to the minimum respiration rather than comparing only the second measurement to the first. Fixing this would require restructuring the query\u2019s joins, filtering, and comparison logic\u2014not just a localized tweak.",
            "error_type": "Global: join error"
        },
        "a3569887096547747b83607e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many people were admitted to the hospital?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient",
            "gold_answer": "[['1384.0']]",
            "pred_answer": "[['1788.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts the number of patientunitstayid values (i.e., admissions) rather than the number of unique patients. This is a column reference mistake in the SELECT clause: using patientunitstayid instead of DISTINCT uniquepid. The overall query structure (a single-table aggregate) remains correct; only the chosen column is wrong.",
            "error_type": "Local: column reference error"
        },
        "0ba85fee6d6f0714d590db19": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How frequently were stress ulcer prophylaxis - lansoprazole procedures performed since 1 year ago?",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.treatmentname = 'stress ulcer prophylaxis - lansoprazole' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT count(DISTINCT patientunitstayid) FROM treatment WHERE treatmentstring LIKE '%lansoprazole%' AND strftime('%Y',treatmenttime) >= strftime('%Y', 'now', '-1 year')",
            "gold_answer": "[['15.0']]",
            "pred_answer": "no such column: treatmentstring",
            "is_correct": false,
            "reasoning": "The predicted SQL refers to a non-existent column treatmentstring instead of treatmentname, causing a column reference error. This is a localized mistake that does not require restructuring the query's overall logic or flows, only correcting the column name and possibly the date condition.",
            "error_type": "Local: table/column reference error"
        },
        "1bf033967053a3e88b60ffec": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many current patients are there?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient WHERE hospitaldischargeoffset IS NULL",
            "gold_answer": "[['23.0']]",
            "pred_answer": "no such column: hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column hospitaldischargeoffset instead of the correct hospitaldischargetime. This is a simple column reference error and does not affect the overall query structure or logic. It can be fixed by using the correct column name without altering the query\u2019s logical flow.",
            "error_type": "Local: column reference error"
        },
        "37bb636cce8f65f6ad5203a7": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the first lab test that patient 028-10451 received this month?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '028-10451' ) ) AND datetime(lab.labresulttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT patient.patientunitstayid FROM patient INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE patient.uniquepid = '028-10451' AND strftime('%m', lab.labresulttime) = '02' AND lab.labname = 'Urine 1000 100' ORDER BY lab.labresulttime LIMIT 1",
            "gold_answer": "[['2100-12-07 00:59:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL is structurally similar to the ground truth (it uses the same tables and JOIN), but it makes local mistakes in its WHERE and SELECT clauses: it filters on a specific lab name (\u2018Urine 1000 100\u2019) that wasn\u2019t asked, it uses strftime('%m','\u2026') = '02' (wrong month literal) instead of matching the current month via the prescribed datetime('start of month') logic, and it selects patientunitstayid instead of the lab result time. These are all confined to specific expressions and can be corrected without changing the overall query structure or join logic. Therefore this is a Local error, specifically a temporal filter mistake.",
            "error_type": "Local: other-temporal error"
        },
        "a39cccf33e871b8d3c0ee195": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the output of patient 010-10081 for the first time on last month/13?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10081' ) ) AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '13' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.cellpath FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '010-10081' AND strftime('%m', intakeoutput.intakeoutputtime) = '13' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "gold_answer": "[['urine']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query not only selects the wrong column (cellpath instead of celllabel) but also omits the critical output-only filter, misuses the date filtering (month \u201813\u2019, missing last\u2010month/day logic), and even reverses the sort order. Fixing it would require rewriting multiple WHERE clauses, adding path conditions, correcting the date logic, and changing the ORDER direction. This error spans the overall structure and logic, so it\u2019s a global error.",
            "error_type": "Global: incorrect filter and column selection"
        },
        "7cdb91fabb7e08749637f74e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many individuals are there who are current patients?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient WHERE hospitaldischargetime IS NULL",
            "gold_answer": "[['23.0']]",
            "pred_answer": "[['30.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts patientunitstayid for rows where hospitaldischargetime IS NULL, which yields the number of current stays, not distinct individuals. The correct intent is to count unique patients (using DISTINCT patient.uniquepid). This is a localized error in the SELECT clause\u2014specifically the aggregation and missing DISTINCT\u2014without affecting the overall query structure or relationships.",
            "error_type": "Local: missing DISTINCT"
        },
        "d37c1e31e9b13a891e553339": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When this year did patient 010-11267 receive their first bronchoscopy procedure?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-11267' ) ) AND treatment.treatmentname = 'bronchoscopy' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT datetime(vitalperiodic.observationtime) FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '010-11267' ORDER BY vitalperiodic.observationtime DESC LIMIT 1",
            "gold_answer": "[['2100-10-04 21:31:00']]",
            "pred_answer": "[['2100-10-10 14:41:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the vitalperiodic table and retrieves the latest observation time for the patient, instead of querying the treatment table for the first 'bronchoscopy' procedure this year. This is not a minor typo or missing column; it fundamentally changes the logic and tables involved, requiring a complete restructuring of the query.",
            "error_type": "Global: incorrect table and logic"
        },
        "62fe58e17f1786b0bd23e365": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the minimum daily number of patients who had urinary tract infection since 1 year ago?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT COUNT( DISTINCT diagnosis.patientunitstayid ) AS C1 FROM diagnosis WHERE diagnosis.diagnosisname = 'urinary tract infection' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY strftime('%Y-%m-%d',diagnosis.diagnosistime) ) AS T1",
            "pred_sql": "SELECT count(DISTINCT patient.patientunitstayid) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE vitalperiodic.observationoffset BETWEEN '-365' AND '-1' AND vitalperiodic.sao2 < 95",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: vitalperiodic.observationoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column vitalperiodic.observationoffset, which is a schema mismatch. This is a localized issue with the column reference and does not require restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "35562087619eaf9ec7769a8d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Count the number of times that patient 031-14167 received a laboratory test for tibc on the first hospital visit.",
            "gold_sql": "SELECT COUNT(*) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-14167' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'tibc'",
            "pred_sql": "SELECT count(lab.labname) FROM patient INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE patient.uniquepid = '031-14167' AND patient.hospitaladmittime = ( SELECT hospitaladmittime FROM patient WHERE uniquepid = '031-14167' ORDER BY hospitaladmittime ASC LIMIT 1 )",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['330.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to apply the filter lab.labname = 'tibc' and omits the requirement that the first hospital visit must have a non\u2010null discharge time. Instead, it simply matches hospitaladmittime to the first admission date, counting all lab tests rather than only TIBC tests. This error spans multiple clauses (missing WHERE condition on labname and incorrect visit logic) and fundamentally alters the intended query meaning, so it is a global logic error.",
            "error_type": "Global: incorrect logic across JOIN and WHERE clauses"
        },
        "0f1282d072f4287535f50953": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How is cefazolin (ancef) in dextrose ivpb 2 g typically consumed?",
            "gold_sql": "SELECT DISTINCT medication.routeadmin FROM medication WHERE medication.drugname = 'cefazolin (ancef) in dextrose ivpb 2 g'",
            "pred_sql": "SELECT CASE WHEN medication.drugname = 'cefacolin (ancef)' THEN '800-30 g/1 ml by mouth' ELSE NULL END FROM medication INNER JOIN cost ON medication.medicationid = cost.eventid WHERE medication.drugname = 'dextrose ivpb 2 g'",
            "gold_answer": "[['ivpb']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL is fundamentally incorrect in its overall structure and logic. Instead of directly selecting the administration route from the medication table for the specific drug, it joins the cost table without any relevant cost filtering, uses an incorrect join key (medication.medicationid = cost.eventid) and wrong drug name filters. It even wraps results in a CASE expression that doesn\u2019t correspond to the question. These issues span multiple clauses (SELECT, JOIN, WHERE) and change the intended query meaning, indicating a global structural/logical error.",
            "error_type": "Global: join error"
        },
        "21a8c17ed1bc28ec4d74aa51": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time that patient 003-10024 was diagnosed with acute coronary syndrome - acute myocardial infarction (with st elevation) on the last hospital visit?",
            "gold_sql": "SELECT diagnosis.diagnosistime FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-10024' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND diagnosis.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (with st elevation)' ORDER BY diagnosis.diagnosistime DESC LIMIT 1",
            "pred_sql": "SELECT diagnosis.diagnosistime FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.uniquepid = '003-10024' AND diagnosis.diagnosistime = ( SELECT max(diagnosis.diagnosistime) FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.uniquepid = '003-10024' AND diagnosis.description = 'Acute coronary syndrome - acute myocardial infarction (with st elevation)' )",
            "gold_answer": "[['2100-10-27 17:58:00']]",
            "pred_answer": "no such column: diagnosis.description",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column diagnosis.description instead of diagnosis.diagnosisname, causing a column reference error. This is a localized mistake that can be fixed by correcting the column name without restructuring the overall query.",
            "error_type": "Local: column reference error"
        },
        "a3c5957d0565aeac6aacd10d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time the heart rate of patient 027-104059 registered less than 65.0 on 06/04/this year?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-104059' ) ) AND vitalperiodic.heartrate < 65.0 AND vitalperiodic.heartrate IS NOT NULL AND datetime(vitalperiodic.observationtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',vitalperiodic.observationtime) = '06-04' ORDER BY vitalperiodic.observationtime DESC LIMIT 1",
            "pred_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-104059' AND vitalperiodic.observationtime LIKE '2100-06-04%' AND vitalperiodic.heartrate < 65",
            "gold_answer": "[['2100-06-04 09:26:14']]",
            "pred_answer": "[['2100-06-04 06:51:14'], ['2100-06-04 06:56:14'], ['2100-06-04 07:01:14'], ['2100-06-04 07:21:14'], ['2100-06-04 07:26:14'], ['2100-06-04 07:31:14'], ['2100-06-04 07:36:14'], ['2100-06-04 07:41:14'], ['2100-06-04 07:46:14'], ['2100-06-04 07:51:14'], ['2100-06-04 07:56:14'], ['2100-06-04 08:01:14'], ['2100-06-04 08:06:14'], ['2100-06-04 08:11:14'], ['2100-06-04 08:16:14'], ['2100-06-04 08:21:14'], ['2100-06-04 08:26:14'], ['2100-06-04 08:31:14'], ['2100-06-04 08:51:14'], ['2100-06-04 08:56:14'], ['2100-06-04 09:01:14'], ['2100-06-04 09:06:14'], ['2100-06-04 09:11:14'], ['2100-06-04 09:16:14'], ['2100-06-04 09:21:14'], ['2100-06-04 09:26:14']]",
            "is_correct": false,
            "reasoning": "The predicted query still joins the correct tables and filters the heart rate < 65 on the specified date, but it fails to implement the \u2018last time\u2019 logic. It omits the ORDER BY observationtime DESC and LIMIT 1, and uses a simple LIKE filter instead of the prescribed datetime/strftime approach. These are errors confined to the WHERE and result\u2010ordering clauses without altering the overall table relationships or structure.",
            "error_type": "Local: missing ORDER BY and LIMIT"
        },
        "9ebae192531eacc7f1be3ed9": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Find out the number of drugs given to patient 006-112408 last month.",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-112408' ) ) AND datetime(medication.drugstarttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month')",
            "pred_sql": "SELECT count(DISTINCT medication.drugname) FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.uniquepid = '006-112408' AND datetime(medication.drugstarttime) BETWEEN datetime('now','start of month', '-1 month') AND datetime('now','start of month', 'start of day', '-1 month')",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query only mis\u2010implements the counting and date condition but does not alter the overall query structure or table relationships. Specifically, it uses count(DISTINCT drugname) instead of COUNT(*) and uses datetime('now',\u2026) instead of the required fixed datetime('2100-12-31 23:59:00', \u2026) logic for last month. These are mistakes localized to the SELECT aggregation and the WHERE temporal filter, not structural join or multi\u2010clause logic errors.",
            "error_type": "Local: other-temporal error"
        },
        "562e56ddd403d8f9db6e6844": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Please list the four most common procedures carried out since 1 year ago.",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM treatment WHERE datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT treatment.treatmentname FROM patient INNER JOIN treatment ON patient.patientunitstayid = treatment.patientunitstayid WHERE treatment.treatmenttime >= datetime('now', '1 year') GROUP BY treatment.treatmentname ORDER BY count(treatment.treatmentname) DESC LIMIT 4",
            "gold_answer": "[['antiemetic - serotonin antagonist'], ['chest x-ray'], ['mechanical ventilation'], ['stress ulcer prophylaxis - pantoprazole']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s structure is mostly correct (it selects treatment names, groups, orders by count, and limits to 4), but its WHERE clause incorrectly uses datetime('now','1 year') instead of the required fixed current time '2100-12-31 23:59:00' with '-1 year'. This violates the temporal assumption and causes no rows to be returned. This is a localized error in the time filter and does not require restructuring the joins or overall logic of the query.",
            "error_type": "Local: temporal error"
        },
        "427cf46f018ef0bce1e0d80a": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What drug was prescribed to patient 012-1134 within the same day subsequent to their narcotic overdose diagnosis on the last hospital visit?",
            "gold_sql": "SELECT T2.drugname FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-1134' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) AND diagnosis.diagnosisname = 'narcotic overdose' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-1134' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T1.diagnosistime,'start of day') = datetime(T2.drugstarttime,'start of day')",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN cost ON medication.patientunitstayid = cost.patientunitstayid INNER JOIN patient ON patient.patientunitstayid = cost.patientunitstayid WHERE medication.patientunitstayid = '012-1134' AND cost.admittime = patient.dischargetime AND cost.diagnosis = 'Narcotic overdose'",
            "gold_answer": "[['0.4 ml syringe : enoxaparin sodium 40 mg/0.4ml sc soln'], ['10 ml vial : calcium gluconate 10 % iv soln'], ['50 ml syringe : dextrose 50 % iv soln'], ['aspirin 81 mg po chew']]",
            "pred_answer": "no such column: cost.admittime",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the cost table instead of the diagnosis and medication tables that contain the necessary diagnosis and prescription times. It references non\u2010existent columns (cost.admittime, cost.diagnosis) and completely misaligns with the intended logic of finding prescriptions after a specific diagnosis on the last hospital visit. Fixing this would require restructuring the query to use diagnosis and medication tables, correct joins, and time comparisons, not just a minor correction in a single clause.",
            "error_type": "Global: incorrect table/join logic"
        },
        "ad04b8b2e4d28dd51a23c781": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Can you tell me about patient 016-10131's age on the first hospital visit?",
            "gold_sql": "SELECT patient.age FROM patient WHERE patient.uniquepid = '016-10131' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT patient.age FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '016-10131' AND patient.hospitaldischargeoffset = 0",
            "gold_answer": "[['51.0']]",
            "pred_answer": "no such column: patient.hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an INNER JOIN on vitalperiodic which is unnecessary but not intrinsically breaking the query\u2019s logic, and more critically refers to a non-existent column hospitaldischargeoffset instead of hospitaldischargetime. This is a localized column reference error that can be fixed by correcting the column name without restructuring the query.",
            "error_type": "Local: column reference error"
        },
        "2ce97a7fc52bca5094ea71b8": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Gather the total output on last month/05 for patient 016-10197.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10197' ) ) AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '05'",
            "pred_sql": "SELECT sum(intakeoutput.cellvaluenumeric) FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '016-10197' AND intakeoutput.cellpath = 'output/urine/output.total' AND intakeoutput.cellvaluedatetime BETWEEN '2100-04-01 00:00:00' AND '2100-04-30 23:59:59'",
            "gold_answer": "[['30.0']]",
            "pred_answer": "no such column: intakeoutput.cellvaluedatetime",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non\u2010existent column intakeoutput.cellvaluedatetime instead of the correct intakeoutput.intakeoutputtime. This is a simple column reference mistake localized in the WHERE clause and does not require restructuring the query\u2019s joins or logic.",
            "error_type": "Local: column reference error"
        },
        "f325dc3d2c7b44a43dc1532c": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the average yearly number of patient records marked with valvular stenosis - mitral since 1 year ago?",
            "gold_sql": "SELECT AVG(T1.C1) FROM ( SELECT COUNT( DISTINCT diagnosis.patientunitstayid ) AS C1 FROM diagnosis WHERE diagnosis.diagnosisname = 'valvular stenosis - mitral' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY strftime('%Y',diagnosis.diagnosistime) ) AS T1",
            "pred_sql": "SELECT avg(patient.patienthealthsystemstayid) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE vitalperiodic.observationtime >= datetime('now','start of year', '-1 year') AND vitalperiodic.diastolicbp >= 60 AND vitalperiodic.systolicbp > 120",
            "gold_answer": "[['2.0']]",
            "pred_answer": "no such column: vitalperiodic.diastolicbp",
            "is_correct": false,
            "reasoning": "The predicted SQL uses non-existent columns vitalperiodic.diastolicbp and vitalperiodic.systolicbp, resulting in a column reference error. This mistake is confined to incorrect column names in the WHERE clause and does not alter the overall query structure or logic flow.",
            "error_type": "Local: column reference error"
        },
        "07dbbde6bb9c8b1e8da9444b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much does the bicarbonate lab test typically cost?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'lab' AND cost.eventid IN ( SELECT lab.labid FROM lab WHERE lab.labname = 'bicarbonate' )",
            "pred_sql": "SELECT cost.cost FROM lab INNER JOIN cost ON lab.patientunitstayid = cost.patientunitstayid WHERE lab.labname = 'Bicarbonate'",
            "gold_answer": "[['8.13']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins lab and cost on patientunitstayid rather than linking cost.eventid to lab.labid and filtering for eventtype = 'lab'. This incorrect join changes the overall logic of the query and fails to restrict to the bicarbonate lab test cost. Fixing this requires altering the join keys and adding filters, which is a structural change, not just a simple typo or localized fix.",
            "error_type": "Global: join error"
        },
        "6f28bb73040fa4b58ef368b2": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Since 11 months ago, when was the last microbiology test conducted for patient 031-10778?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10778' ) ) AND datetime(microlab.culturetakentime) >= datetime('2100-12-31 23:59:00','-11 month') ORDER BY microlab.culturetakentime DESC LIMIT 1",
            "pred_sql": "SELECT strftime('%Y-%m', microlab.culturetakentime) FROM patient INNER JOIN microlab ON patient.patientunitstayid = microlab.patientunitstayid WHERE patient.uniquepid = '031-10778' ORDER BY microlab.culturetakentime DESC LIMIT 1",
            "gold_answer": "[['2100-09-15 16:29:00']]",
            "pred_answer": "[['2100-09']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only joins patient\u2192microlab and orders by culturetakentime, but it never applies the \u201csince 11 months ago\u201d filter in the WHERE clause and even formats the date incorrectly (using strftime('%Y-%m') instead of returning the full timestamp). Both issues are confined to the SELECT and WHERE clauses (i.e., they don\u2019t require rethinking the JOINs or overall structure), so they are localized mistakes that can be fixed by adding the datetime filter and correcting the projection.",
            "error_type": "Local: missing time filter and incorrect date formatting"
        },
        "471462b1ab28191d8570e787": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Give me the five most common output events since 2100.",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%output%' AND strftime('%Y',intakeoutput.intakeoutputtime) >= '2100' GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT intakeoutput.cellpath FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.unitadmittime < '2100' AND patient.unitadmittime > '1900' AND intakeoutput.cellpath LIKE '%output%' GROUP BY intakeoutput.cellpath ORDER BY count(intakeoutput.cellpath) DESC LIMIT 5",
            "gold_answer": "[['indwelling catheter'], ['stool'], ['urinary catheter output: indwelling/continuous ure'], ['urine'], ['urine catheter']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic and structure: it joins the intakeoutput table to patient on unitadmittime, applies incorrect time filters on patient.unitadmittime instead of filtering intakeoutput.intakeoutputtime by year \u2265 '2100', and selects cellpath rather than celllabel. These errors span multiple clauses (JOIN, WHERE, SELECT) and change the intended meaning of the query, requiring a significant rewrite rather than a local fix.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "842cbb900711080a31ff45c7": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Find out the monthly minimum urine output volume of patient 012-1111 since 05/2100.",
            "gold_sql": "SELECT MIN(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-1111' ) ) AND intakeoutput.celllabel = 'urine' AND intakeoutput.cellpath LIKE '%output%' AND strftime('%Y-%m',intakeoutput.intakeoutputtime) >= '2100-05' GROUP BY strftime('%Y-%m',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT intakeoutput.cellvaluenumeric FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '012-1111' AND intakeoutput.cellpath = 'PregnancyUrineOutput' AND intakeoutput.intakeoutputtime >= '2005-01-01' AND intakeoutput.cellvaluenumeric > 0",
            "gold_answer": "[['100.0'], ['150.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely misses the core logic of the task. Instead of computing the monthly minimum urine output since May 2100 and grouping by month, it selects raw intakeoutput.cellvaluenumeric values without aggregation or grouping. It uses the wrong date filter (\u20182005-01-01\u2019 instead of '2100-05'), the wrong cellpath filter (equality to 'PregnancyUrineOutput' rather than celllabel = 'urine' and cellpath LIKE '%output%'), and omits the MIN() and GROUP BY strftime('%Y-%m', ...) entirely. These mistakes span multiple clauses and fundamentally alter the query\u2019s intended meaning, requiring a full restructuring of the query logic.",
            "error_type": "Global: incorrect aggregation and filtering"
        },
        "bdaee084287bac68d7820aa5": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Count how many times in 2100 patient 004-12030 had tracheal suctioning.",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-12030' ) ) AND treatment.treatmentname = 'tracheal suctioning' AND strftime('%Y',treatment.treatmenttime) = '2100'",
            "pred_sql": "SELECT count(treatment.treatmentid) FROM patient INNER JOIN treatment ON patient.patientunitstayid = treatment.patientunitstayid WHERE patient.uniquepid = '004-12030' AND treatment.treatmentname = 'tracheostomy tube, suctioning'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the year filter (strftime('%Y', treatment.treatmenttime) = '2100') and uses the wrong treatment name literal ('tracheostomy tube, suctioning' instead of 'tracheal suctioning'). Both issues are isolated to the WHERE clause and can be corrected by adjusting these conditions without changing the overall query structure or joins.",
            "error_type": "Local: value/condition error"
        },
        "21c120826fba86457b825834": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Can you tell me the name of the allergy patient 025-10477 had on the current hospital visit?",
            "gold_sql": "SELECT allergy.allergyname FROM allergy WHERE allergy.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-10477' AND patient.hospitaldischargetime IS NULL ) )",
            "pred_sql": "SELECT allergy.allergyname FROM allergy INNER JOIN patient ON allergy.patientunitstayid = patient.patientunitstayid WHERE allergy.patientunitstayid = 2510477",
            "gold_answer": "[['levaquin'], ['pcn']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters on allergy.patientunitstayid = 2510477, completely missing the JOIN condition on the patient\u2019s unique PID and the requirement that hospitaldischargetime IS NULL for the current visit. It uses the wrong predicate value instead of filtering by patient.uniquepid and current admission. This is a localized mistake in the WHERE clause and does not require restructuring the query\u2019s overall flow or JOIN logic. It\u2019s a simple incorrect filter condition (value parsing/reference error).",
            "error_type": "Local: incorrect filter condition"
        },
        "30bec392082c2be51f011477": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me patient 016-10268's minimum sao2 since 348 days ago.",
            "gold_sql": "SELECT MIN(vitalperiodic.sao2) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10268' ) ) AND vitalperiodic.sao2 IS NOT NULL AND datetime(vitalperiodic.observationtime) >= datetime('2100-12-31 23:59:00','-348 day')",
            "pred_sql": "SELECT min(vitalperiodic.sao2) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '016-10268' AND vitalperiodic.observationtime - patient.admissiontime > 348 * 24 * 60 * 60",
            "gold_answer": "[['88.0']]",
            "pred_answer": "no such column: patient.admissiontime",
            "is_correct": false,
            "reasoning": "The predicted SQL references patient.admissiontime, which does not exist in the schema (the patient table has hospitaladmittime and unitadmittime but no admissiontime). This is a localized column reference error and does not require restructuring the overall query logic.",
            "error_type": "Local: column reference error"
        },
        "3693b0ad14990ea6976343c2": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "among patients in their 60 or above , what are the top four prescribed drugs?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age >= 60 ) GROUP BY medication.drugname ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT medication.drugname FROM vitalperiodic INNER JOIN medication ON vitalperiodic.patientunitstayid = medication.patientunitstayid WHERE vitalperiodic.sao2 >= 60 ORDER BY medication.drugname ASC LIMIT 4",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['nacl 0.9% mbp'], ['potassium chloride'], ['tylenol']]",
            "pred_answer": "[['.5 ml vial : pneumococcal vac polyvalent 25 mcg/0.5ml ij inj'], ['.5 ml vial : pneumococcal vac polyvalent 25 mcg/0.5ml ij inj'], ['.5 ml vial : pneumococcal vac polyvalent 25 mcg/0.5ml ij inj'], ['.5 ml vial : pneumococcal vac polyvalent 25 mcg/0.5ml ij inj']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the intended logic: it joins medication to vitalperiodic and filters on sao2 rather than selecting patients aged 60 or above. It also orders alphabetically and limits without any aggregation or ranking by prescription frequency. This is not a localized syntax fix but a complete restructuring of the query\u2019s logic and relationships, thus a global error.",
            "error_type": "Global: incorrect join/logic"
        },
        "faed071c4640fac3eb46ce91": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the first procedure patient 017-100002 had on the first hospital visit?",
            "gold_sql": "SELECT treatment.treatmentname FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100002' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT treatment.treatmentname FROM patient INNER JOIN treatment ON patient.patientunitstayid = treatment.patientunitstayid WHERE patient.patientunitstayid = 111170",
            "gold_answer": "[['chest x-ray']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely replaces the multi-step logic needed to (1) identify the correct patient via uniquepid, (2) select their first completed hospital visit, and (3) then pick the earliest treatment on that visit. Instead, it hard-codes a single patientunitstayid (111170), omits any uniquepid filter, ignores hospitaldischargetime, and drops the ORDER BY\u2026LIMIT to get the first procedure. This is not a small typo or missing alias\u2014it fundamentally breaks the intended query flow and must be restructured to fix.",
            "error_type": "Global: join/logic error"
        },
        "3c0cb3bd0156ed794e5cd31e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Which was the first procedure that patient 017-101737 received since 2100?",
            "gold_sql": "SELECT treatment.treatmentname FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-101737' ) ) AND strftime('%Y',treatment.treatmenttime) >= '2100' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT procedureevents.itemid FROM patient INNER JOIN procedureevents ON patient.patientunitstayid = procedureevents.patientunitstayid WHERE patient.uniquepid = '017-101737' AND procedureevents.itemid IN (40314, 40313, 40315, 40312) AND procedureevents.procedureordercategoryname = 'Evaluation' ORDER BY procedureevents.procedureordercategorydescription DESC LIMIT 1",
            "gold_answer": "[['cabg']]",
            "pred_answer": "no such table: procedureevents",
            "is_correct": false,
            "reasoning": "The predicted SQL refers to a table named procedureevents, which does not exist in the provided schema. This is a localized error in the FROM/JOIN clause (a table reference error) and does not affect the overall intended logic of selecting the first treatment since 2100. It can be fixed by replacing the nonexistent table with the correct one (treatment) without restructuring the query.",
            "error_type": "Local: table reference error"
        },
        "755f81df3ee4fb5f9851f75c": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the first height reading for patient 002-10122 on the current hospital visit?",
            "gold_sql": "SELECT patient.admissionheight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10122' AND patient.hospitaldischargetime IS NULL ) AND patient.admissionheight IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT vitalperiodic.observationtime FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '002-10122' ORDER BY vitalperiodic.observationtime LIMIT 1",
            "gold_answer": "[['157.5']]",
            "pred_answer": "[['2100-12-29 17:50:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL selects vitalperiodic.observationtime instead of patient.admissionheight and does not restrict to the current hospital visit (no hospitaldischargetime IS NULL filter). The mistake is localized to using the wrong table/column and missing the simple WHERE clause for the current visit, rather than a fundamental restructuring of the query logic.",
            "error_type": "Local: column reference error"
        },
        "02cfc24a25bbc3f65344b938": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the top three most commonly prescribed drugs this year.",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM medication WHERE datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY medication.drugname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN cost ON medication.patientunitstayid = cost.patienthealthsystemstayid WHERE strftime('%Y', medication.drugstarttime) = '2100' GROUP BY medication.drugname ORDER BY count(medication.drugname) DESC LIMIT 3",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['potassium chloride'], ['tylenol']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an INNER JOIN to the cost table on medication.patientunitstayid = cost.patienthealthsystemstayid, which is the wrong relationship and isn\u2019t needed to answer the question. This join filters out all medication records and changes the overall logic of the query. Fixing it requires removing or restructuring the join, not just tweaking a column reference in a single clause.",
            "error_type": "Global: incorrect join"
        },
        "3a7f1b2a7cc6efd048eaa761": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the name of the output patient 004-13203 had last on the last icu visit?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-13203' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%output%' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT patient.patientunitstayid FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.patientunitstayid = '004-13203' ORDER BY patient.hospitaldischargeoffset DESC LIMIT 1",
            "gold_answer": "[['urine']]",
            "pred_answer": "no such column: patient.hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column `patient.hospitaldischargeoffset`, which is a column reference error. This mistake is confined to an incorrect column name in the SELECT and ORDER BY clauses and does not affect the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "b775d3303dae346b324ba667": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What are the top five most commonly tested specimens?",
            "gold_sql": "SELECT T1.culturesite FROM ( SELECT microlab.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM microlab GROUP BY microlab.culturesite ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT labname FROM lab GROUP BY labname ORDER BY count(labname) DESC LIMIT 5",
            "gold_answer": "[['blood, venipuncture'], ['nasopharynx'], ['sputum, tracheal specimen'], ['urine, catheter specimen'], ['urine, voided specimen']]",
            "pred_answer": "[['bedside glucose'], ['chloride'], ['glucose'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the lab table and labname column, returning lab test names (e.g., 'chloride', 'potassium') instead of specimen sites from the microlab.culturesite column. This is not a minor syntax or alias mistake but a fundamentally wrong choice of table and field, altering the overall query logic. Hence, this is a global error.",
            "error_type": "Global: incorrect table/column"
        },
        "81cd13f00eb5a013f9338eb9": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was patient 025-13916's last procedure conducted since 1 year ago?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-13916' ) ) AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ORDER BY treatment.treatmenttime DESC LIMIT 1",
            "pred_sql": "SELECT DISTINCT cost.chargetime FROM patient INNER JOIN cost ON patient.patienthealthsystemstayid = cost.patienthealthsystemstayid WHERE patient.uniquepid = '025-13916' AND strftime('%Y',cost.chargetime) >= strftime('%Y', 'now') - 1",
            "gold_answer": "[['2100-07-30 13:53:00']]",
            "pred_answer": "[['2100-07-22 08:00:00'], ['2100-07-22 08:00:00'], ['2100-07-22 08:00:00'], ['2100-07-22 08:00:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 08:20:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-22 14:45:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-23 10:33:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 09:55:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00'], ['2100-07-24 22:46:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the cost table and patient.patienthealthsystemstayid join instead of the treatment table, completely changing the target entity from procedures (treatments) to billing events. It also misapplies a year filter via strftime('%Y',\u2026) on 'now' rather than using the fixed timestamp and does not order or limit to the last event. These issues are not confined to a single clause but alter the overall logic and results, requiring a structural rewrite to use the correct table and date filtering.",
            "error_type": "Global: incorrect table/join logic"
        },
        "9e28a8849f1adf8f2f7622cd": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Do you know the minimum lipase value of patient 027-100559?",
            "gold_sql": "SELECT MIN(lab.labresult) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100559' ) ) AND lab.labname = 'lipase'",
            "pred_sql": "SELECT vitalperiodic.lipase FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-100559' ORDER BY vitalperiodic.observationtime DESC LIMIT 1",
            "gold_answer": "[['192.0']]",
            "pred_answer": "no such column: vitalperiodic.lipase",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column vitalperiodic.lipase and even joins the wrong table (vitalperiodic instead of lab). This is a simple column/table reference error that does not require restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "607553a977127c390af6f571": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me patient 002-1185's minimum lactate value this month?",
            "gold_sql": "SELECT MIN(lab.labresult) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' ) ) AND lab.labname = 'lactate' AND datetime(lab.labresulttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month')",
            "pred_sql": "SELECT vitalaperiodic.patientunitstayid, min(vitalaperiodic.lactate) FROM vitalaperiodic WHERE strftime('%Y-%m', vitalaperiodic.observationtime) = '2016-06' AND patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '002-1185' )",
            "gold_answer": "[['1.9']]",
            "pred_answer": "no such table: vitalaperiodic",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent table \"vitalaperiodic\" (it should be \"vitalperiodic\" or more appropriately the \"lab\" table for lactate values) and a non-existent column \"lactate\" in that table. This is a localized table/column reference error and does not involve the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "584bb8420b45d70a62b843c6": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "On the current icu visit, what was the average value of the mean blood pressure of patient 022-1011?",
            "gold_sql": "SELECT AVG(vitalperiodic.systemicmean) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-1011' ) AND patient.unitdischargetime IS NULL ) AND vitalperiodic.systemicmean IS NOT NULL",
            "pred_sql": "SELECT vitalperiodic.systemicmean FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '022-1011'",
            "gold_answer": "[['76.145']]",
            "pred_answer": "[['-2.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['103.0'], ['103.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only selects raw systemicmean values joined on patientuniquepid without computing an average or filtering to the current ICU visit (unitdischargetime IS NULL). These mistakes are confined to the SELECT and WHERE clauses (missing AVG and missing current\u2010visit filter) and do not alter the overall join structure or logic across multiple clauses. Therefore, this is a Local error.",
            "error_type": "Local: missing-aggregation-and-filter error"
        },
        "c14463e7894fdd618987127c": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Could you tell me the last procedure that patient 009-10008 had this year?",
            "gold_sql": "SELECT treatment.treatmentname FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '009-10008' ) ) AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ORDER BY treatment.treatmenttime DESC LIMIT 1",
            "pred_sql": "SELECT DISTINCT treatment.treatmentname FROM treatment INNER JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '009-10008' AND strftime('%Y',treatment.treatmenttime) = '2100'",
            "gold_answer": "[['antiarrhythmics']]",
            "pred_answer": "[['administration of electrolytes'], ['antiarrhythmics'], ['antibacterials'], ['bronchodilator'], ['chest x-ray'], ['cultures'], ['glucocorticoid administration'], ['insulin'], ['mechanical ventilation'], ['mechanical ventilation'], ['mechanical ventilation'], ['oxygen therapy (40% to 60%)'], ['vasopressors - norepinephrine <= 0.1 micrograms/kg/min'], ['vasopressors - norepinephrine <= 0.1 micrograms/kg/min']]",
            "is_correct": false,
            "reasoning": "The predicted query returns all distinct procedures performed this year for the patient, rather than the single \u2018last\u2019 procedure. It omits the ORDER BY treatment time in descending order and the LIMIT 1 clause that would select the most recent event. This is not a minor typo or column reference issue but a structural flaw that fails to enforce the intended \u2018last procedure\u2019 logic.",
            "error_type": "Global: missing ORDER BY/LIMIT"
        },
        "b33c72567d5a653d849243e5": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Today, when did patient 027-103257 the last time have a stool event?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-103257' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'stool' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-103257' AND intakeoutput.cellpath = 'Cath Lab Stool' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "gold_answer": "[['2100-12-31 07:52:05']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters on intakeoutput.cellpath = 'Cath Lab Stool' and omits the required filters: intakeoutput.cellpath LIKE '%output%', intakeoutput.celllabel = 'stool', and the restriction to today\u2019s events. These mistakes are confined to the WHERE clause\u2019s filtering conditions without changing the overall query structure or joins. Thus, it\u2019s a localized column/value reference error.",
            "error_type": "Local: table/column reference error"
        },
        "eba36664c2a331fc498ecae9": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 030-12393 have a lab test for the last time last month?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-12393' ) ) AND datetime(lab.labresulttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') ORDER BY lab.labresulttime DESC LIMIT 1",
            "pred_sql": "SELECT lab.labresulttime FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '030-12393' AND strftime('%Y %m',lab.labresulttime) = ( SELECT strftime('%Y %m', max(lab.labresulttime)) FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '030-12393' )",
            "gold_answer": "[['2100-11-25 04:15:00']]",
            "pred_answer": "[['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 17:15:00'], ['2100-11-24 21:40:00'], ['2100-11-25 02:00:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00'], ['2100-11-25 04:15:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the overall logic of the query rather than just fixing a small typo or syntax issue. Instead of explicitly filtering for last month relative to the fixed current date and then ordering and limiting to one result, it attempts to match the YEAR and MONTH of every labresulttime against the YEAR and MONTH of the single maximum labresulttime. This not only misidentifies the correct month period (it doesn\u2019t anchor to \u201clast month\u201d per the assumptions) but also fails to apply LIMIT 1, leading to a fundamentally different result set. Because these problems span the WHERE filtering logic and subquery structure\u2014and alter the intended meaning of the query\u2014this is a Global error.",
            "error_type": "Global: incorrect filtering logic"
        },
        "c185698e6119b9fb668ad531": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was patient 004-10948's last heart rate on 06/21/this year?",
            "gold_sql": "SELECT vitalperiodic.heartrate FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-10948' ) ) AND vitalperiodic.heartrate IS NOT NULL AND datetime(vitalperiodic.observationtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',vitalperiodic.observationtime) = '06-21' ORDER BY vitalperiodic.observationtime DESC LIMIT 1",
            "pred_sql": "SELECT vitalperiodic.heartrate FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE strftime('%m %d %Y', vitalperiodic.observationtime) = '06 21 2100' AND patient.uniquepid = '004-10948'",
            "gold_answer": "[['99.0']]",
            "pred_answer": "[['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['100.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['101.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['102.0'], ['103.0'], ['103.0'], ['103.0'], ['103.0'], ['103.0'], ['103.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['104.0'], ['105.0'], ['105.0'], ['105.0'], ['105.0'], ['105.0'], ['105.0'], ['105.0'], ['106.0'], ['107.0'], ['107.0'], ['108.0'], ['110.0'], ['111.0'], ['112.0'], ['113.0'], ['114.0'], ['114.0'], ['114.0'], ['115.0'], ['115.0'], ['116.0'], ['117.0'], ['117.0'], ['118.0'], ['118.0'], ['119.0'], ['120.0'], ['121.0'], ['121.0'], ['123.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL retrieves all heart rate measurements on 06/21/2100 for patient 004-10948 but never orders them by observation time nor limits the result to the last measurement. The ground truth uses ORDER BY observationtime DESC LIMIT 1 to get exactly the most recent reading. Fixing this requires altering the overall query structure (adding ORDER BY and LIMIT), not just correcting a column name or minor syntax. Therefore, this is a global error.",
            "error_type": "Global: missing ORDER BY and LIMIT"
        },
        "f1e2ffce2af23bd974a8761a": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many patients were given a prescription of amiodarone (cordarone) 150 mg in d5w 100ml bolus since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid = ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = 'amiodarone (cordarone) 150 mg in d5w 100ml bolus' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') )",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'amiodarone 150 mg prn 100 d5w' AND medication.drugstarttime > datetime(CURRENT_TIMESTAMP, '-1 year')",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query deviates from the ground truth only in localized parts: it uses the wrong drug name literal ('amiodarone 150 mg prn 100 d5w' vs. 'amiodarone (cordarone) 150 mg in d5w 100ml bolus'), employs CURRENT_TIMESTAMP instead of the fixed '2100-12-31 23:59:00' per assumptions, and counts patientunitstayid rather than DISTINCT uniquepid. None of these errors alter the overall logical structure or the table relationships; they are confined to value literals, datetime usage, and aggregation. Hence, this is a Local error.",
            "error_type": "Local: value parsing error"
        },
        "e90c9b066d2e1ffa492a8488": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the total number of patients who underwent nitroglycerin this year?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'nitroglycerin' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') )",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE medication.routeadmin = 'N/A' AND strftime('%Y', medication.drugstarttime) = '2100'",
            "gold_answer": "[['21.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query uses the medication table (with a filter on routeadmin) rather than the treatment table and the treatmentname 'nitroglycerin'. It joins the wrong table, applies the wrong filter, and even omits DISTINCT on unique patient IDs. These mistakes alter the entire logic and require rewriting multiple clauses, not just a localized fix.",
            "error_type": "Global: incorrect table/join selection"
        },
        "28eacb920c6c640e5f539aef": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the difference between the total input and output of patient 002-10122 today.",
            "gold_sql": "SELECT ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10122' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') ) - ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10122' ) ) AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') )",
            "pred_sql": "SELECT sum(CASE WHEN intakeoutput.cellpath LIKE '%input%' THEN intakeoutput.cellvaluenumeric ELSE 0 END) - sum(CASE WHEN intakeoutput.cellpath LIKE '%output%' THEN intakeoutput.cellvaluenumeric ELSE 0 END) AS difference FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-10122' AND intakeoutput.intakeoutputtime LIKE '2100-05-21%'",
            "gold_answer": "[['-725.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s logic (subtracting summed inputs minus outputs) matches the intent, but its WHERE clause is wrong. It uses intakeoutput.intakeoutputtime LIKE '2100-05-21%' instead of the prescribed datetime comparison for today ('2100-12-31'), and even uses '%input%' instead of '%intake%'. These mistakes are confined to specific filter conditions and do not require restructuring the overall query, so this is a localized temporal/filtering error.",
            "error_type": "Local: other-temporal error"
        },
        "0506de2f8e7cd7c9aa03f59d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was patient 004-10164's first minimum total bilirubin in 04/this year?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-10164' ) ) AND lab.labname = 'total bilirubin' AND datetime(lab.labresulttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',lab.labresulttime) = '04' ORDER BY lab.labresult ASC, lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT vitalaperiodic.observationtime FROM vitalaperiodic INNER JOIN patient ON vitalaperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '004-10164' AND strftime('%m', vitalaperiodic.observationtime) = '04' AND vitalaperiodic.vitalaperiodicid IN ( SELECT vitalaperiodic.vitalaperiodicid FROM vitalaperiodic INNER JOIN patient ON vitalaperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '004-10164' AND strftime('%m', vitalaperiodic.observationtime) = '04' GROUP BY vitalaperiodic.observationtime, vitalaperiodic.systemicmean ORDER BY sum(vitalaperiodic.systemicmean) ASC LIMIT 1 )",
            "gold_answer": "[['2100-04-15 22:50:00']]",
            "pred_answer": "no such table: vitalaperiodic",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent table \"vitalaperiodic\" instead of the correct \"vitalperiodic\". This is a simple table name typo/local reference mistake. It can be fixed by correcting the table name without altering the overall query structure or logic flow. Thus, this is a localized error.",
            "error_type": "Local: table reference error"
        },
        "25b215ec07b541e4460d1bd8": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Calculate the difference between the total input and output volume for patient 005-11459 on the last icu visit.",
            "gold_sql": "SELECT ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-11459' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%intake%' ) - ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-11459' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%output%' )",
            "pred_sql": "SELECT sum(intakeoutput.cellvaluenumeric) - sum(intakeoutput.cellvaluenumeric) FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '005-11459'",
            "gold_answer": "[['675.1']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely abandons the intended logic of the query by: 1) joining patient to intakeoutput without restricting to the last ICU stay (no filter on unitdischargetime IS NOT NULL or ORDER BY patient.unitadmittime DESC LIMIT 1), 2) failing to distinguish intake vs output via cellpath LIKE filters, and 3) subtracting the same SUM(intakeoutput.cellvaluenumeric) from itself. These omissions are not localized syntax mistakes but rather fundamental logical flaws in how the query is structured and how tables are combined to achieve the goal. Fixing this would require restructuring the query to retrieve the correct stay and apply correct filters, not just tweaking a clause.",
            "error_type": "Global: incorrect query logic"
        },
        "afe9c889301128590f41e44b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the first time that patient 007-10026 had his/her respiratory rate checked?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10026' ) ) AND vitalperiodic.respiration IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1",
            "pred_sql": "SELECT observationtime FROM vitalperiodic WHERE patientunitstayid = 11026 AND respiration IS NOT NULL ORDER BY observationtime ASC LIMIT 1",
            "gold_answer": "[['2100-04-20 03:04:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL makes an incorrect assumption about the patientunitstayid by hard-coding = 11026 instead of deriving it via the patient.uniquepid = '007-10026'. This is a localized error in the WHERE clause filter, not a fundamental join or structural issue. It can be fixed by replacing the literal with the correct subquery or lookup, without altering the overall query structure.",
            "error_type": "Local: value parsing error"
        },
        "7c89f2615c9df69c34bbec67": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 031-10578 receive a urine, voided specimen microbiology test for the last time since 10/2100?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10578' ) ) AND microlab.culturesite = 'urine, voided specimen' AND strftime('%Y-%m',microlab.culturetakentime) >= '2100-10' ORDER BY microlab.culturetakentime DESC LIMIT 1",
            "pred_sql": "SELECT lab.labresulttime FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '031-10578' AND lab.labname = 'Urine, void specimen' AND strftime('%Y',lab.labresulttime) = '2100' AND strftime('%m',lab.labresulttime) = '10' ORDER BY lab.labresulttime DESC LIMIT 1",
            "gold_answer": "[['2100-12-05 03:15:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the lab table and uses lab.labname instead of querying microlab.culturesite on the microlab table. The question explicitly asks for a microbiology test result (\u201curine, voided specimen microbiology test\u201d), which is stored in microlab, not lab. By using the wrong table and field, it completely changes the query\u2019s logic and returns no results. This is not a simple typo in a column name but a fundamental structural error requiring a different table and join, so it is a global error.",
            "error_type": "Global: wrong table usage"
        },
        "efb670084c99628cf9947e3b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Retrieve the top three most common input events since 2 year ago.",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime) >= datetime('2100-12-31 23:59:00','-2 year') GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT intakeoutput.cellpath FROM vitalperiodic INNER JOIN intakeoutput ON vitalperiodic.patientunitstayid = intakeoutput.patientunitstayid WHERE intakeoutput.cellpath LIKE '%input%' AND vitalperiodic.observationtime > datetime('now', '-2 years') GROUP BY intakeoutput.cellpath ORDER BY count(intakeoutput.cellpath) DESC LIMIT 3",
            "gold_answer": "[['continuous infusion meds'], ['ns ivf'], ['p.o.']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces a JOIN with the vitalperiodic table, which is not required by the question and fundamentally changes the scope of the query by restricting intake events to those with matching vital records. It also selects cellpath instead of celllabel and uses the wrong time reference ('now' instead of the fixed '2100-12-31 23:59:00'), altering the intended logic. These issues span multiple clauses and require restructuring the query logic to fix, so it is a Global error.",
            "error_type": "Global: incorrect join"
        },
        "1f0a42220dea53233554b8ab": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Show me the difference between patient 002-1185's total input and output yesterday.",
            "gold_sql": "SELECT ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') ) - ( SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' ) ) AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') )",
            "pred_sql": "SELECT sum(CASE WHEN intakeoutput.cellpath LIKE '%intake%' THEN intakeoutput.cellvaluenumeric ELSE 0 END) - sum(CASE WHEN intakeoutput.cellpath LIKE '%output%' THEN intakeoutput.cellvaluenumeric ELSE 0 END) FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '002-1185' AND intakeoutput.intakeoutputtime LIKE '2100-12-31%'",
            "gold_answer": "[['2826.0']]",
            "pred_answer": "[['936.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL has a localized mistake in the WHERE clause: it filters intakeoutput.intakeoutputtime LIKE '2100-12-31%' (today) instead of filtering for yesterday using the required datetime(...) = datetime('2100-12-31 23:59:00','start of day','-1 day'). This temporal filter error is confined to a specific condition and does not require restructuring joins or the overall logic.",
            "error_type": "Local: other-temporal error"
        },
        "22bb11305202941a2417c8ab": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many times was milk of magnesia ud liq 30 ml prescribed for patient 006-102963 on the first hospital visit?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-102963' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND medication.drugname = 'milk of magnesia ud liq 30 ml'",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patientunitstayid = 61880 AND medication.drugname = 'milk of magnesia ud liq 30 ml'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL hard-codes a single patientunitstayid (61880) rather than using the subquery logic to identify the patient\u2019s first hospital visit by patienthealthsystemstayid and hospitaladmittime as required. By replacing the multi-step filter with a fixed unitstayid, it fundamentally changes the query\u2019s intent and yields the wrong result. This is not a minor syntax or column reference mistake but a structural flaw in how the first hospital visit is determined.",
            "error_type": "Global: incorrect filtering logic"
        },
        "fbe51bdcf93df9fe52db2682": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Present the count of icu visits for patient 027-100293 in 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.patientunitstayid ) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100293' ) AND strftime('%Y',patient.unitadmittime) = '2100'",
            "pred_sql": "SELECT count(patienthealthsystemstayid) FROM patient WHERE uniquepid = '027-100293' AND unitdischargeoffset >= 2100000000",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: unitdischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column 'unitdischargeoffset' in the patient table, causing the error 'no such column: unitdischargeoffset'. This is a localized column reference issue in the WHERE clause and does not affect the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "919f039cb4f4fe92f49e7c86": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many current patients belong to the 30s age category?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL AND patient.age BETWEEN 30 AND 39",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient WHERE age >= 30 AND age < 40 AND hospitaldischargeoffset IS NULL",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column hospitaldischargeoffset instead of the correct hospitaldischargetime. This is purely a column reference error localized to the WHERE clause and does not alter the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "23bd0f2e14627cd02d82be60": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the name of the lab test that patient 004-11678 received first on the current hospital visit?",
            "gold_sql": "SELECT lab.labname FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-11678' AND patient.hospitaldischargetime IS NULL ) ) ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT lab.labname FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.patientunitstayid = 11678 ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "gold_answer": "[['sodium']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins lab to patient but then filters on patient.patientunitstayid = 11678 (erroneously treating the unique PID as the unit stay ID) and omits the WHERE patient.hospitaldischargetime IS NULL condition entirely. This is not a simple typo or local clause mistake\u2014it fundamentally alters which records are selected and ignores the \"current hospital visit\" requirement. Correcting this requires restructuring the filter logic (using patient.uniquepid and checking hospitaldischargetime IS NULL), so it is a global error.",
            "error_type": "Global: incorrect filter and join logic"
        },
        "a18e5a51354eb5e0974771b6": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Among patients who received non-invasive ventilation this year, what are the top four most frequent medications that followed within the same month?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'non-invasive ventilation' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.drugstarttime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugstarttime LIKE '2100-11%' AND patient.unittype LIKE 'VENT' GROUP BY medication.drugname ORDER BY count(patient.patientunitstayid) DESC LIMIT 4",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['potassium chloride'], ['potassium chloride 20 meq in 50 ml ivpb **locked dose'], ['potassium chloride crys er 20 meq po tbcr']]",
            "pred_answer": "no such column: patient.unittype",
            "is_correct": false,
            "reasoning": "The predicted SQL references patient.unittype, which does not exist in the provided schema, causing a column reference error. This is a localized mistake in the WHERE clause that does not require restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "e3634a5a873426f73dde721b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What drugs are being added to patient 002-1185's prescription today, as compared to yesterday?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '002-1185' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') EXCEPT SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '002-1185' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day')",
            "pred_sql": "SELECT DISTINCT CASE WHEN datetime(medication.drugstarttime) = datetime('2100-12-31 23:59:59') THEN 'today' ELSE 'yesterday' END AS date FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-1185'",
            "gold_answer": "[['acetaminophen 325 mg po tabs']]",
            "pred_answer": "[['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday'], ['yesterday']]",
            "is_correct": false,
            "reasoning": "The predicted SQL does not follow the overall intended logic of finding drug names added today compared to yesterday. Instead of selecting and comparing medication.drugname sets for today and yesterday (using EXCEPT), it simply returns a CASE expression of 'today' or 'yesterday' labels without any drug names or set difference. This is a fundamental structural and logical error that affects the entire query rather than a localized clause.",
            "error_type": "Global: incorrect query logic"
        },
        "c18b36446697d1dd00ce17f4": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the maximum overall hospital cost that includes ipratropium bromide 0.02 % in soln this year?",
            "gold_sql": "SELECT MAX(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = 'ipratropium bromide 0.02 % in soln' ) ) AND datetime(cost.chargetime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT max(cost.cost) FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid WHERE cost.cost = 'ipratropium bromide 0.02 % in soln this year'",
            "gold_answer": "[['3713.41']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely fails to capture the intended logic: it never sums costs per hospital stay, never filters by the medication or by the year, and even compares the numeric cost column to a string that includes the drug name and 'this year'. It only joins cost to patient and then applies a nonsensical WHERE clause on cost.cost. Fixing this would require rewriting the core structure of the query (adding subqueries or GROUP BY, proper joins to medication, date filtering, and summing), not just tweaking a single clause. Therefore, this is a Global error.",
            "error_type": "Global: join/logical error"
        },
        "4dcadc3a7cd58583235ea6cf": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time when patient 017-100143 was prescribed atorvastatin and furosemide at the same time in 07/2100?",
            "gold_sql": "SELECT T1.drugstarttime FROM ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100143' ) AND medication.drugname = 'atorvastatin' AND strftime('%Y-%m',medication.drugstarttime) = '2100-07' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100143' ) AND medication.drugname = 'furosemide' AND strftime('%Y-%m',medication.drugstarttime) = '2100-07' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) ORDER BY T1.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT medication.drugstarttime FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE medication.drugname IN ('atorvastatin', 'furosemide') AND patient.uniquepid = '017-100143' AND strftime('%m%Y', medication.drugstarttime) = '072100' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "gold_answer": "[['2100-07-02 20:00:00']]",
            "pred_answer": "[['2100-07-04 02:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL simply filters medication records where the drug is either atorvastatin or furosemide and then takes the most recent date. It never enforces that both drugs were prescribed at the exact same time. The ground truth uses two subqueries (one for each drug) and then joins them on identical drugstarttime to ensure simultaneity. Furthermore, the predicted SQL\u2019s date filter strftime('%m%Y',\u2026) = '072100' is incorrectly formatted versus the required '%Y-%m' = '2100-07'. These mistakes alter the overall logic of the query\u2014simultaneity and correct month-year filtering\u2014so it is not a minor local fix but a fundamental structural error.",
            "error_type": "Global: incorrect join and date filtering logic"
        },
        "68b12c03eab7834e3298ca0d": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Can you tell me when patient 031-10407 had their first pleural fluid microbiology test in 11/2100?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10407' ) ) AND microlab.culturesite = 'pleural fluid' AND strftime('%Y-%m',microlab.culturetakentime) = '2100-11' ORDER BY microlab.culturetakentime ASC LIMIT 1",
            "pred_sql": "SELECT microlab.culturetakentime FROM patient INNER JOIN microlab ON patient.patientunitstayid = microlab.patientunitstayid WHERE patient.uniquepid = '031-10407' AND strftime('%Y %m',microlab.culturetakentime) = '2100 11'",
            "gold_answer": "[['2100-11-23 22:20:00']]",
            "pred_answer": "[['2100-11-22 15:20:00'], ['2100-11-23 22:20:00'], ['2100-11-23 22:20:00'], ['2100-11-23 22:20:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict to culture site = 'pleural fluid', misuses the strftime format (using '%Y %m' vs '%Y-%m'), and omits the ORDER BY\u2026LIMIT 1 to pull just the first result. All of these issues are confined to specific clauses (WHERE and SELECT) and can be corrected without changing the overall join structure or logic, so this is a Local error.",
            "error_type": "Local: temporal-function/filter error"
        },
        "4f38f917911345d009b28a4b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much did patient 004-11359 weigh when measured for the last time this month?",
            "gold_sql": "SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-11359' ) AND patient.admissionweight IS NOT NULL AND datetime(patient.unitadmittime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ORDER BY patient.unitadmittime DESC LIMIT 1",
            "pred_sql": "SELECT dischargeweight FROM patient WHERE uniquepid = '004-11359' ORDER BY patienthealthsystemstayid DESC LIMIT 1",
            "gold_answer": "[['74.8']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL not only uses the wrong column (dischargeweight instead of admissionweight) but also omits the critical time filter for \u201cthis month\u201d and does not order by unitadmittime. This is not a small typo but a fundamental change to the query\u2019s logic and structure, requiring significant restructuring to fix. Therefore it\u2019s a global error.",
            "error_type": "Global: incorrect logic and missing time filter"
        },
        "aba5ef6d5ebe30061e4ec2df": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the number of times patient 027-105098 got a urine event today.",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-105098' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day')",
            "pred_sql": "SELECT count(cost.eventid) FROM cost INNER JOIN patient ON cost.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '027-105098' AND cost.eventtype = 'urine' AND cost.eventtime = '2100-12-01'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "no such column: cost.eventtime",
            "is_correct": false,
            "reasoning": "The predicted query refers to cost.eventtime, which is not a valid column in the cost table, and it even uses the wrong table (cost) instead of intakeoutput for urine events. The primary issue is a missing/incorrect column reference rather than a wholesale restructuring of the query\u2019s logic. This is a localized error that can be fixed by using the correct table and column names.",
            "error_type": "Local: table/column reference error"
        },
        "07ac0c8bc729ad36ff0e48ae": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What diagnosis did patient 027-111437 receive the last time since 1 year ago?",
            "gold_sql": "SELECT diagnosis.diagnosisname FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-111437' ) ) AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ORDER BY diagnosis.diagnosistime DESC LIMIT 1",
            "pred_sql": "SELECT diagnosis.diagnosisname FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.patientunitstayid = 1027 AND diagnosis.diagnosistime > datetime('now', '-1 year')",
            "gold_answer": "[['hyponatremia']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s structure (JOIN diagnosis to patient and filtering by a time window) matches the ground truth, but the WHERE clause is wrong: it hard\u2010codes patientunitstayid = 1027 instead of selecting by the given uniquepid through patienthealthsystemstayid, and it uses datetime('now') instead of the fixed '2100-12-31 23:59:00' reference. These are localized mistakes in the WHERE filters that can be fixed without reworking the overall query logic.",
            "error_type": "Local: incorrect WHERE filter"
        },
        "46eb2774e27a79287f213ed3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last input time of patient 006-104324 on the first icu visit?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-104324' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.patientunitstayid = '006-104324' AND patient.hospitaldischargeoffset = 1 ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "gold_answer": "[['2100-05-10 10:00:00']]",
            "pred_answer": "no such column: patient.hospitaldischargeoffset",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column patient.hospitaldischargeoffset, causing an execution error. This is a localized issue with a column reference and does not alter the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "3a01a286c1423e44aaa74e8b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What drug was patient 022-102442 allergic to last month?",
            "gold_sql": "SELECT allergy.drugname FROM allergy WHERE allergy.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-102442' ) ) AND datetime(allergy.allergytime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month')",
            "pred_sql": "SELECT allergy.drugname FROM allergy INNER JOIN patient ON patient.patientunitstayid = allergy.patientunitstayid WHERE strftime('%Y %m', allergy.allergytime) = '2100 12' AND patient.uniquepid = '022-102442'",
            "gold_answer": "[['codeine phosphate'], ['lidocaine'], ['penicillin g benzathine']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly joins allergy to patient and filters by the given patient identifier, but it applies the wrong date filter for \"last month.\" Instead of using the 'start of month','-1 month' logic to target November (the month before the fixed current date of 2100-12-31), it hardcodes strftime('%Y %m') = '2100 12', which erroneously selects December. This is a mistake localized to the WHERE clause\u2019s temporal condition and does not require restructuring the query\u2019s overall logic or joins.",
            "error_type": "Local: temporal filter error"
        },
        "686a213e1cb9376d7b32c3c5": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the cost of a diagnosis of upper gi bleeding - esophageal?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'diagnosis' AND cost.eventid IN ( SELECT diagnosis.diagnosisid FROM diagnosis WHERE diagnosis.diagnosisname = 'upper gi bleeding - esophageal' )",
            "pred_sql": "SELECT sum(cost.cost) FROM diagnosis INNER JOIN cost ON diagnosis.patientunitstayid = cost.patientunitstayid WHERE diagnosis.diagnosisname = 'upper gastrointestinal bleeding - esophageal'",
            "gold_answer": "[['7.86']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the intended logic by joining cost and diagnosis on patientunitstayid rather than filtering cost.eventid to match diagnosis.diagnosisid and cost.eventtype = 'diagnosis'. It also uses the wrong diagnosis name text ('upper gastrointestinal bleeding - esophageal' vs 'upper gi bleeding - esophageal'), resulting in no matching rows. These issues span multiple parts of the query (JOIN condition, WHERE filters) and change the query\u2019s meaning, requiring a restructuring of the query logic.",
            "error_type": "Global: join error"
        },
        "fb6a8797ebccfafdd3738ab6": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the lab test that patient 027-101119 first had since 03/2100?",
            "gold_sql": "SELECT lab.labname FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101119' ) ) AND strftime('%Y-%m',lab.labresulttime) >= '2100-03' ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT lab.labname FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid INNER JOIN lab ON lab.patientunitstayid = patient.patientunitstayid WHERE cost.eventtype = 'lab' AND patient.uniquepid = '027-101119' AND datetime(cost.eventtime) >= datetime('2100 03 21 23:59:00') LIMIT 1",
            "gold_answer": "[['ptt ratio']]",
            "pred_answer": "no such column: cost.eventtime",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references a non-existent column cost.eventtime. This is a localized error in the SELECT\u2019s WHERE clause (a column reference issue), not a fundamental flaw in the overall query structure or join logic. It can be fixed by correcting the column name without restructuring the query\u2019s logic.",
            "error_type": "Local: table/column reference error"
        },
        "7f90858ee680596075465460": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many patients received a lithium lab test since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'lithium' AND strftime('%Y',lab.labresulttime) >= '2100' )",
            "pred_sql": "SELECT count(patientunitstayid) FROM lab WHERE labname LIKE '%lithium%' AND labresulttime LIKE '2100%'",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts the number of lab rows (tests) rather than the distinct number of patients, and it omits the DISTINCT and patient table reference entirely. It thus fundamentally changes the metric being computed (tests vs. patients) and requires restructuring the aggregation logic, not just a minor fix in one clause. This spans multiple parts of the query (FROM, SELECT, aggregation), altering the overall intent.",
            "error_type": "Global: aggregation error"
        },
        "a29b614ffd343441d111352e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the first time that patient 013-10167 has been prescribed medication via the rectal route on the current hospital visit?",
            "gold_sql": "SELECT medication.drugstarttime FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10167' AND patient.hospitaldischargetime IS NULL ) ) AND medication.routeadmin = 'rectal' ORDER BY medication.drugstarttime ASC LIMIT 1",
            "pred_sql": "SELECT medication.drugstarttime FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.patientunitstayid = '013-10167' AND medication.routeadmin = 'oral' AND medication.drugname = 'clonidine hydrochloride 100 mg'",
            "gold_answer": "[['2100-12-15 07:28:06']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fails to capture the overall structure required: it joins patient to medication but then filters patientunitstayid directly against the patient\u2019s unique ID, uses the wrong route ('oral' instead of 'rectal'), adds an extraneous drug filter, and omits the subquery logic to restrict to the current hospital visit. These issues span multiple clauses (JOIN, WHERE) and break the intended logic of identifying the current visit and the correct route, so they cannot be fixed by a minor local tweak.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "f88531ecfa6e7dda7883c2ed": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Calculate the number of patients diagnosed with acute copd exacerbation - with baseline hypoxemia in 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'acute copd exacerbation - with baseline hypoxemia' AND strftime('%Y',diagnosis.diagnosistime) = '2100' )",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.diagnosisname = 'acute copd exacerbation' AND substr(diagnosis.diagnosistime, 1, 4) = '2100'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['191.0']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s JOIN structure is acceptable, but the WHERE clause is incorrect in two local ways: it filters for diagnosisname = 'acute copd exacerbation' instead of the full 'acute copd exacerbation - with baseline hypoxemia', and it uses count(patient.patientunitstayid) instead of COUNT(DISTINCT patient.uniquepid). These mistakes are confined to the SELECT/WHERE clause and do not alter the overall query logic or table relationships.",
            "error_type": "Local: incorrect WHERE value and missing DISTINCT"
        },
        "eefab9f6dfaede81ed784769": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What new medications were introduced for patient 015-100025 today compared to the ones yesterday?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '015-100025' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') EXCEPT SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '015-100025' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day')",
            "pred_sql": "SELECT count(CASE WHEN datetime(drugstarttime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of day', '-1 day') THEN drugname ELSE NULL END) - count(CASE WHEN datetime(drugstarttime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of day', '-1 day') THEN drugname ELSE NULL END) FROM medication WHERE patientunitstayid = 150025",
            "gold_answer": "[['1 ml : heparin sodium (porcine) 5000 unit/ml ij soln'], ['1 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['100 ml flex cont : sodium chloride 0.9 % iv soln'], ['acetaminophen 325 mg po tabs'], ['alteplase 2 mg ij solr'], ['aspirin 81 mg po chew'], ['atorvastatin calcium 40 mg po tabs'], ['carvedilol 25 mg po tabs'], ['diphenhydramine hcl 25 mg po caps'], ['famotidine 20 mg po tabs'], ['nitroglycerin 0.4 mg sl subl'], ['oxycodone hcl 5 mg po tabs'], ['prednisone 10 mg po tabs'], ['prednisone 20 mg po tabs'], ['prednisone 5 mg po tabs'], ['sodium chloride 0.9 % ij soln']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the intended set-difference logic into an aggregate count subtraction, never filters for today (uses yesterday\u2019s date twice), and even uses a hard\u2010coded patientunitstayid instead of mapping uniquepid. This goes beyond a simple column or filter mistake and requires rewriting multiple clauses (SELECT, WHERE, the core logic). It is a global error in the overall query structure and logic.",
            "error_type": "Global: flawed query logic"
        },
        "5578185fae1372b4229faeb9": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many hours has it been since patient 006-106828 got their first prescription of dext 5%-nacl 0.45%-kcl 20meq lvp on the current hospital visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',medication.drugstarttime) ) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106828' ) AND patient.hospitaldischargetime IS NULL ) AND medication.drugname = 'dext 5%-nacl 0.45%-kcl 20meq lvp' ORDER BY medication.drugstarttime ASC LIMIT 1",
            "pred_sql": "SELECT strftime('%J', medication.drugstoptime) - strftime('%J', medication.drugstarttime) FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.uniquepid = '006-106828'",
            "gold_answer": "[['29.85']]",
            "pred_answer": "[['0.001'], ['0.003'], ['0.008'], ['0.008'], ['0.008'], ['0.012'], ['0.018'], ['0.04'], ['0.062'], ['0.115'], ['0.211'], ['0.285'], ['0.722'], ['1.006'], ['1.09'], ['1.407'], ['1.407'], ['1.407'], ['1.407'], ['1.407'], ['1.979'], ['2.008'], ['2.008'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to implement multiple crucial aspects of the requested query: it uses drugstoptime instead of the current time, omits filtering for the specific drug name, does not restrict to the current hospital visit, does not select only the first prescription (no ORDER BY/LIMIT), and does not multiply the day difference by 24. These omissions and miscalculations affect the overall logic and structure of the query, requiring substantial restructuring rather than a simple fix in one clause.",
            "error_type": "Global: flawed logic and structure"
        },
        "e54f79288280b63cd8d19288": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Show me the four most common specimens tested in 2100.",
            "gold_sql": "SELECT T1.culturesite FROM ( SELECT microlab.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM microlab WHERE strftime('%Y',microlab.culturetakentime) = '2100' GROUP BY microlab.culturesite ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT labname FROM lab GROUP BY labname ORDER BY count(labname) DESC LIMIT 4",
            "gold_answer": "[['blood, venipuncture'], ['nasopharynx'], ['sputum, tracheal specimen'], ['urine, catheter specimen']]",
            "pred_answer": "[['bedside glucose'], ['glucose'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL pulls from the lab table and uses labname, whereas the question concerns specimen cultures (microlab.culturesite) tested in year 2100. This is due to referencing the wrong table and column, not a deeper structural or multi-clause logical error.",
            "error_type": "Local: table reference error"
        },
        "e62f5265a62839d76b9c6085": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the total number of patients in ward 1027 since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.wardid = 1027 AND datetime(patient.unitadmittime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT count(patientunitstayid) FROM patient WHERE wardid = 1027 AND hospitaldischargetime IS NOT NULL AND hospitaldischargetime > (TIMESTAMP 'now' - 365)",
            "gold_answer": "[['1.0']]",
            "pred_answer": "near \"'2100-12-31 23:59:00'\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL not only contains a syntax error with the TIMESTAMP 'now' expression (violating the time\u2010handling assumptions) but also fundamentally changes the query\u2019s logic. It filters on hospitaldischargetime instead of unitadmittime, requires hospitaldischargetime IS NOT NULL (thus excluding current patients), and counts patientunitstayid rather than distinct patient.uniquepid. These mistakes span multiple clauses and alter the intended meaning, so correcting it requires restructuring the WHERE clause and the SELECT aggregation, not just tweaking a single condition.",
            "error_type": "Global: logical error"
        },
        "f909c0386f0ae38828a9dc22": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last time patient 033-11873 came to the hospital through floor?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '033-11873' AND patient.hospitaladmitsource = 'floor' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "pred_sql": "SELECT patient.unitadmittime FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '033-11873' ORDER BY patient.unitadmittime DESC LIMIT 1",
            "gold_answer": "[['2100-03-07 21:45:00']]",
            "pred_answer": "[['2100-03-18 02:57:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic by joining the wrong table (vitalperiodic) and using unitadmittime instead of hospitaladmittime. It also omits the required filter on hospitaladmitsource = 'floor' and the discharge check. This is not a minor syntax or reference mistake but a complete change of the intended structure and meaning.",
            "error_type": "Global: join error"
        },
        "900d73ff4784d0bc4c545e13": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Find the length in days of the first icu stay for patient 012-11370.",
            "gold_sql": "SELECT strftime('%J',patient.unitdischargetime) - strftime('%J',patient.unitadmittime) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-11370' ) AND patient.unitadmittime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%J', patient.hospitaladmittime) - strftime('%J', patient.unitadmittime)) - 1 FROM patient INNER JOIN icustay ON patient.patientunitstayid = icustay.patientunitstayid INNER JOIN vitalaperiodic ON icustay.patientunitstayid = vitalaperiodic.patientunitstayid WHERE patient.uniquepid = '012-11370' ORDER BY patient.hospitaladmittime LIMIT 1",
            "gold_answer": "[['5.401']]",
            "pred_answer": "no such table: icustay",
            "is_correct": false,
            "reasoning": "The predicted query references a non-existent table `icustay` (and even misspells `vitalperiodic` as `vitalaperiodic`), causing a missing table error. This is a straightforward table/column reference mistake localized to the FROM/JOIN clauses and does not require restructuring the entire query logic.",
            "error_type": "Local: table reference error"
        },
        "1db95e938a46a412595101d6": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Among patients in their 50s , what are the top five prescribed drugs in 2100?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 50 AND 59 ) AND strftime('%Y',medication.drugstarttime) = '2100' GROUP BY medication.drugname ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE strftime('%Y', patient.admissiontime) = '2100' AND strftime('%Y', medication.drugstarttime) = '2100' AND patient.patientage >= '50' ORDER BY medication.drugname DESC LIMIT 5",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['acetaminophen'], ['fentanyl'], ['midazolam'], ['potassium chloride']]",
            "pred_answer": "no such column: patient.admissiontime",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column patient.admissiontime, causing a 'no such column' error. This is a localized column reference mistake that does not alter the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "d36a003d44b40986f4c9f773": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What does a procedure under the name bronchodilator - ipratropium cost?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'treatment' AND cost.eventid IN ( SELECT treatment.treatmentid FROM treatment WHERE treatment.treatmentname = 'bronchodilator - ipratropium' )",
            "pred_sql": "SELECT sum(cost.cost) FROM treatment INNER JOIN cost ON treatment.treatmentid = cost.eventid WHERE treatment.treatmentname = 'bronchodilator - ipratropium'",
            "gold_answer": "[['7.82']]",
            "pred_answer": "[['3804.96']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses SUM(cost.cost) and omits the WHERE cost.eventtype = 'treatment' filter, whereas the ground truth selects the distinct cost for that treatment. The mistake is localized to the SELECT aggregation and missing eventtype condition; the overall query structure (joining treatment to cost) is correct. Thus, this is a local error in aggregation and filtering, not a structural or multi-clause logic error.",
            "error_type": "Local: aggregation/filter error"
        },
        "222b30c626c9d40e3e5ba330": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the input that patient 016-10105 had first had on the first icu visit?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10105' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.cellpath FROM intakeoutput INNER JOIN patient ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '016-10105' ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "gold_answer": "[['p.o.']]",
            "pred_answer": "[['flowsheet|flowsheet cell labels|i&o|output (ml)|urine']]",
            "is_correct": false,
            "reasoning": "The predicted query completely alters the intended logic: it does not restrict to the patient\u2019s first ICU visit (no filtering on unitadmittime/unitdischargetime), it fails to filter for input events (no cellpath LIKE '%intake%'), orders by hospitaladmittime instead of intakeoutput time, and even selects the wrong column (cellpath vs. celllabel). These errors span multiple clauses and require a full restructure of the query, not just a minor fix in one clause.",
            "error_type": "Global: join-logic error"
        },
        "adf3b75d45df166e7546b701": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many days have there been since patient 002-10122's admission to the hospital?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.hospitaladmittime) ) FROM patient WHERE patient.uniquepid = '002-10122' AND patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT strftime('%J', hospitaladmittime) - strftime('%J', admissiontime) AS daysadmitted FROM patient WHERE uniquepid = '002-10122'",
            "gold_answer": "[['2.263']]",
            "pred_answer": "no such column: admissiontime",
            "is_correct": false,
            "reasoning": "The predicted query references a non-existent column admissiontime instead of the correct hospitaladmittime, leading to a column reference error. This is a localized mistake in the SELECT clause and WHERE clause rather than a flaw in the overall query logic or structure.",
            "error_type": "Local: table/column reference error"
        },
        "53c37ca3610c5c63ad42caa5": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Give me the details of the time patient 021-102127 was admitted to the hospital in 2100.",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '021-102127' AND strftime('%Y',patient.hospitaladmittime) = '2100'",
            "pred_sql": "SELECT patient.hospitaladmittime FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '021-102127' AND strftime('%Y', patient.hospitaladmittime) = '2100'",
            "gold_answer": "[['2100-03-15 17:09:00']]",
            "pred_answer": "[['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00'], ['2100-03-15 17:09:00']]",
            "is_correct": false,
            "reasoning": "The predicted query adds an INNER JOIN to the vitalperiodic table on patientunitstayid, which is not requested by the question. This join is unnecessary and unrelated to admission time, and it causes the admission time to be duplicated once for each matching vitalperiodic record. Fixing this would require removing the join entirely rather than a simple tweak within a single clause, as it fundamentally changes the query logic and structure.",
            "error_type": "Global: incorrect-join error"
        },
        "f82872c399e9c56e24060fd1": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the procedure that was performed two or more times last month on patient 010-10275?",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, COUNT( treatment.treatmenttime ) AS C1 FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10275' ) ) AND datetime(treatment.treatmenttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 >= 2",
            "pred_sql": "SELECT DISTINCT vitalperiodic.vitalname FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.unitdischargeoffset = '02' AND patient.uniquepid = '010-10275' AND vitalperiodic.vitalname LIKE '%procedure%' GROUP BY vitalperiodic.vitalname HAVING count(vitalperiodic.patientunitstayid) > 2",
            "gold_answer": "[['non-invasive ventilation']]",
            "pred_answer": "no such column: vitalperiodic.vitalname",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column \"vitalperiodic.vitalname\", causing a column reference error. This is a localized mistake in the SELECT clause rather than a flaw in the overall query structure or logic. The fix would involve correcting the column and table references, but the rest of the query framework (SELECT, JOIN, GROUP BY, HAVING) remains intact.",
            "error_type": "Local: table/column reference error"
        },
        "cf12388db91329bf2b7bd2cf": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many times since 1 year ago did patient 030-11483 receive a hct test?",
            "gold_sql": "SELECT COUNT(*) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-11483' ) ) AND lab.labname = 'hct' AND datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT count(vitalperiodic.observationtime) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '030-11483' AND vitalperiodic.observationtime >= datetime('2100-01-01 00:00:00', 'start of year', '-1 year')",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['508.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts rows from the vitalperiodic table (vital sign observations) instead of the lab table, and thus uses an entirely different table and join logic than intended. This mistake affects the core logic of the query, not just a localized clause or alias. Therefore, it is a global error in the query structure and table relationships.",
            "error_type": "Global: incorrect table join"
        },
        "6dd0c27259db780596544f5f": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much did patient 031-10188 weigh the first time it was measured in 09/2100?",
            "gold_sql": "SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10188' ) AND patient.admissionweight IS NOT NULL AND strftime('%Y-%m',patient.unitadmittime) = '2100-09' ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT patient.admissionweight FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '031-10188' AND strftime('%Y-%m-%d', vitalperiodic.observationtime) = '2100-09-01'",
            "gold_answer": "[['94.8']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the patient table to vitalperiodic and filters on vitalperiodic.observationtime when the question is specifically asking for the admission weight recorded in the patient table (patient.admissionweight) at the first unit admission in September 2100. This is a fundamental logic error: it uses the wrong table for weight data and the wrong time filter, altering the intended query structure and meaning. Fixing it requires removing the join, changing the date criteria to unitadmittime, and ordering by that field\u2014i.e., a global restructuring of the query.",
            "error_type": "Global: join-logic error"
        },
        "8a40ba404a60b00e4b158864": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "This year, what are the top five most commonly taken specimens for patients within the same month after the diagnosis of prostate ca?",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'prostate ca' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.culturetakentime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.culturetakentime,'start of month') GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT diagnosis.icd9code FROM diagnosis INNER JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE strftime('%Y %m', diagnosis.diagnosistime) = '2100 12' AND diagnosis.icd9code LIKE '585.4%' GROUP BY diagnosis.icd9code ORDER BY count(diagnosis.icd9code) DESC LIMIT 5",
            "gold_answer": "[['sputum, expectorated']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL entirely abandons the intended logic of retrieving the most common microlab.culturesite within the same month after a 'prostate ca' diagnosis this year. Instead, it selects diagnosis.icd9code, filters on a year\u2010month string and an unrelated ICD9 pattern, and groups by diagnoses rather than specimens. It fails to join diagnosis to microlab, omits the same\u2010month and post\u2010diagnosis conditions, and uses the wrong column and table. Fixing this would require rewriting major parts of the query, not just a localized tweak.",
            "error_type": "Global: incorrect table and logic"
        },
        "3c14c5beb79448ccd421c493": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the first time that patient 021-10001 had the maximum value of sao2 yesterday?",
            "gold_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '021-10001' ) ) AND vitalperiodic.sao2 IS NOT NULL AND datetime(vitalperiodic.observationtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') ORDER BY vitalperiodic.sao2 DESC, vitalperiodic.observationtime ASC LIMIT 1",
            "pred_sql": "SELECT vitalperiodic.observationtime FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '021-10001' AND vitalperiodic.observationtime >= datetime('2100 12 31 23:59:00',' 1 day') AND vitalperiodic.sao2 = ( SELECT max(sao2) FROM vitalperiodic INNER JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '021-10001' AND vitalperiodic.observationtime >= datetime('2100 12 31 23:59:00',' 1 day') )",
            "gold_answer": "[['2100-12-30 19:59:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses an incorrect datetime function call and filter for \"yesterday\". It writes datetime('2100 12 31 23:59:00',' 1 day') instead of the prescribed datetime('2100-12-31 23:59:00','start of day','-1 day'). As a result, no rows match the date condition and the max(sao2) subquery also uses the same wrong filter. This is a localized error in the WHERE clause\u2019s date handling rather than a flaw in the overall join strategy or query structure.",
            "error_type": "Local: other-temporal error"
        },
        "12a07e53370dee4c45959cd3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Which are the top three most frequent output events since 2 year ago?",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime) >= datetime('2100-12-31 23:59:00','-2 year') GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT intakeoutput.cellpath FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE intakeoutput.cellpath IS NOT NULL AND intakeoutput.cellpath LIKE '%output%' AND strftime('%Y', intakeoutput.intakeoutputtime) < strftime('%Y', 'now') - 2 ORDER BY intakeoutput.cellpath DESC LIMIT 3",
            "gold_answer": "[['stool'], ['urine'], ['urine catheter']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally deviates from the intended structure and logic. Instead of aggregating by celllabel and ranking the counts to find the top three frequent output events since two years ago, it selects cellpath (not celllabel), adds an unnecessary JOIN to the patient table, applies an incorrect time filter using strftime('%Y') < strftime('%Y','now') - 2, and simply orders by cellpath descending with a LIMIT 3. These changes alter the overall query purpose\u2014there is no grouping, counting, or proper time window check\u2014so this is not a localized fix but a structural logic error.",
            "error_type": "Global: flawed aggregation and filtering logic"
        },
        "38ed40195f70eb4a952a2a53": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many times was morphine 5 mg/ml injection : 1 ml vial medication prescribed?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.drugname = 'morphine 5 mg/ml injection : 1 ml vial'",
            "pred_sql": "SELECT count(DISTINCT medication.patientunitstayid) FROM medication INNER JOIN treatment ON medication.patientunitstayid = treatment.patientunitstayid WHERE medication.drugname = 'morphine 5 mg/ml'",
            "gold_answer": "[['12.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query not only mismatches the drug name filter ('morphine 5 mg/ml' vs the exact 'morphine 5 mg/ml injection : 1 ml vial') but also introduces an unnecessary INNER JOIN to the treatment table and changes the aggregation from COUNT(*) of medication rows to COUNT(DISTINCT patientunitstayid). This alters the overall query logic and structure, affecting the intended result.",
            "error_type": "Global: incorrect join and aggregation"
        },
        "f10a334eb28950674d5eac2e": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the minimum total cost of the hospital visits that involve a procedure called insertion of venous catheter for hemodialysis since 1 year ago?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'insertion of venous catheter for hemodialysis' ) ) AND datetime(cost.chargetime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT sum(CASE WHEN cost.eventtype = 'Procedure' AND cost.description = 'insertion of venous catheter for hemodialysis' THEN cost.cost ELSE 0 END) FROM cost INNER JOIN patient ON cost.patienthealthsystemstayid = patient.patienthealthsystemstayid WHERE cost.eventdate >= datetime(patient.hospitaladmittime, '-1 year') AND cost.eventdate <= datetime(patient.hospitaladmittime)",
            "gold_answer": "[['1640.7']]",
            "pred_answer": "no such column: cost.description",
            "is_correct": false,
            "reasoning": "The predicted SQL not only references a non-existent column (cost.description) but also completely changes the intended logic\u2014joining cost directly to patient, using the wrong date filters, failing to group by visit and take the minimum across sums, and ignoring the treatment table. Fixing these issues would require a major restructuring of the query, not just a local tweak.",
            "error_type": "Global: join and aggregation logic error"
        },
        "a22b861f262fa2427d8449ff": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What are the top three frequent input events this year?",
            "gold_sql": "SELECT T1.celllabel FROM ( SELECT intakeoutput.celllabel, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM intakeoutput WHERE intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY intakeoutput.celllabel ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT cellpath FROM intakeoutput WHERE cellpath LIKE '%input%' AND intakeoutputtime >= datetime('2100 12 31 23:59:00','start of year') GROUP BY cellpath ORDER BY count(cellpath) DESC LIMIT 3",
            "gold_answer": "[['continuous infusion meds'], ['ns ivf'], ['p.o.']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistakes are confined to specific clauses: it uses the wrong column (cellpath instead of celllabel), the wrong LIKE pattern ('%input%' instead of '%intake%'), and an incorrectly formatted datetime condition. These are localized errors in the SELECT and WHERE clauses that can be fixed without restructuring the entire query logic.",
            "error_type": "Local: column reference/value parsing error"
        },
        "d6c3eb4c10881ccf9ced74ae": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Give me the three most frequent procedures performed.",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM treatment GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT procedure_name FROM procedure WHERE procedure_name IS NOT NULL GROUP BY procedure_name ORDER BY count(procedure_name) DESC LIMIT 3",
            "gold_answer": "[['chest x-ray'], ['mechanical ventilation'], ['stress ulcer prophylaxis - pantoprazole']]",
            "pred_answer": "no such table: procedure",
            "is_correct": false,
            "reasoning": "The predicted SQL references a table named `procedure` and column `procedure_name`, which do not exist in the given schema. This is a localized issue with table/column references and does not involve the overall query logic or structure.",
            "error_type": "Local: table/column reference error"
        },
        "34d60bc7469406d563e8cc3b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was patient 010-10081's first value of ionized calcium this month?",
            "gold_sql": "SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10081' ) ) AND lab.labname = 'ionized calcium' AND datetime(lab.labresulttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT DISTINCT lab.labresult FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE lab.labname = 'ionized calcium' AND patient.uniquepid = '010-10081' AND strftime('%Y %m', lab.labresulttime) = '2100 10' LIMIT 1",
            "gold_answer": "[['4.88']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fails because it misparses \u201cthis month,\u201d using strftime('%Y %m') = '2100 10' (October) instead of filtering December 2100 via the prescribed start\u2010of\u2010month logic. This is a localized mistake in the WHERE clause\u2019s time filter, not a fundamental restructuring of joins or the overall logic.",
            "error_type": "Local: temporal filter error"
        },
        "107f5deba92d185055ac3f20": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How many patients were diagnosed with acute respiratory failure within 2 months following the previous diagnosis of pneumonia in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'pneumonia' AND strftime('%Y',diagnosis.diagnosistime) = '2100' ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory failure' AND strftime('%Y',diagnosis.diagnosistime) = '2100' ) AS T2 WHERE T1.diagnosistime < T2.diagnosistime AND datetime(T2.diagnosistime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE vitalperiodic.observationtime = ( SELECT diagnosis.diagnosistime FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.icd9code = '78552' ORDER BY diagnosis.diagnosistime DESC LIMIT 1 ) + 2 MONTH AND vitalperiodic.observationtime < ( SELECT diagnosis.diagnosistime FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE diagnosis.icd9code = '250.41' ORDER BY diagnosis.diagnosistime DESC LIMIT 1 ) + 2 MONTH",
            "gold_answer": "[['107.0']]",
            "pred_answer": "near \"MONTH\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted query completely diverges from the intended logic: it brings in the vitalperiodic table (irrelevant to counting diagnoses), uses ICD9 codes instead of diagnosis names, compares observationtime rather than diagnosistime, and applies invalid \u2018+ 2 MONTH\u2019 syntax. These issues span multiple clauses and fundamentally alter the query structure and meaning, not just a local mistake in a single clause.",
            "error_type": "Global: logical structure error"
        },
        "765941e9ac0c6dd1539c97a8": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 030-12080 come to the hospital via chest pain center for the first time?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '030-12080' AND patient.hospitaladmitsource = 'chest pain center' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT patient.hospitaladmittime FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '030-12080'",
            "gold_answer": "[['2100-01-02 15:12:00']]",
            "pred_answer": "[['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00'], ['2100-01-02 15:12:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query structure by introducing an unnecessary JOIN to the vitalperiodic table, omitting the hospitaladmitsource filter ('chest pain center'), excluding the discharge-time check (hospitaldischargetime IS NOT NULL), and failing to order and limit for the first admission. These issues go beyond a simple typo or missing condition in one clause; they alter the overall logic and data relationships, producing repeated rows rather than the single first admission time.",
            "error_type": "Global: incorrect join strategy"
        },
        "73901b4a804f0cdbd67987e9": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What medication was patient 002-11177 prescribed two times this month?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, COUNT( medication.drugstarttime ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-11177' ) ) AND datetime(medication.drugstarttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') GROUP BY medication.drugname ) AS T1 WHERE T1.C1 = 2",
            "pred_sql": "SELECT medication.drugname FROM medication INNER JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-11177' AND medication.drugstarttime LIKE '2100-02-%' ORDER BY medication.drugstarttime DESC LIMIT 2",
            "gold_answer": "[['1000 ml  -  potassium chloride in nacl 20-0.9 meq/l-% iv soln'], ['500 ml  -  sodium chloride 0.9 % iv soln'], ['alprazolam 0.25 mg po tabs'], ['morphine inj'], ['nitroglycerin 0.4 mg sl subl']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic: it uses a simple LIKE filter on medication.drugstarttime for \u201c2100-02-%\u201d (wrong month), fails to restrict to the current month (December 2100), omits the GROUP BY/COUNT/HAVING to find drugs prescribed exactly twice, and arbitrarily LIMITs to 2 rows. Fixing this is not a local tweak but requires rebuilding the aggregation and proper time filtering. This is a structural/logic error.",
            "error_type": "Global: incorrect logic"
        },
        "44c293f67498109bcfc02beb": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the organism found in the first microbiology test done on the patient 031-10407's nasopharynx last month?",
            "gold_sql": "SELECT microlab.organism FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10407' ) ) AND microlab.culturesite = 'nasopharynx' AND datetime(microlab.culturetakentime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') ORDER BY microlab.culturetakentime ASC LIMIT 1",
            "pred_sql": "SELECT microlab.organism FROM patient INNER JOIN microlab ON patient.patientunitstayid = microlab.patientunitstayid WHERE patient.uniquepid = '031-10407' AND strftime('%Y-%m-%d',microlab.culturetakentime) LIKE '2015-11-18'",
            "gold_answer": "[['other']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fails only in the WHERE clause: it hardcodes a specific date ('2015-11-18') instead of filtering for \u201clast month\u201d and also omits the culturesite = 'nasopharynx' condition. The table relationships and overall structure (JOIN patient-to-microlab, selecting microlab.organism) are correct. These mistakes are confined to the value conditions in the WHERE clause and do not require reworking the query\u2019s joins or logic flow. Therefore, this is a localized WHERE\u2010clause error.",
            "error_type": "Local: value parsing error"
        },
        "c6ba9aee9d82b7f7b53f02c0": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Get me patient 006-101341's total output volume on 01/07/2100.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-101341' ) ) AND intakeoutput.cellpath LIKE '%output%' AND strftime('%Y-%m-%d',intakeoutput.intakeoutputtime) = '2100-01-07'",
            "pred_sql": "SELECT intakeoutput.cellvalue * intakeoutput.cellvaluenumerical AS totalvol FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE patient.uniquepid = '006-101341' AND intakeoutput.intakeoutputtime = '2100-01-07' AND intakeoutput.cellpath LIKE '%output%'",
            "gold_answer": "[['5415.0']]",
            "pred_answer": "no such column: intakeoutput.cellvalue",
            "is_correct": false,
            "reasoning": "The predicted SQL misreferences columns inside the SELECT clause\u2014there is no intakeoutput.cellvalue or cellvaluenumerical column (the correct column is cellvaluenumeric). This is a localized column reference error that doesn\u2019t require restructuring joins or overall logic.",
            "error_type": "Local: column reference error"
        },
        "620abef8e30470561bc7876b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the procedure that was given two times to patient 004-10113 in 08/this year?",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, COUNT( treatment.treatmenttime ) AS C1 FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-10113' ) ) AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',treatment.treatmenttime) = '08' GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 = 2",
            "pred_sql": "SELECT DISTINCT diagnosis.diagnosisname FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE patient.uniquepid = '004-10113' AND strftime('%m', diagnosis.diagnosistime) = '08' AND diagnosis.diagnosisid IN (1116, 1117)",
            "gold_answer": "[['vascular catheter placement'], ['vasodilating agent - iv - nicardipine']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query completely uses the diagnosis table instead of the treatment table and filters on diagnosis IDs, whereas the intended query must count treatments per patient in a given month and then select those with exactly two occurrences. This is not a minor typo or misplaced condition but a fundamental misselection of the data source and logic. Fixing it would require rewriting the entire query structure, switching tables, joins, and grouping logic, so it is a global error.",
            "error_type": "Global: incorrect-table-and-logic"
        },
        "e6f31fd573d77d5e1ae39ef3": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Tell me the total number of patients who were diagnosed with leukocytosis - leukemoid reaction since 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'leukocytosis - leukemoid reaction' AND strftime('%Y',diagnosis.diagnosistime) >= '2100' )",
            "pred_sql": "SELECT count(DISTINCT patientunitstayid) FROM diagnosis WHERE icd9code IN ( '5188', '5189', '5190', '5191', '5192', '5193', '5194', '5195' )",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query logic: it filters by icd9code instead of diagnosisname, omits the time constraint (since 2100), and counts directly from the diagnosis table rather than linking to the patient table for unique patients. These errors span multiple clauses (SELECT, WHERE) and alter the intended meaning, requiring significant restructuring to correct.",
            "error_type": "Global: logical inconsistency"
        },
        "a99eb67257698883467f88f8": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the length of stay in days for patient 017-101105's first hospital visit?",
            "gold_sql": "SELECT strftime('%J',patient.hospitaldischargetime) - strftime('%J',patient.hospitaladmittime) FROM patient WHERE patient.uniquepid = '017-101105' AND patient.hospitaladmittime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT strftime('%J', patient.hospitaldischargetime) - strftime('%J', patient.hospitaladmittime) AS los FROM patient WHERE patientunitstayid = '017-101105'",
            "gold_answer": "[['1.536']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL filters on patientunitstayid instead of uniquepid, using the wrong column to identify the patient. This is a localized mistake in the WHERE clause (column reference error) and can be fixed without restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "bf399a0a344947fcaf45438b": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was patient 032-10119's last hospital visit?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '032-10119' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "pred_sql": "SELECT patient.hospitaldischargedatetime FROM patient INNER JOIN cost ON patient.patientunitstayid = cost.patientunitstayid WHERE patient.uniquepid = '032-10119' ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "gold_answer": "[['2100-10-20 06:21:08']]",
            "pred_answer": "no such column: patient.hospitaldischargedatetime",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column hospitaldischargedatetime and even includes an unnecessary JOIN to the cost table. The primary failure is a bad column reference (patient.hospitaldischargedatetime does not exist in the schema). This is a localized mistake that doesn\u2019t alter the overall query structure or intended logic beyond the wrong column name.",
            "error_type": "Local: table/column reference error"
        },
        "70857240166bae2581b96559": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the name of the last input that patient 016-10029 had yesterday?",
            "gold_sql": "SELECT intakeoutput.celllabel FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10029' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day') ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputname FROM patient INNER JOIN intakeoutput ON patient.patientunitstayid = intakeoutput.patientunitstayid WHERE intakeoutput.intakeoutputtime LIKE '2100-12-31' AND patient.patientunitstayid = '016-10029' AND intakeoutput.cellpath LIKE '%input%' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "gold_answer": "[['p.o.']]",
            "pred_answer": "no such column: intakeoutput.intakeoutputname",
            "is_correct": false,
            "reasoning": "The predicted query references a non-existent column `intakeoutput.intakeoutputname`, causing the error \u201cno such column\u201d. This is a simple column reference mistake and does not affect the overall query structure or logic, so it is a localized error.",
            "error_type": "Local: column reference error"
        },
        "bd2f163685751c157c0c3933": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What is the known allergy of patient 025-13060 since 08/2100?",
            "gold_sql": "SELECT allergy.allergyname FROM allergy WHERE allergy.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-13060' ) ) AND strftime('%Y-%m',allergy.allergytime) >= '2100-08'",
            "pred_sql": "SELECT allergyname FROM allergy WHERE patientunitstayid = '025-13060' AND allergytime >= '2100-08-01 00:00:00'",
            "gold_answer": "[['amoxicillin'], ['cefuroxime'], ['levofloxacin'], ['prednisone']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL directly compares allergy.patientunitstayid to the patient\u2019s unique PID ('025-13060') instead of mapping the unique PID to the correct patientunitstayid via the patient table. This is a mistake in the column used for filtering\u2014it doesn\u2019t require restructuring the entire query logic but simply the correct join/column reference.",
            "error_type": "Local: table/column reference error"
        },
        "7bd605f170632966619d3d2f": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "How much does albuterol/ipratropium neb 3ml cost?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'medication' AND cost.eventid IN ( SELECT medication.medicationid FROM medication WHERE medication.drugname = 'albuterol/ipratropium neb 3ml' )",
            "pred_sql": "SELECT DISTINCT cost.cost FROM medication INNER JOIN cost ON medication.patientunitstayid = cost.patienthealthsystemstayid WHERE medication.drugname = 'albuterol/ipratropium' AND medication.dosage = '3'",
            "gold_answer": "[['13.8']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters how cost is associated with the medication. Instead of joining cost.eventid to medication.medicationid and filtering cost.eventtype = 'medication', it joins medication.patientunitstayid to cost.patienthealthsystemstayid. It also misnames the drug and dosage. These join and filter mistakes change the overall query logic and require restructuring the query to correct the relationships, not just a simple typo fix.",
            "error_type": "Global: incorrect join relationship"
        },
        "28d92a418e13b07d795a817c": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When was the last total protein test that patient 011-10034 received?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '011-10034' ) ) AND lab.labname = 'total protein' ORDER BY lab.labresulttime DESC LIMIT 1",
            "pred_sql": "SELECT lab.labresulttime FROM lab INNER JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.patientunitstayid = 11110034 AND lab.labname = 'Total Protein' ORDER BY lab.labresulttime DESC LIMIT 1",
            "gold_answer": "[['2100-05-14 08:50:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL filters on patient.patientunitstayid = 11110034 rather than matching the uniquepid = '011-10034' (and even misconstrues the ID format). It also joins on patientunitstayid instead of using the patienthealthsystemstayid/uniquepid relationship required by the ground truth. This is a localized mistake in the WHERE clause (wrong column and value), not a fundamental structural or multi-clause logic issue, so it is a Local error.",
            "error_type": "Local: column reference error"
        },
        "b77c2915664d4f7faa9af936": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "When did patient 002-12250 get input since 08/11/2100 for the last time?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-12250' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND strftime('%Y-%m-%d',intakeoutput.intakeoutputtime) >= '2100-08-11' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput INNER JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '002-12250' AND intakeoutput.intakeoutputtime >= '2100-08-11'",
            "gold_answer": "[['2100-09-24 20:00:00']]",
            "pred_answer": "[['2100-09-19 06:38:00'], ['2100-09-19 06:38:00'], ['2100-09-19 09:23:00'], ['2100-09-19 15:00:00'], ['2100-09-19 18:46:00'], ['2100-09-19 18:46:00'], ['2100-09-19 18:50:00'], ['2100-09-19 19:59:00'], ['2100-09-19 22:32:00'], ['2100-09-20 09:00:00'], ['2100-09-20 10:00:00'], ['2100-09-20 13:48:00'], ['2100-09-20 19:59:00'], ['2100-09-20 19:59:00'], ['2100-09-20 20:34:00'], ['2100-09-21 00:00:00'], ['2100-09-21 02:55:00'], ['2100-09-21 02:55:00'], ['2100-09-21 02:55:00'], ['2100-09-21 06:00:00'], ['2100-09-21 09:00:00'], ['2100-09-21 11:00:00'], ['2100-09-21 11:00:00'], ['2100-09-21 11:00:00'], ['2100-09-21 15:29:00'], ['2100-09-21 19:30:00'], ['2100-09-21 19:30:00'], ['2100-09-21 19:30:00'], ['2100-09-22 02:47:00'], ['2100-09-22 11:53:00'], ['2100-09-22 11:53:00'], ['2100-09-22 11:53:00'], ['2100-09-22 14:32:00'], ['2100-09-22 14:32:00'], ['2100-09-22 17:00:00'], ['2100-09-23 05:00:00'], ['2100-09-23 05:00:00'], ['2100-09-23 09:00:00'], ['2100-09-23 23:00:00'], ['2100-09-24 01:55:00'], ['2100-09-24 08:42:00'], ['2100-09-24 19:58:00'], ['2100-09-24 20:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins the correct tables (intakeoutput to patient) and filters by patient.uniquepid and date, preserving the overall query structure. However, it fails to restrict to intake events (missing intakeoutput.cellpath LIKE '%intake%') and does not apply ORDER BY intakeoutputtime DESC LIMIT 1 to return only the last time. These are localized mistakes in the WHERE clause and missing ORDER BY/LIMIT rather than a structural or multi-clause logic error.",
            "error_type": "Local: filter/order error"
        },
        "0e04981caf3dfd83794866ec": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Provide the id list of patients who were diagnosed with cerebral subdural hematoma - secondary to anticoagulation since 2100.",
            "gold_sql": "SELECT DISTINCT patient.uniquepid FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'cerebral subdural hematoma - secondary to anticoagulation' AND strftime('%Y',diagnosis.diagnosistime) >= '2100' )",
            "pred_sql": "SELECT patient.patientunitstayid FROM diagnosis INNER JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'cerebral subdural hematoma - secondary to anticoagulation' AND strftime('%Y', diagnosis.diagnosistime) < '2100'",
            "gold_answer": "[['004-13216'], ['016-10104']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s mistakes are confined to column selection and the WHERE condition. They selected patientunitstayid instead of uniquepid, omitted DISTINCT, and reversed the comparison operator (\u2018<\u2019 instead of \u2018>=\u2019). These are local, fixable changes within the SELECT and WHERE clauses and do not require restructuring the overall join or query logic.",
            "error_type": "Local: value parsing error"
        },
        "4cd480a8ce675198f964e1d4": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "After getting diagnosed with change in mental status, how many patients were found to have dka within the same month since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'change in mental status' AND strftime('%Y',diagnosis.diagnosistime) >= '2100' ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'dka' AND strftime('%Y',diagnosis.diagnosistime) >= '2100' ) AS T2 WHERE T1.diagnosistime < T2.diagnosistime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.diagnosistime,'start of month')",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid WHERE strftime('%Y-%m',diagnosis.diagnosistime) > '2099-12' AND diagnosis.diagnosisname = 'Deep vein thrombosis (dVT)'",
            "gold_answer": "[['88.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only uses a single JOIN between patient and diagnosis and filters for 'Deep vein thrombosis (dVT)' after a date, completely omitting the two-step logic of first finding patients diagnosed with 'change in mental status' and then checking for 'dka' within the same month. It also uses the wrong diagnosis name, fails to join two diagnosis subqueries, and does not enforce the same-month constraint correctly. This is a fundamental logic and structure mismatch with the intended query.",
            "error_type": "Global: incorrect query logic"
        },
        "d55a6a2b9901cd04ec7a4599": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "What was the first drug that patient 035-1003 was prescribed on the first hospital visit?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '035-1003' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) ORDER BY medication.drugstarttime ASC LIMIT 1",
            "pred_sql": "SELECT medication.drugname FROM patient INNER JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.patientunitstayid = '035-1003' ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "gold_answer": "[['azithromycin']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally misinterprets the patient identifier and hospital visit logic. Instead of finding the first admission for the given uniquepid and then ordering medications by start time, it directly equates patientunitstayid to the string \u2018035-1003\u2019 (which is actually uniquepid) and orders by hospitaladmittime, not drugstarttime. This incorrect join and WHERE clause change the query\u2019s overall structure and intended relationships, so it cannot be fixed by a small tweak in one clause.",
            "error_type": "Global: incorrect join logic"
        },
        "e2e9aeb5439fe4143b0fbcaa": {
            "db_id": "eicu",
            "generator_name": "codes",
            "question": "Find out the number of hospital visits patient 002-13199 had since 1 year ago.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.patienthealthsystemstayid ) FROM patient WHERE patient.uniquepid = '002-13199' AND datetime(patient.hospitaladmittime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT count(patient.patientunitstayid) FROM patient INNER JOIN vitalperiodic ON patient.patientunitstayid = vitalperiodic.patientunitstayid WHERE patient.uniquepid = '002-13199' AND vitalperiodic.observationtime >= date_sub(now(), interval 1 year)",
            "gold_answer": "[['1.0']]",
            "pred_answer": "near \"1\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL not only uses non-SQLite functions (date_sub, now()) but also joins the patient table to vitalperiodic and filters on observationtime instead of hospitaladmittime. It counts patientunitstayid instead of distinct patienthealthsystemstayid. These mistakes span multiple clauses (JOIN, WHERE, aggregation) and fundamentally change the query\u2019s logic, requiring a major restructuring rather than a small localized fix.",
            "error_type": "Global: incorrect join"
        }
    },
    "macsql": {
        "7f8b7f9548aac71092377027": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Count the number of times that patient 028-10451 had oral on this month/14.",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '028-10451' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND intakeoutput.celllabel = 'oral' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '14'",
            "pred_sql": "SELECT COUNT(*) FROM intakeoutput WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '028-10451' ) AND `cellpath` LIKE '%intake%' AND `celllabel` = 'p.o.' AND datetime(`intakeoutputtime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', `intakeoutputtime`) = '14'",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistake is confined to the WHERE clause: it uses the wrong intake label ('p.o.' instead of 'oral') and oversimplifies the patient lookup, but the overall query structure (COUNT, date filtering, table relationships) remains intact. This is a localized error in the data filtering, not a fundamental logic or join structure issue.",
            "error_type": "Local: value parsing error"
        },
        "0815c33a58055c1981683dbf": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was the last medication that patient 030-10753 was prescribed in 02/this year?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-10753' ) ) AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '02' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT T2.`drugname` FROM patient AS T1 INNER JOIN medication AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` WHERE T1.`uniquepid` = '030-10753' AND datetime(T2.`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', T2.`drugstarttime`) = '02' ORDER BY T2.`drugstarttime` DESC LIMIT 1",
            "gold_answer": "[['lorazepam']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s JOIN and table references are correct, but its WHERE clause incorrectly filters for records on the 2nd day of the current month (using start-of-month plus day = '02') instead of filtering for the month '02' of this year. This is an error confined to the temporal filtering logic in the WHERE clause and does not change the overall structure or joins of the query.",
            "error_type": "Local: other-temporal error"
        },
        "c3c29c659b13a485cb286bdd": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When was the last time since 05/2100 that patient 025-11138 was prescribed with potassium chloride er 10 meq tablet,extended release and 15 ml cup : potassium chloride 10 % oral liqd at the same time?",
            "gold_sql": "SELECT T1.drugstarttime FROM ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-11138' ) AND medication.drugname = 'potassium chloride er 10 meq tablet,extended release' AND strftime('%Y-%m',medication.drugstarttime) >= '2100-05' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-11138' ) AND medication.drugname = '15 ml cup : potassium chloride 10 % oral liqd' AND strftime('%Y-%m',medication.drugstarttime) >= '2100-05' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) ORDER BY T1.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(datetime(`drugstarttime`)) FROM ( SELECT `patientunitstayid`, `drugstarttime` FROM medication WHERE `patientunitstayid` IN ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE `uniquepid` = '025-11138' ) AND `drugname` = 'potassium chloride er 10 meq tablet, extended release' AND datetime(`drugstarttime`) >= datetime('2100-05-01 00:00:00') ) AS T1 JOIN ( SELECT `patientunitstayid`, `drugstarttime` FROM medication WHERE `patientunitstayid` IN ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE `uniquepid` = '025-11138' ) AND `drugname` = '15 ml cup : potassium chloride 10 % oral liqd' AND datetime(`drugstarttime`) >= datetime('2100-05-01 00:00:00') ) AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` AND datetime(T1.`drugstarttime`, 'start of day') = datetime(T2.`drugstarttime`, 'start of day')",
            "gold_answer": "[['2100-08-02 07:47:00']]",
            "pred_answer": "ambiguous column name: drugstarttime",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to an ambiguous column reference: in the outer SELECT MAX(datetime(`drugstarttime`)), the column `drugstarttime` is not qualified with a table alias, and both subqueries T1 and T2 define that column. This is a simple column reference error and can be fixed by prefixing the column with the correct alias (e.g., T1.drugstarttime). It does not require reworking the query\u2019s logic or structure.",
            "error_type": "Local: column reference error"
        },
        "9be5c5d50e8d9301923761d5": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Tell me the top five most frequent procedures that patients are given within the same hospital visit after receiving stress ulcer prophylaxis - esomeprazole this year.",
            "gold_sql": "SELECT T3.treatmentname FROM ( SELECT T2.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'stress ulcer prophylaxis - esomeprazole' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmentname, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.treatmentname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT T2.treatmentname FROM treatment AS T2 JOIN ( SELECT DISTINCT T1.patientunitstayid, T1.drugstarttime FROM medication AS T1 WHERE T1.drugname = 'stress ulcer prophylaxis - esomeprazole' AND datetime(T1.drugstarttime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ) AS T3 ON T2.patientunitstayid = T3.patientunitstayid WHERE T2.treatmenttime > T3.drugstarttime GROUP BY T2.treatmentname ORDER BY COUNT(*) DESC LIMIT 5",
            "gold_answer": "[['analgesics - neuraxial analgesics'], ['bronchodilator - beta-agonist'], ['bronchodilator - nebulized'], ['diagnostic ultrasound of heart - transthoracic echocardiography'], ['electrolyte administration - intravenous'], ['electrolyte administration - magnesium'], ['enteral feeds - tube feeding'], ['exploratory laparotomy'], ['glucose - d50'], ['insulin'], ['nicotine patch'], ['nitroglycerin'], ['occupational therapy consult'], ['physical therapy consult'], ['sedative agent - lorazepam'], ['stress ulcer prophylaxis - esomeprazole'], ['therapeutic antibacterials - empiric antibacterial coverage'], ['therapeutic antibacterials - metronidazole'], ['therapeutic antibacterials - quinolone'], ['vte prophylaxis - compression boots'], ['vte prophylaxis - low molecular weight heparin']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally misinterprets the event type by pulling 'stress ulcer prophylaxis \u2013 esomeprazole' from the medication table instead of the treatment table and then joining treatments without the proper year filter. This alters the core logic of which records to consider (medications vs. treatments) and thus yields no results. Fixing this is not a minor syntax change but requires restructuring the query to use the correct table and filters.",
            "error_type": "Global: incorrect table usage"
        },
        "82f6f02a554527d1b7e3eb21": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What does it cost to have darbepoetin alfa?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'treatment' AND cost.eventid IN ( SELECT treatment.treatmentid FROM treatment WHERE treatment.treatmentname = 'darbepoetin alfa' )",
            "pred_sql": "SELECT DISTINCT C.`cost` FROM medication AS M INNER JOIN cost AS C ON M.`patientunitstayid` = C.`patientunitstayid` WHERE M.`drugname` LIKE '%darbepoetin alfa%' AND C.`eventtype` = 'medication'",
            "gold_answer": "[['7.76']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and joins cost on patientunitstayid with eventtype='medication', whereas the correct query must use the treatment table and join cost.eventid to treatment.treatmentid with eventtype='treatment'. This is not a simple fix within one clause but requires changing the table, join key, and event type, altering the overall logic of the query.",
            "error_type": "Global: join error"
        },
        "afb33348ed88ccb48d19b5cb": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "How many days have passed since the first time patient 027-105098 received a lab test of hgb on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',lab.labresulttime) ) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-105098' AND patient.hospitaldischargetime IS NULL ) ) AND lab.labname = 'hgb' ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT JULIANDAY('2100-12-31') - JULIANDAY(( SELECT MIN(`labresulttime`) FROM lab WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '027-105098' AND `hospitaldischargetime` IS NULL ) AND `labname` = 'hgb' )) AS days_passed",
            "gold_answer": "[['29.548']]",
            "pred_answer": "[['28.548']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s error is localized to how the current date is specified and used in the date arithmetic. It uses JULIANDAY('2100-12-31') (midnight) instead of the full timestamp '2100-12-31 23:59:00' as in the ground truth, causing about a one-day offset in the result. This is a value\u2010parsing/time\u2010specification mistake within the SELECT expression and does not alter the overall query structure or logic.",
            "error_type": "Local: other-temporal error"
        },
        "7c6e86c631d2d02c2573b329": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Count the number of patients diagnosed with metastatic lung ca who did not come to the hospital within 2 months this year.",
            "gold_sql": "SELECT ( SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'metastatic lung ca' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 ) - ( SELECT COUNT( DISTINCT T2.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'metastatic lung ca' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 JOIN patient ON T2.uniquepid = patient.uniquepid WHERE T2.diagnosistime < patient.hospitaladmittime AND datetime(patient.hospitaladmittime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND datetime(patient.hospitaladmittime) BETWEEN datetime(T2.diagnosistime) AND datetime(T2.diagnosistime,'+2 month') )",
            "pred_sql": "SELECT COUNT(*) FROM ( SELECT DISTINCT T1.`uniquepid` FROM patient AS T1 INNER JOIN diagnosis AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` WHERE T2.`diagnosisname` = 'metastatic lung ca' ) AS diagnosed_patients WHERE diagnosed_patients.`uniquepid` IN ( SELECT DISTINCT T1.`uniquepid` FROM patient AS T1 WHERE datetime(T1.`hospitaladmittime`) < datetime('2100-12-31 23:59:00', '-2 months') )",
            "gold_answer": "[['8.0']]",
            "pred_answer": "[['14.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the intended logic: it fails to restrict diagnoses to this year, ignores the 2\u2010month window relative to each diagnosis, and compares hospital admission time to a fixed 'now \u2013 2 months' instead of between diagnosis time and diagnosis time + 2 months. It also misuses the IN subquery on the patient table rather than joining diagnosis records for the correct time frame. These errors affect multiple clauses (SELECT, WHERE, JOIN) and require rewriting the overall query structure and logic.",
            "error_type": "Global: incorrect logical structure"
        },
        "81269a4127553519e317b8e4": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When was the last time that patient 006-106828 had per iv flush: wrist r 20 gauge input today?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106828' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND intakeoutput.celllabel = 'per iv flush: wrist r 20 gauge' AND datetime(intakeoutput.intakeoutputtime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(`intakeoutputtime`) FROM intakeoutput WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '006-106828' ) AND `cellpath` LIKE '%intake%' AND `celllabel` = 'per iv flush: wrist r 20 gauge' AND datetime(`intakeoutputtime`, 'start of day') = datetime('2100-12-31 23:59:00', 'start of day', '-0 day')",
            "gold_answer": "[['2100-12-31 11:00:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL simplifies the relationship between the patient and intakeoutput tables by directly equating intakeoutput.patientunitstayid to a single patient.patientunitstayid returned by the subquery on uniquepid. The ground truth SQL correctly handles potential multiple stays by joining through patienthealthsystemstayid and using IN, ensuring all relevant unit stays are considered. This mistake alters the fundamental data relationship and logic (it may miss the correct stay that has today's intakeoutput record), so it cannot be fixed by a minor syntax tweak but requires restructuring the join logic.",
            "error_type": "Global: join relationship error"
        },
        "a47c31b12b805a632b215dea": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was the diagnosis received by patient 027-102287 on the last hospital visit for the first time?",
            "gold_sql": "SELECT diagnosis.diagnosisname FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-102287' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) ORDER BY diagnosis.diagnosistime ASC LIMIT 1",
            "pred_sql": "SELECT `diagnosisname` FROM diagnosis WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '027-102287' AND `hospitaldischargetime` IS NOT NULL ORDER BY `hospitaladmittime` DESC LIMIT 1 )",
            "gold_answer": "[['seizures - status epilepticus']]",
            "pred_answer": "[['encephalopathy - metabolic'], ['encephalopathy - toxic'], ['metabolic acidosis - lactic acidosis'], ['seizures - generalized tonic -clonic'], ['seizures - status epilepticus'], ['sinus tachycardia']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the intermediate step of identifying the hospital-level stay (patienthealthsystemstayid) and instead directly uses a single patientunitstayid, thereby failing to capture all relevant unit stays within the last hospital visit. This is not a simple typo or missing alias but a fundamental change to the way tables are related and the overall logic of the query. Fixing this requires restructuring the query to include the patienthealthsystemstayid subquery and then deriving all patientunitstayid values from it, which is beyond a localized clause adjustment.",
            "error_type": "Global: incorrect join logic"
        },
        "0ec4d0ab8e32f4bcc5d9151e": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What is the minimum total hospital cost that involved oxygen therapy (< 40%) - 30-40% since 2100?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'oxygen therapy (< 40%) - 30-40%' ) ) AND strftime('%Y',cost.chargetime) >= '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MIN(total_cost) AS minimum_total_cost FROM ( SELECT T1.patienthealthsystemstayid, SUM(T2.cost) AS total_cost FROM ( SELECT DISTINCT T1.patienthealthsystemstayid FROM treatment AS T1 JOIN patient AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.treatmentname LIKE '%oxygen therapy%' AND T1.treatmentname LIKE '%30-40%' AND datetime(T1.treatmenttime) >= datetime('2100-01-01 00:00:00') ) AS T1 JOIN cost AS T2 ON T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T1.patienthealthsystemstayid ) AS total_costs",
            "gold_answer": "[['486.69']]",
            "pred_answer": "no such column: T1.patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The failure occurs because the subquery labels the treatment table as T1 and then tries to select T1.patienthealthsystemstayid, but patienthealthsystemstayid is a column of the patient table (aliased T2), not of treatment. This is a straightforward column reference mistake in a single clause and can be fixed by selecting T2.patienthealthsystemstayid. No overall query logic or structure needs changing, so it\u2019s a Local error.",
            "error_type": "Local: column-reference error"
        },
        "e132de5413f8581089ebc590": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Could you tell me the maximum total cost in a hospital where lorazepam 2 mg/1 ml 1 ml inj is used since 1 year ago?",
            "gold_sql": "SELECT MAX(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = 'lorazepam 2 mg/1 ml 1 ml inj' ) ) AND datetime(cost.chargetime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MAX(total_cost) AS max_total_cost FROM ( SELECT T2.hospitalid, SUM(T3.cost) AS total_cost FROM patient AS T2 JOIN cost AS T3 ON T2.patienthealthsystemstayid = T3.patienthealthsystemstayid WHERE T2.hospitalid IN ( SELECT DISTINCT T2.hospitalid FROM medication AS T1 JOIN patient AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.drugname = 'lorazepam 2 mg/1 ml 1 ml inj' AND datetime(T1.drugstarttime) >= datetime('2100-12-31 23:59:00', '-1 year') ) GROUP BY T2.hospitalid ) AS hospital_costs",
            "gold_answer": "[['10138.72']]",
            "pred_answer": "[['105838.2']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic by grouping costs at the hospital level rather than per patient health system stay. The ground truth sums costs per patient stay (patienthealthsystemstayid) and then takes the maximum of those sums. The predicted version joins and groups by hospitalid, summing costs across all stays in each hospital, and then takes the maximum, which is a different aggregation scope. This is not a localized syntax or reference mistake but a structural error that alters the intended meaning of the query.",
            "error_type": "Global: incorrect grouping/aggregation"
        },
        "f7fbfcef8db77d835ccb2925": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Retrieve the top four most frequent diagnoses of patients with age in their 60 or above since 1 year ago.",
            "gold_sql": "SELECT T1.diagnosisname FROM ( SELECT diagnosis.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age >= 60 ) AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY diagnosis.diagnosisname ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT `diagnosisname` FROM ( SELECT D.`diagnosisname`, COUNT(*) AS frequency FROM ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE CAST(`age` AS INTEGER) >= 60 ) AS P INNER JOIN ( SELECT DISTINCT `patientunitstayid`, `diagnosisname` FROM diagnosis WHERE datetime(`diagnosistime`) >= datetime('2100-12-31 23:59:00', '-1 year') ) AS D ON P.`patientunitstayid` = D.`patientunitstayid` GROUP BY D.`diagnosisname` ORDER BY frequency DESC LIMIT 4 ) AS TopDiagnoses",
            "gold_answer": "[['acute renal failure'], ['acute respiratory failure'], ['congestive heart failure'], ['hypoxemia']]",
            "pred_answer": "[['acute renal failure'], ['acute respiratory failure'], ['congestive heart failure'], ['pneumonia']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the intended aggregation logic by introducing DISTINCT on diagnosis records per patient before counting. This causes it to count the number of patients with each diagnosis rather than the total number of diagnosis events, and it also uses LIMIT instead of a dense rank to handle ties. Fixing this requires restructuring the aggregation and windowing logic, which is beyond a simple one-clause correction.",
            "error_type": "Global: flawed aggregation logic"
        },
        "f9e17f8c9c58b6ed7aeb9d39": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When did patient 010-10317 get in 02/this year a lab test for the first time?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10317' ) ) AND datetime(lab.labresulttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',lab.labresulttime) = '02' ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(`labresulttime`) AS first_lab_test_time FROM lab WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '010-10317' ) AND datetime(`labresulttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', `labresulttime`) = '02'",
            "gold_answer": "[['2100-02-01 03:49:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistake is confined to the WHERE clause date filter. It uses `datetime(...,'start of month')` and `strftime('%d') = '02'` (i.e. day = 02 of the current month) instead of filtering for month = '02' of this year. The overall query structure (finding the first lab test for the patient) remains correct; only the temporal condition is wrong. This is a localized error in the date\u2010filtering logic.",
            "error_type": "Local: other-temporal error"
        },
        "fb5a2c37faa8aebf3fbe4240": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was patient 004-15751's first output time of urine on 04/11/this year?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-15751' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '04-11' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(`intakeoutputtime`) AS first_output_time FROM intakeoutput WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '004-15751' ) AND datetime(`intakeoutputtime`, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND strftime('%m-%d', `intakeoutputtime`) = '04-11' AND `cellpath` LIKE '%output%' AND `celllabel` LIKE '%urine%'",
            "gold_answer": "[['2100-04-11 16:00:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL simplifies the patient lookup by directly matching patientunitstayid to the one returned for uniquepid, rather than following the two\u2010step link via patienthealthsystemstayid as in the ground truth. This alters the intended relationship across unit stays and can miss the correct intakeoutput records. The error spans the core join logic (choice of key) and cannot be fixed by a minor tweak in a single clause\u2014it requires restructuring the patient\u2192unitstay link. Therefore, it's a global error.",
            "error_type": "Global: incorrect join key"
        },
        "1bbfae72fa70ce468d41d6dc": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What is the maximum total hospital expense that includes dka in 2100?",
            "gold_sql": "SELECT MAX(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'dka' ) ) AND strftime('%Y',cost.chargetime) = '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MAX(total_expense) AS max_total_expense FROM ( SELECT T1.patienthealthsystemstayid, SUM(T2.cost) AS total_expense FROM ( SELECT DISTINCT patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname LIKE '%dka%' AND strftime('%Y', patient.hospitaladmittime) = '2100' ) AS T1 JOIN cost AS T2 ON T1.patienthealthsystemstayid = T2.patienthealthsystemstayid WHERE T2.eventtype IN ('diagnosis', 'treatment', 'lab', 'medication') GROUP BY T1.patienthealthsystemstayid )",
            "gold_answer": "[['6005.92']]",
            "pred_answer": "[['42041.44']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query logic in several ways. First, it filters on strftime('%Y', patient.hospitaladmittime) = '2100' instead of filtering cost records by strftime('%Y', cost.chargetime) = '2100'. Second, it restricts cost.eventtype to a subset ('diagnosis','treatment','lab','medication') rather than summing all cost records for each stay as intended. These changes span multiple clauses (FROM, JOIN, WHERE) and alter the set of cost records being aggregated, producing an entirely different result. Fixing this requires restructuring the query logic rather than a minor local correction.",
            "error_type": "Global: incorrect date filter and cost aggregation logic"
        },
        "8c1b4dadcbd7b9dfc08e81bb": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When did patient 006-102786 have an input for the first time on 12/27/this year?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-102786' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '12-27' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(`intakeoutputtime`) AS first_intake_time FROM intakeoutput WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '006-102786' ) AND datetime(`intakeoutputtime`, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND strftime('%m-%d', `intakeoutputtime`) = '12-27' AND `cellpath` LIKE '%intake%'",
            "gold_answer": "[['2100-12-27 00:00:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters on a single patientunitstayid returned by \u2018SELECT patientunitstayid FROM patient WHERE uniquepid = \u2026\u2019, whereas the correct query needs to consider all unit stays associated with that patienthealthsystemstayid. This is not a minor syntax mistake but a faulty join/relationship logic that changes which rows are examined, causing the query to return no results. Hence, it\u2019s a global error in the join/relationship.",
            "error_type": "Global: join relationship error"
        },
        "254f0f752d2b8c107c1f3727": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was the first time that patient 027-101846 had the minimum amount of o2 sat (%) on the first hospital visit?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101846' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'o2 sat (%)' ORDER BY lab.labresult ASC, lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(observationtime) AS first_min_sao2_time FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '027-101846' AND hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '027-101846' ) ) AND sao2 = ( SELECT MIN(sao2) FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '027-101846' AND hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '027-101846' ) ) )",
            "gold_answer": "[['2100-09-08 16:25:00']]",
            "pred_answer": "[['2100-09-10 19:26:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the vitalperiodic table and its sao2 and observationtime columns, whereas the question and ground truth refer explicitly to the lab table with labname = 'o2 sat (%)' and labresulttime. This is not a minor syntax or column name mistake but a fundamental change in data source and logic, altering the intended meaning of the query.",
            "error_type": "Global: wrong table/field selection"
        },
        "ca898dcba71dbcfe723e83b0": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "How many patients had a skin test administered?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT microlab.patientunitstayid FROM microlab WHERE microlab.culturesite = 'skin' )",
            "pred_sql": "SELECT COUNT(DISTINCT `patientunitstayid`) AS num_patients_with_skin_test FROM lab WHERE `labname` LIKE '%skin%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the lab table and filters on labname LIKE '%skin%', whereas the correct logic requires querying the microlab table and filtering on culturesite = 'skin'. This is not a simple typo or local clause mistake but a fundamental misuse of the wrong table, altering the query\u2019s overall logic.",
            "error_type": "Global: incorrect table selection"
        },
        "d9e859cc9f043fddabe6d778": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "How many days have elapsed since the first time a procedure was performed on patient 027-100843 on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100843' AND patient.hospitaldischargetime IS NULL ) ) ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT JULIANDAY('2100-12-31 23:59:00') - JULIANDAY( (SELECT MIN(`treatmenttime`) FROM treatment WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '027-100843' AND `hospitaldischargetime` IS NULL )) ) AS days_elapsed",
            "gold_answer": "[['34.919']]",
            "pred_answer": "[['7.621']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes how the patient\u2019s current admission is identified and how the first procedure time is retrieved. The ground truth SQL first finds the patient\u2019s current hospital admission (via patienthealthsystemstayid) and then filters all treatment records for any ICU stay (patientunitstayid) within that admission, ordering by treatment time to get the very first procedure. The predicted SQL, however, simply selects a single patientunitstayid row (without considering the patienthealthsystemstayid join) and then takes MIN(treatmenttime) for that one unitstay. This alters the intended relationship between hospital admissions and ICU stays and thus the resulting treatment time. Correcting this isn\u2019t a small tweak in one clause but requires restoring the proper sub-query structure (or join) to bind to the correct admission, so it\u2019s a global logic/structure error.",
            "error_type": "Global: incorrect join error"
        },
        "a9c37d707816110b60aebbd5": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Among patients who are diagnosed with pulmonary aspiration - large particulate aspirate , what are the top three most common diagnoses that followed within the same month?",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'pulmonary aspiration - large particulate aspirate' ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.diagnosistime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.diagnosistime,'start of month') GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT `diagnosisname` FROM ( SELECT T2.`diagnosisname`, COUNT(*) AS `count` FROM diagnosis AS T1 JOIN diagnosis AS T2 ON T1.`patientunitstayid` = T2.`patientunitstayid` AND datetime(T1.`diagnosistime`, 'start of month') = datetime(T2.`diagnosistime`, 'start of month') WHERE T1.`diagnosisname` = 'pulmonary aspiration - large particulate aspirate' AND T2.`diagnosisname` <> 'pulmonary aspiration - large particulate aspirate' GROUP BY T2.`diagnosisname` ORDER BY `count` DESC LIMIT 3 )",
            "gold_answer": "[['acute respiratory failure - due to inability to clear secretions'], ['pulmonary aspiration - large particulate aspirate']]",
            "pred_answer": "[['acute respiratory failure - due to inability to clear secretions']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins diagnosis records on patientunitstayid rather than on the patient\u2019s unique ID, which changes the scope of follow-on diagnoses (it limits results to the same ICU stay instead of the same patient). This is a structural mistake in how tables are related and affects the overall logic. It also excludes the original diagnosis name, which deviates from the ground truth behavior, but the primary flaw is the incorrect join key that fundamentally alters which events are matched.",
            "error_type": "Global: join-key error"
        },
        "245d45258d03fb5864a40c62": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What was the name of the last medication that was prescribed to patient 022-100938 in 02/this year?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-100938' ) ) AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '02' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT `drugname` FROM medication WHERE `patientunitstayid` = ( SELECT DISTINCT `patientunitstayid` FROM patient WHERE `uniquepid` = '022-100938' ) AND datetime(`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', `drugstarttime`) = '02' ORDER BY `drugstarttime` DESC LIMIT 1",
            "gold_answer": "[['synthroid']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query misapplies the temporal filter in the WHERE clause: it uses `datetime(drugstarttime, 'start of month') = ...` and `strftime('%d', drugstarttime) = '02'` (day = 02) instead of checking month = '02' relative to the start of the year. This is a mistake localized to the date\u2010filtering logic and does not require restructuring the joins or overall query flow. Thus it is a local error in the temporal condition.",
            "error_type": "Local: other-temporal error"
        },
        "9768a4a4b907cf6434f602e7": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "When was the first time patient 007-10152 was prescribed medication via the feeding tube route in 05/this year?",
            "gold_sql": "SELECT medication.drugstarttime FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10152' ) ) AND medication.routeadmin = 'feeding tube' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m',medication.drugstarttime) = '05' ORDER BY medication.drugstarttime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(`drugstarttime`) AS first_feeding_tube_medication_time FROM medication WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '007-10152' ) AND `routeadmin` = 'feeding tube' AND datetime(`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND strftime('%m', `drugstarttime`) = '05'",
            "gold_answer": "[['2100-05-09 00:43:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s overall structure matches the intent\u2014filter by patient, route, month, and take the MIN date\u2014but it misuses the datetime modifier in the WHERE clause: it applies 'start of month' to drugstarttime and compares it to the 'start of year' of the current date, so no rows satisfy the condition. This is a localized mistake in a single condition rather than a flaw in the join logic or overall structure.",
            "error_type": "Local: other-temporal error"
        },
        "17aff9f53536f4057a93b06c": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "This year, how many patients received sodium chloride 0.9% 1,000 ml bag within the same hospital visit after being diagnosed with hemorrhage?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hemorrhage' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'sodium chloride 0.9% 1,000 ml bag' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT T3.uniquepid) AS patient_count FROM patient AS T3 INNER JOIN ( SELECT DISTINCT T1.patientunitstayid FROM diagnosis AS T1 WHERE T1.diagnosisname LIKE '%hemorrhage%' AND datetime(T1.diagnosistime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ) AS D ON T3.patientunitstayid = D.patientunitstayid INNER JOIN ( SELECT DISTINCT T2.patientunitstayid FROM medication AS T2 WHERE T2.drugname LIKE '%sodium chloride 0.9% 1,000 ml bag%' AND datetime(T2.drugstarttime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ) AS M ON T3.patientunitstayid = M.patientunitstayid",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted query omits the critical temporal condition (ensuring the hemorrhage diagnosis occurs before the sodium chloride administration) and uses patientunitstayid to join events instead of patienthealthsystemstayid to enforce the same hospital visit. By failing to enforce event ordering and the correct visit identifier, the overall query logic is fundamentally altered, leading to incorrect results. This error spans multiple clauses (JOIN conditions and WHERE logic) and requires restructuring the query to include the temporal filter and correct join key.",
            "error_type": "Global: join and temporal logic error"
        },
        "dd2fff7121aa317a158ef08e": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What are the ways to consume 150 ml flex cont : levofloxacin in d5w 5 mg/ml iv soln?",
            "gold_sql": "SELECT DISTINCT medication.routeadmin FROM medication WHERE medication.drugname = '150 ml flex cont : levofloxacin in d5w 5 mg/ml iv soln'",
            "pred_sql": "SELECT DISTINCT `routeadmin` FROM medication WHERE `drugname` = 'flex cont : levofloxacin in d5w 5 mg/ml iv soln' AND `dosage` LIKE '150%'",
            "gold_answer": "[['intravenous']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL only differs in the WHERE clause: it splits the drug identification into drugname and dosage rather than matching the full drugname string. This incorrect filter condition does not require restructuring the query\u2014only fixing the WHERE clause\u2014so it is a localized error.",
            "error_type": "Local: incorrect WHERE filter"
        },
        "e172b906c0bf5c99f8e7c2db": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Since patient 022-1011's admission to the icu, how many days have passed?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '022-1011' AND patient.unitdischargetime IS NULL",
            "pred_sql": "SELECT julianday('2100-12-31') - julianday( (SELECT `unitadmittime` FROM patient WHERE `uniquepid` = '022-1011') ) AS days_passed",
            "gold_answer": "[['32.806']]",
            "pred_answer": "[['31.806']]",
            "is_correct": false,
            "reasoning": "The predicted SQL diverges from the ground truth only in how it handles the date literal and omits the explicit filter on unitdischargetime. Instead of using the prescribed fixed datetime '2100-12-31 23:59:00' and strftime('%J', \u2026) to compute the Julian day difference, it uses julianday('2100-12-31'), which refers to midnight of that day. This single change in the datetime literal shifts the result by approximately one day (31.806 vs. 32.806) but does not alter the query\u2019s overall structure or joins. All other logic\u2014selecting admission time and calculating a difference\u2014remains intact. Therefore, this is a localized date/time formatting error, fixable by adjusting the literal to include the time component or using strftime as specified.",
            "error_type": "Local: other-temporal error"
        },
        "c3b217adda54fe59d3548b45": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "In patients who had the enteral feeds - nutritional supplement this year, what are the four most common diagnoses that followed within the same month?",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'enteral feeds - nutritional supplement' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.diagnosistime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.diagnosistime,'start of month') GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT T2.diagnosisname FROM diagnosis AS T2 JOIN ( SELECT DISTINCT T1.patientunitstayid, T1.treatmenttime FROM treatment AS T1 WHERE T1.treatmentname = 'enteral feeds - nutritional supplement' AND datetime(T1.treatmenttime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ) AS T3 ON T2.patientunitstayid = T3.patientunitstayid AND datetime(T2.diagnosistime, 'start of month') = datetime(T3.treatmenttime, 'start of month') GROUP BY T2.diagnosisname ORDER BY COUNT(*) DESC LIMIT 4",
            "gold_answer": "[['acute respiratory distress'], ['anemia'], ['chronic respiratory failure'], ['copd'], ['dysphagia'], ['encephalopathy - post-anoxic'], ['esophagitis - regurgitant'], ['hyperglycemia'], ['hyperlipidemia'], ['neuropathy - polyneuropathy'], ['obesity - morbid'], ['pneumonia'], ['seizures'], ['sepsis']]",
            "pred_answer": "[['chronic respiratory failure'], ['hyperglycemia'], ['obesity - morbid'], ['sepsis']]",
            "is_correct": false,
            "reasoning": "The predicted query omits the crucial condition that the diagnosis must occur after the enteral feed treatment (T1.treatmenttime < T2.diagnosistime). It also joins on patientunitstayid instead of uniquepid, altering the patient grouping logic. These omissions fundamentally change which diagnoses are counted and require restructuring the query logic, not just a minor fix in one clause.",
            "error_type": "Global: incorrect join logic"
        },
        "71e4c636dcade292123624ea": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "What is the number of patients in ward 505 since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.wardid = 505 AND strftime('%Y',patient.unitadmittime) >= '2100'",
            "pred_sql": "SELECT COUNT(*) FROM ( SELECT DISTINCT `uniquepid` FROM `patient` WHERE `wardid` = 505 AND datetime(`hospitaladmittime`) >= datetime('2100-01-01 00:00:00') ) AS unique_patients",
            "gold_answer": "[['9.0']]",
            "pred_answer": "[['12.0']]",
            "is_correct": false,
            "reasoning": "The predicted query filters on hospitaladmittime instead of unitadmittime (the date of ICU/ward admission) as required by the question. This is a local mistake in the WHERE clause\u2014using the wrong date column\u2014without altering the overall structure or logic of the query.",
            "error_type": "Local: column reference error"
        },
        "f6ec755f6e8667eca464825c": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Get me patient 006-100471's total ivpb input amount.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-100471' ) ) AND intakeoutput.celllabel = 'ivpb' AND intakeoutput.cellpath LIKE '%intake%'",
            "pred_sql": "SELECT SUM(`cellvaluenumeric`) AS total_ivpb_input FROM intakeoutput WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '006-100471' ) AND `cellpath` LIKE '%ivpb%'",
            "gold_answer": "[['4865.0']]",
            "pred_answer": "[['700.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL restricts to a single patientunitstayid (from uniquepid) rather than summing across all unit stays within the same health system stay, and it omits the required celllabel = 'ivpb' and intake filter (cellpath LIKE '%intake%'). These omissions change the fundamental logic of the query and require restructuring the filtering and subquery logic, making this a global error.",
            "error_type": "Global: incorrect filtering and join logic"
        },
        "862e1b50da063e296890ae8c": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Is the bedside glucose level of patient 022-105102 last measured on the last hospital visit greater than the first measurement on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-105102' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'bedside glucose' ORDER BY lab.labresulttime DESC LIMIT 1 ) > ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-105102' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'bedside glucose' ORDER BY lab.labresulttime ASC LIMIT 1 )",
            "pred_sql": "WITH GlucoseMeasurements AS ( SELECT `labresult`, `labresulttime` FROM `lab` WHERE `patientunitstayid` IN ( SELECT `patientunitstayid` FROM `patient` WHERE `patienthealthsystemstayid` = ( SELECT `patienthealthsystemstayid` FROM `patient` WHERE `uniquepid` = '022-105102' AND `hospitaldischargetime` IS NOT NULL ORDER BY `hospitaladmittime` DESC LIMIT 1 ) ) AND `labname` = 'glucose' ORDER BY `labresulttime` ) SELECT CASE WHEN (SELECT `labresult` FROM GlucoseMeasurements ORDER BY `labresulttime` DESC LIMIT 1) > (SELECT `labresult` FROM GlucoseMeasurements ORDER BY `labresulttime` ASC LIMIT 1) THEN 'True' ELSE 'False' END AS `IsLastGreaterThanFirst`",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['True']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses labname = 'glucose' instead of the required labname = 'bedside glucose'. This is a local issue with the filter condition (wrong literal/value) and does not require restructuring the query\u2019s logic or joins.",
            "error_type": "Local: value parsing error"
        },
        "3f78a402c7c8d638b4a4de3c": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Count the number of times patient 016-10197 received volume (ml)-levofloxacin (levaquin) ivpb 750 mg on last month/09.",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10197' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND intakeoutput.celllabel = 'volume (ml)-levofloxacin (levaquin) ivpb 750 mg' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '09'",
            "pred_sql": "SELECT COUNT(*) FROM medication WHERE `patientunitstayid` = ( SELECT `patientunitstayid` FROM patient WHERE `uniquepid` = '016-10197' ) AND `drugname` = 'volume (ml)-levofloxacin (levaquin) ivpb 750 mg' AND datetime(`drugstarttime`, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-1 month') AND strftime('%d', `drugstarttime`) = '09'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL pulls from the medication table using drugname and drugstarttime, whereas the question and ground truth require using the intakeoutput table with celllabel and intakeoutputtime filtered by cellpath LIKE '%intake%'. This is not a simple column or syntax fix but a fundamental misuse of the table and join logic, altering the query\u2019s overall intent. Therefore it\u2019s a Global error.",
            "error_type": "Global: incorrect table usage"
        },
        "83bdb7920140393376346beb": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "How many patients were 1 ml crtrdg-ndl : lorazepam 2 mg/ml ij soln prescribed within the same hospital visit after undergoing vasopressors treatment?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'vasopressors' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = '1 ml crtrdg-ndl : lorazepam 2 mg/ml ij soln' ) AS T2 WHERE T1.treatmenttime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT P.uniquepid) AS num_patients FROM patient AS P JOIN ( SELECT DISTINCT T1.patientunitstayid FROM treatment AS T1 WHERE T1.treatmentname LIKE '%vasopressors%' ) AS V ON P.patientunitstayid = V.patientunitstayid JOIN ( SELECT DISTINCT T2.patientunitstayid FROM medication AS T2 WHERE T2.drugname = '1 ml crtrdg-ndl : lorazepam 2 mg/ml ij soln' ) AS M ON P.patientunitstayid = M.patientunitstayid WHERE P.patienthealthsystemstayid = ( SELECT patienthealthsystemstayid FROM patient WHERE patientunitstayid = V.patientunitstayid LIMIT 1 )",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL drops the critical temporal condition (vasopressors treatment before lorazepam prescription) and, more fundamentally, joins the two events on patientunitstayid rather than patienthealthsystemstayid as required by \u201csame hospital visit.\u201d This wrong join key alters the overall logic (events may be linked within the same ICU stay rather than the broader hospital stay) and thus requires restructuring the query. Therefore, this is a global error.",
            "error_type": "Global: incorrect join relationship"
        },
        "e15ae33a051b2d3894c4e0e7": {
            "db_id": "eicu",
            "generator_name": "macsql",
            "question": "Can you provide the top three most frequent lab tests that within the same month took place after patients had antihypertensive drug - labetalol?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'antihypertensive drug - labetalol' ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.labresulttime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.labresulttime,'start of month') GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT T3.labname FROM ( SELECT T2.labname, COUNT(*) AS frequency FROM lab AS T2 JOIN medication AS T1 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.drugname LIKE '%labetalol%' AND datetime(T2.labresulttime, 'start of month') = datetime(T1.drugstarttime, 'start of month') AND T2.labresulttime > T1.drugstarttime GROUP BY T2.labname ) AS T3 ORDER BY T3.frequency DESC LIMIT 3",
            "gold_answer": "[['anion gap'], ['bedside glucose'], ['bicarbonate'], ['bun'], ['calcium'], ['chloride'], ['creatinine'], ['fio2'], ['glucose'], ['hct'], ['hgb'], ['lpm o2'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose'], ['glucose'], ['potassium']]",
            "is_correct": false,
            "reasoning": "The predicted query is joining the lab table to the medication table and filtering on medication.drugname rather than the treatment table\u2019s treatmentname = 'antihypertensive drug - labetalol'. This is a mistaken table/column reference (using medication.drugname and drugstarttime instead of treatment.treatmentname and treatmenttime). It can be fixed by swapping medication for treatment and using the correct columns without restructuring the rest of the query logic. Hence it\u2019s a local error.",
            "error_type": "Local: table reference error"
        }
    },
    "dinsql": {
        "019a52f54e374bbedbe7d39e": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Get me the top four most frequent lab tests that patients had within the same hospital visit after receiving antihypertensive drug - nicardipine.",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'antihypertensive drug - nicardipine' ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime, patient.patienthealthsystemstayid FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.labresulttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH NicardipinePatients AS ( SELECT DISTINCT patientunitstayid, patienthealthsystemstayid FROM medication WHERE drugname LIKE '%nicardipine%' ), LabTestsAfterNicardipine AS ( SELECT lab.labname FROM lab INNER JOIN NicardipinePatients ON lab.patientunitstayid = NicardipinePatients.patientunitstayid INNER JOIN medication ON lab.patientunitstayid = medication.patientunitstayid WHERE medication.drugname LIKE '%nicardipine%' AND datetime(lab.labresulttime) > datetime(medication.drugstarttime) AND lab.patientunitstayid = medication.patientunitstayid AND lab.patientunitstayid IN ( SELECT patientunitstayid FROM patient WHERE patienthealthsystemstayid = NicardipinePatients.patienthealthsystemstayid ) ), RankedLabTests AS ( SELECT labname, COUNT(*) AS frequency FROM LabTestsAfterNicardipine GROUP BY labname ORDER BY frequency DESC LIMIT 4 ) SELECT labname FROM RankedLabTests",
            "gold_answer": "[['bedside glucose'], ['bicarbonate'], ['chloride'], ['creatinine'], ['potassium'], ['sodium']]",
            "pred_answer": "no such column: patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL fails with \u201cno such column: patienthealthsystemstayid\u201d because the subquery references NicardipinePatients.patienthealthsystemstayid without bringing that CTE into scope or qualifying the column properly. This is a localized column reference error in the WHERE clause and does not reflect a deeper logical or structural misunderstanding of the overall query.",
            "error_type": "Local: table/column reference error"
        },
        "6a23b38247953991624db3b6": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "How much does patient 013-10117 change in anion gap second measured on the last hospital visit compared to the first value measured on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10117' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'anion gap' ORDER BY lab.labresulttime ASC LIMIT 1 OFFSET 1 ) - ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10117' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'anion gap' ORDER BY lab.labresulttime ASC LIMIT 1 )",
            "pred_sql": "WITH LastHospitalVisit AS ( SELECT patientunitstayid FROM patient WHERE uniquepid = '013-10117' AND hospitaldischargetime IS NOT NULL ORDER BY hospitaladmittime DESC LIMIT 1 ), AnionGapMeasurements AS ( SELECT labresult FROM lab WHERE patientunitstayid = (SELECT patientunitstayid FROM LastHospitalVisit) AND labname = 'anion gap' ORDER BY labresulttime LIMIT 2 ) SELECT MAX(labresult) - MIN(labresult) AS anion_gap_change FROM AnionGapMeasurements",
            "gold_answer": "[['-1.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly identifies the last hospital visit and retrieves the first two anion gap measurements, but then uses MAX(labresult) \u2013 MIN(labresult), which calculates an absolute difference rather than the directed change (second minus first). This mistake is confined to the arithmetic expression in the SELECT clause and does not require restructuring joins or subqueries. Therefore, it is a localized calculation error.",
            "error_type": "Local: wrong-aggregation error"
        },
        "c5519431b0d7603182fa4334": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Find out how many patients were discharged from the hospital since 1 year ago.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NOT NULL AND datetime(patient.hospitaldischargetime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT COUNT(DISTINCT patienthealthsystemstayid) FROM patient WHERE datetime(hospitaldischargetime) >= datetime('2100-12-31 23:59:00', '-1 year')",
            "gold_answer": "[['1367.0']]",
            "pred_answer": "[['1519.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts DISTINCT patienthealthsystemstayid instead of DISTINCT patient.uniquepid, thus counting stays rather than unique patients. It also omits the explicit IS NOT NULL check, but the main issue is the wrong column reference. This is a localized mistake in the SELECT clause and WHERE filter, and does not affect the overall query structure or logic flow.",
            "error_type": "Local: table/column reference error"
        },
        "ef39f3af3855b7761d5db7c9": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What's the count of patients who left the hospital in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NOT NULL AND strftime('%Y',patient.hospitaldischargetime) = '2100'",
            "pred_sql": "SELECT COUNT(DISTINCT patienthealthsystemstayid) FROM patient WHERE strftime('%Y', hospitaldischargetime) = '2100'",
            "gold_answer": "[['1367.0']]",
            "pred_answer": "[['1519.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses COUNT(DISTINCT patienthealthsystemstayid) instead of COUNT(DISTINCT patient.uniquepid). This is a column reference error (wrong column used for counting patients). The overall query structure and logic (filtering by year) remains correct, only the column in the SELECT is incorrect, so it is a Local error.",
            "error_type": "Local: column-reference error"
        },
        "ac1820fc6650cabcf6d961c7": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "When did patient 003-10464 get his/her last prescription of albuterol/ipratropium neb 3ml on the first hospital visit?",
            "gold_sql": "SELECT medication.drugstarttime FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-10464' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND medication.drugname = 'albuterol/ipratropium neb 3ml' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(T2.drugstoptime) FROM patient AS T1 JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '003-10464' AND T2.drugname = 'albuterol/ipratropium neb 3ml' AND T1.hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '003-10464' AND hospitaldischargetime IS NOT NULL )",
            "gold_answer": "[['2100-11-11 18:35:00']]",
            "pred_answer": "[['2100-11-13 17:22:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in the SELECT clause: it aggregates MAX(drugstoptime) instead of ordering by and selecting the latest drugstarttime. The join logic, patient filtering, and first-visit restriction are structurally correct. This is a localized mistake in column selection, not a change to the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "9e616b0295d51d1aa25f7b71": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Count the number of patients for whom dexmedetomidine 200 mcg in 50 ml ns was prescribed within the same hospital visit post their diagnosis of acute coronary syndrome - acute myocardial infarction (no st elevation) this year.",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (no st elevation)' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'dexmedetomidine 200 mcg in 50 ml ns' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT T1.uniquepid) FROM patient AS T1 JOIN diagnosis AS T2 ON T1.patientunitstayid = T2.patientunitstayid JOIN medication AS T3 ON T1.patientunitstayid = T3.patientunitstayid WHERE T2.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (no st elevation)' AND T3.drugname = 'dexmedetomidine 200 mcg in 50 ml ns' AND strftime('%Y', T2.diagnosistime) = '2100' AND T1.patienthealthsystemstayid = T3.patienthealthsystemstayid AND datetime(T3.drugstarttime) > datetime(T2.diagnosistime)",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: T3.patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL references T3.patienthealthsystemstayid, but the medication table does not have a patienthealthsystemstayid column (it only has patientunitstayid). This is a column reference error localized to the WHERE clause, and can be fixed by using the correct column (patientunitstayid) or joining on the correct key without altering the overall query structure.",
            "error_type": "Local: table/column reference error"
        },
        "fd736d3c511756e9cf8ead74": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Can you give me patient 031-10598's yearly average respiratory rate since 164 days ago?",
            "gold_sql": "SELECT AVG(vitalperiodic.respiration) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10598' ) ) AND vitalperiodic.respiration IS NOT NULL AND datetime(vitalperiodic.observationtime) >= datetime('2100-12-31 23:59:00','-164 day') GROUP BY strftime('%Y',vitalperiodic.observationtime)",
            "pred_sql": "SELECT AVG(respiration) AS average_respiratory_rate FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '031-10598' ) AND datetime(observationtime) >= datetime('2100-12-31 23:59:00', '-164 days') GROUP BY strftime('%Y', observationtime)",
            "gold_answer": "[['17.138']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a single equality filter on patientunitstayid directly from the patient table (SELECT patientunitstayid FROM patient WHERE uniquepid='031-10598'), whereas the correct query must first map uniquepid to a patienthealthsystemstayid and then find all related patientunitstayid values. This is not a minor syntax or column error but a fundamental flaw in how the patient and vitalperiodic tables are related, altering the intended logic and resulting in empty results.",
            "error_type": "Global: incorrect join/filter logic"
        },
        "35cca7494423f9c053a7198c": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Tell me the top three diagnoses with the highest 3-month mortality rate.",
            "gold_sql": "SELECT T4.diagnosisname FROM ( SELECT T3.diagnosisname, DENSE_RANK() OVER ( ORDER BY T3.C2 ASC ) AS C2 FROM ( SELECT T2.diagnosisname, AVG(C1) AS C2 FROM ( SELECT T1.diagnosisname, ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) as C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid, diagnosis.diagnosisname HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid ) AS T2 GROUP BY T2.diagnosisname ) AS T3 ) AS T4 WHERE T4.C2 <= 3",
            "pred_sql": "WITH FirstDiagnosis AS ( SELECT patientunitstayid, diagnosisname, MIN(diagnosistime) AS first_diagnosistime FROM diagnosis GROUP BY patientunitstayid, diagnosisname ), MortalityWithin3Months AS ( SELECT FD.diagnosisname, COUNT(DISTINCT P.patientunitstayid) AS total_patients, SUM(CASE WHEN P.hospitaldischargestatus = 'expired' AND datetime(P.hospitaldischargetime) <= datetime(FD.first_diagnosistime, '+91.25 days') THEN 1 ELSE 0 END) AS deaths_within_3_months FROM FirstDiagnosis FD JOIN patient P ON FD.patientunitstayid = P.patientunitstayid GROUP BY FD.diagnosisname ), MortalityRate AS ( SELECT diagnosisname, (CAST(deaths_within_3_months AS FLOAT) / total_patients) AS mortality_rate FROM MortalityWithin3Months ) SELECT diagnosisname FROM MortalityRate ORDER BY mortality_rate DESC LIMIT 3",
            "gold_answer": "[['acute copd exacerbation - with baseline hypoxemia'], ['anuria'], ['ards - pulmonary etiology'], ['arterial thromboembolism'], ['arterial thromboembolism - kidney'], ['av block - pacemaker in place, pacing and capturing'], ['bacteremia - gram negative rod'], ['bacteremia - respiratory source'], ['cardiac arrest - initial rhythm: asystole'], ['cardiac arrest - initial rhythm: pulseless electrical activity'], ['cardiac arrest - initial rhythm: ventricular tachycardia'], ['cardiac arrest - un-witnessed'], ['cerebral subdural hematoma - secondary to anticoagulation'], ['cholecystitis - acute'], ['dvt - left upper extremity'], ['dvt - right upper extremity'], ['encephalopathy - toxic'], ['enteritis - colitis, presumed infectious'], ['facial bone fracture - maxillary fracture'], ['facial bone fracture - orbital fracture'], ['gastric ca'], ['hyperglycemia - corticosteroid related'], ['hypernatremia - severe (> 155 meq/dl)'], ['hypothermia'], ['liver ca'], ['melanoma - nodular'], ['mouth and jaw tumor - oral cavity squamous cell ca'], ['myopathy - malignant hyperthermia'], ['necrotizing fasciitis - abdomen/pelvis'], ['peripheral vascular ischemia - atherosclerotic thrombo-occlusion'], ['peripheral vascular ischemia - postoperative'], ['pleural effusion - due to heart failure'], ['pneumothorax - spontaneous'], ['s/p aneurysm resection/repair abdominal aorta'], ['seizures - from ischemia/infarction'], ['sepsis - sepsis with single organ dysfunction- circulatory system failure'], ['valve repair >= 7 days - aortic / mitral'], ['vascular insufficiency of intestine - due to extrinsic compression'], ['ventricular tachycardia - with hemodynamic compromise']]",
            "pred_answer": "[['acute copd exacerbation - with baseline hypoxemia'], ['anal ca'], ['anuria']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict the cohort to only those diagnoses that occurred at least three months ago, so it includes recent diagnoses that have not yet had a full 3-month follow-up. This omission fundamentally alters the mortality rate calculation and requires restructuring the query (adding a filter on diagnosis time) rather than a simple fix within one clause. Therefore, it is a global logic error.",
            "error_type": "Global: missing follow-up time filter"
        },
        "bfc77af7df4b45fa5ec0579d": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "When was the time of patient 027-100241's last hospital discharge?",
            "gold_sql": "SELECT patient.hospitaldischargetime FROM patient WHERE patient.uniquepid = '027-100241' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaldischargetime DESC LIMIT 1",
            "pred_sql": "hospitaldischargetime FROM patient WHERE uniquepid = '027-100241' ORDER BY hospitaldischargetime DESC LIMIT 1",
            "gold_answer": "[['2100-12-01 22:31:00']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword before the column list and also omits the IS NOT NULL filter on hospitaldischargetime. These are syntactic/local mistakes in the SELECT clause rather than a fundamental re\u2010structuring of the query logic or table relationships.",
            "error_type": "Local: syntax error"
        },
        "1afbc775f060dfcad71d671c": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Show me patient 018-10885's yearly minimum 24 h urine protein since 1 year ago.",
            "gold_sql": "SELECT MIN(lab.labresult) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '018-10885' ) ) AND lab.labname = '24 h urine protein' AND datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY strftime('%Y',lab.labresulttime)",
            "pred_sql": "SELECT strftime('%Y', intakeoutputtime) AS year, MIN(cellvaluenumeric) AS min_24h_urine_protein FROM intakeoutput WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '018-10885' ) AND celllabel LIKE '%24 h urine protein%' AND datetime(intakeoutputtime) >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY year",
            "gold_answer": "[['30.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the intakeoutput table instead of the lab table to retrieve '24 h urine protein' results. This is not a simple syntax or column naming mistake but a fundamental misuse of the wrong table, which alters the entire logic of the query. Correcting this requires changing the core structure to reference the lab table and its labresult and labresulttime columns, so it is a global error.",
            "error_type": "Global: incorrect table selection"
        },
        "c7dc0e66cdfbbd924515dbbe": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the sex of patient 006-102774?",
            "gold_sql": "SELECT DISTINCT patient.gender FROM patient WHERE patient.uniquepid = '006-102774'",
            "pred_sql": "gender FROM patient WHERE uniquepid = '006-102774'",
            "gold_answer": "[['male']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword and thus is a local syntax error in the SELECT clause. It does not change the intended logic or table relationships\u2014just a minor fix in the SELECT statement is needed. Therefore, this is a Local error.",
            "error_type": "Local: syntax error"
        },
        "814a25457ce2b7f59394f632": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "How many patients underwent anticoagulant administration - conventional heparin therapy within 2 months after the diagnosis with acute coronary syndrome - acute myocardial infarction (no st elevation), this year?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (no st elevation)' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'anticoagulant administration - conventional heparin therapy' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.diagnosistime < T2.treatmenttime AND datetime(T2.treatmenttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT COUNT(DISTINCT T1.patientunitstayid) FROM diagnosis AS T1 JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.diagnosisname = 'acute coronary syndrome - acute myocardial infarction (no st elevation)' AND T2.drugname = 'conventional heparin therapy' AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime, '+2 months') AND strftime('%Y', T1.diagnosistime) = '2100'",
            "gold_answer": "[['48.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table instead of the treatment table and joins on patientunitstayid rather than counting unique patients (uniquepid). This is not a simple column or syntax mistake but a fundamental change to the query\u2019s logic: it selects from the wrong table, applies filters to drugname instead of treatmentname, and misaligns the intended event timing and patient identifier. Fixing this requires restructuring the core FROM/JOIN clauses and filters, so it\u2019s a global logic error.",
            "error_type": "Global: incorrect table join"
        },
        "1de044d1478a726d732f23df": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What are the five most commonly prescribed drugs for patients that received antibacterials within the same month?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'antibacterials' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.drugstarttime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "WITH AntibacterialPatients AS ( SELECT DISTINCT patientunitstayid, strftime('%Y-%m', drugstarttime) AS month FROM medication WHERE drugname LIKE '%antibacterial%' ), PrescribedDrugs AS ( SELECT drugname FROM medication WHERE (patientunitstayid, strftime('%Y-%m', drugstarttime)) IN (SELECT patientunitstayid, month FROM AntibacterialPatients) ) SELECT drugname FROM ( SELECT drugname, COUNT(*) AS count FROM PrescribedDrugs GROUP BY drugname ORDER BY count DESC LIMIT 5 )",
            "gold_answer": "[['dextrose 50%'], ['nacl 0.9% mbp'], ['piperacillin-tazobactam'], ['potassium chloride'], ['potassium chloride crys er 20 meq po tbcr']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely bypasses the treatment table, instead looking for drugs with \u2018antibacterial\u2019 in their name in the medication table. The question asks for drugs prescribed in the same month as a treatment event named 'antibacterials'. The predicted query never references treatment and so fails to capture the intended patient set, requiring a fundamental restructuring (correct joins between treatment and medication tables) rather than a small fix. This is a Global error.",
            "error_type": "Global: incorrect join/logic error"
        },
        "42c5e6a86e2af4026e2293e2": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Please provide the count of patients who had a volume (ml)-levofloxacin (levaquin) ivpb 750 mg input since 2 year ago.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT intakeoutput.patientunitstayid FROM intakeoutput WHERE intakeoutput.celllabel = 'volume (ml)-levofloxacin (levaquin) ivpb 750 mg' AND intakeoutput.cellpath LIKE '%input%' AND datetime(intakeoutput.intakeoutputtime) >= datetime('2100-12-31 23:59:00','-2 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) FROM intakeoutput WHERE cellpath LIKE '%intake%' AND celllabel LIKE '%volume (ml)-levofloxacin (levaquin) ivpb 750 mg%' AND datetime(intakeoutputtime) >= datetime('2100-12-31 23:59:00', '-2 years')",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['7.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only queries the intakeoutput table, using cellpath LIKE '%intake%' (instead of '%input%') and counts DISTINCT patientunitstayid. It omits the patient table and thus counts ICU stays rather than unique patients. This is not a simple typo; it fundamentally alters the query\u2019s logic and relationships, requiring restructuring (adding a join or subquery) to count distinct patients based on their uniqepid.",
            "error_type": "Global: incorrect join/relationship"
        },
        "d4101fa929c237ae9386cf10": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Get me the patient ids who were diagnosed with cellulitis - abdomen/pelvis in 2100.",
            "gold_sql": "SELECT DISTINCT patient.uniquepid FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'cellulitis - abdomen/pelvis' AND strftime('%Y',diagnosis.diagnosistime) = '2100' )",
            "pred_sql": "SELECT DISTINCT patient.patientunitstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'cellulitis - abdomen/pelvis' AND strftime('%Y', diagnosis.diagnosistime) = '2100'",
            "gold_answer": "[['004-15269'], ['016-10986']]",
            "pred_answer": "[['1554049.0'], ['389703.0']]",
            "is_correct": false,
            "reasoning": "The predicted query differs only in the SELECT clause: it returns patient.patientunitstayid instead of patient.uniquepid. The JOIN and WHERE logic correctly filters diagnoses in 2100 for cellulitis - abdomen/pelvis, but the wrong column is projected. This is a localized column reference mistake that doesn\u2019t affect the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "5a547c9a0a0b185342a34529": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Give me the top three most commonly prescribed drugs since 2100.",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM medication WHERE strftime('%Y',medication.drugstarttime) >= '2100' GROUP BY medication.drugname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT drugname FROM medication WHERE datetime(drugstarttime) >= datetime('2100-12-31 23:59:00','-0 year') GROUP BY drugname ORDER BY COUNT(*) DESC LIMIT 3",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['potassium chloride'], ['tylenol']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The discrepancy lies solely in the WHERE clause\u2019s time filter. The ground truth uses strftime('%Y', medication.drugstarttime) >= '2100' to capture all prescriptions from the start of year 2100 onward. The predicted query instead filters for medication.drugstarttime >= '2100-12-31 23:59:00', effectively only including prescriptions on or after the very last moment of 2100, leading to no results. This is an isolated issue in the temporal condition and does not impact the overall query structure or logic beyond that clause.",
            "error_type": "Local: other-temporal error"
        },
        "750c6907adf544b9533322db": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Tell me what was the total estimated blood loss output of patient 002-10018 on last month/15.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10018' ) ) AND intakeoutput.celllabel = 'estimated blood loss' AND intakeoutput.cellpath LIKE '%output%' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '15'",
            "pred_sql": "SELECT SUM(T2.cellvaluenumeric) AS total_blood_loss FROM patient AS T1 INNER JOIN intakeoutput AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '002-10018' AND datetime(T2.intakeoutputtime, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-1 month') AND strftime('%d', T2.intakeoutputtime) = '15' AND T2.cellpath LIKE '%output%' AND T2.celllabel = 'Estimated Blood Loss'",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "We compare the two queries: both correctly restrict to the 15th of last month, filter on output events, restrict to the same patient\u2019s unit stays, and sum the numeric cellvaluenumeric. The only substantive difference is the WHERE clause on celllabel: the ground truth uses lowercase 'estimated blood loss' whereas the predicted query uses capitalized 'Estimated Blood Loss'. This typo/case mismatch in the literal string causes no rows to match and thus no result, but does not change the overall query structure or logic. Therefore this is a local error (a value parsing/filtering mistake).",
            "error_type": "Local: value parsing error"
        },
        "07fea0d5ec85b1acf9d8910a": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Since 2100, when was the first time that patient 005-10606 was diagnosed with enteritis - colitis, presumed infectious?",
            "gold_sql": "SELECT diagnosis.diagnosistime FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-10606' ) ) AND diagnosis.diagnosisname = 'enteritis - colitis, presumed infectious' AND strftime('%Y',diagnosis.diagnosistime) >= '2100' ORDER BY diagnosis.diagnosistime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(diagnosistime) FROM diagnosis WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '005-10606' ) AND diagnosisname = 'enteritis - colitis, presumed infectious' AND datetime(diagnosistime) >= datetime('2100-12-31 23:59:00','start of year','-0 year')",
            "gold_answer": "[['2100-08-17 15:23:00']]",
            "pred_answer": "[['2100-08-27 00:51:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a single patientunitstayid subquery instead of retrieving all unit stays for the patient's health system stay. The ground truth correctly accounts for all unit stays by first selecting the patienthealthsystemstayid for the given uniquepid and then all associated patientunitstayid values. By restricting to one unitstayid, the predicted query misses earlier diagnoses and returns the wrong date. This is not a simple syntax fix but an incorrect join/relationship logic that changes the overall result.",
            "error_type": "Global: incorrect join relationship"
        },
        "3cada3b262b36ccaf92ce91b": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What was the first time that patient 010-10482 had the maximum value of -basos?",
            "gold_sql": "SELECT lab.labresulttime FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10482' ) ) AND lab.labname = '-basos' ORDER BY lab.labresult DESC, lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT labresulttime FROM lab WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '010-10482' ) AND labname = '-basos' ORDER BY CAST(labresult AS REAL) DESC, labresulttime ASC LIMIT 1",
            "gold_answer": "[['2100-05-15 17:04:00']]",
            "pred_answer": "[['2100-05-18 07:39:00']]",
            "is_correct": false,
            "reasoning": "The ground truth SQL first finds the patienthealthsystemstayid for uniquepid '010-10482', then retrieves all related patientunitstayid values to include every ICU stay for that patient. The predicted SQL, however, directly equates patientunitstayid to a single value retrieved by uniquepid, thus ignoring additional stays and changing the dataset over which the max is computed. This is not a minor fix in a single clause but alters the overall table relationship logic.",
            "error_type": "Global: incorrect join relationship"
        },
        "488a44148ca1110d01cc6bf6": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Can i know the 3-month survival rate of patients diagnosed with acute copd exacerbation who were then prescribed methylprednisolone sod suc(pf)?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute copd exacerbation' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'methylprednisolone sod suc(pf)' GROUP BY patient.uniquepid HAVING MAX(medication.drugstarttime) = medication.drugstarttime ) AS T2 ON T1.uniquepid = T2.uniquepid JOIN patient ON T1.uniquepid = patient.uniquepid WHERE T1.diagnosistime < T2.drugstarttime GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "WITH DiagnosisPatients AS ( SELECT DISTINCT patientunitstayid, diagnosistime FROM diagnosis WHERE diagnosisname = 'acute copd exacerbation' ), MedicationPatients AS ( SELECT DISTINCT patientunitstayid FROM medication WHERE drugname = 'methylprednisolone sod suc(pf)' ), SurvivalPatients AS ( SELECT DISTINCT T1.patientunitstayid FROM DiagnosisPatients AS T1 INNER JOIN MedicationPatients AS T2 ON T1.patientunitstayid = T2.patientunitstayid INNER JOIN patient AS T3 ON T1.patientunitstayid = T3.patientunitstayid WHERE datetime(T3.hospitaldischargetime) > datetime(T1.diagnosistime, '+91 days') ), TotalPatients AS ( SELECT DISTINCT T1.patientunitstayid FROM DiagnosisPatients AS T1 INNER JOIN MedicationPatients AS T2 ON T1.patientunitstayid = T2.patientunitstayid ) SELECT CAST(COUNT(SurvivalPatients.patientunitstayid) AS FLOAT) / COUNT(TotalPatients.patientunitstayid) AS survival_rate FROM TotalPatients LEFT JOIN SurvivalPatients ON TotalPatients.patientunitstayid = SurvivalPatients.patientunitstayid",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic of the intended query. It does not enforce that the prescription occurs after the first diagnosis (it merely joins on patientunitstayid), it does not use the first diagnosis event, it does not filter patients whose diagnosis occurred at least three months ago relative to the fixed current time, and it misdefines survival by comparing discharge time to diagnosis + 91 days rather than checking death within three months. These issues span multiple clauses and alter the overall structure and meaning of the query, requiring significant restructuring to correct.",
            "error_type": "Global: incorrect join and survival logic"
        },
        "e6422d952e5bd12cfbf2a976": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Can you tell me the minimum total hospital cost if it involves a albumin lab test since 2100?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'albumin' ) ) AND strftime('%Y',cost.chargetime) >= '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MIN(total_cost) FROM ( SELECT SUM(DISTINCT C.cost) AS total_cost FROM cost AS C JOIN lab AS L ON C.patientunitstayid = L.patientunitstayid JOIN patient AS P ON C.patienthealthsystemstayid = P.patienthealthsystemstayid WHERE L.labname = 'albumin' AND datetime(L.labresulttime) >= datetime('2100-01-01 00:00:00') AND C.eventtype = 'lab' AND P.hospitaldischargetime IS NOT NULL GROUP BY C.patienthealthsystemstayid )",
            "gold_answer": "[['122.78']]",
            "pred_answer": "[['59.74']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic of the original: it joins cost to lab directly on patientunitstayid (instead of filtering by patienthealthsystemstayid), restricts costs to only lab event types, sums DISTINCT costs (dropping duplicate costs), filters on labresulttime rather than cost.chargetime, and imposes a hospitaldischargetime IS NOT NULL condition. These changes span multiple clauses and alter the intended meaning and scope of the calculation rather than fixing a localized mistake.",
            "error_type": "Global: flawed query logic"
        },
        "f9fcc93b5505cb3b35d9dfdc": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "List the top three most common diagnoses for patients in their 30s.",
            "gold_sql": "SELECT T1.diagnosisname FROM ( SELECT diagnosis.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 30 AND 39 ) GROUP BY diagnosis.diagnosisname ) AS T1 WHERE T1.C1 <= 3",
            "pred_sql": "SELECT diagnosisname FROM diagnosis WHERE patientunitstayid IN ( SELECT patientunitstayid FROM patient WHERE CAST(age AS INTEGER) BETWEEN 30 AND 39 ) GROUP BY diagnosisname ORDER BY COUNT(diagnosisname) DESC LIMIT 3",
            "gold_answer": "[['acute respiratory failure'], ['diabetes mellitus'], ['esrd (end stage renal disease)'], ['septic shock']]",
            "pred_answer": "[['acute respiratory failure'], ['diabetes mellitus'], ['esrd (end stage renal disease)']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a simple GROUP BY with ORDER BY COUNT and LIMIT 3, whereas the ground truth uses DENSE_RANK to include all diagnoses tied for the third most common. By using LIMIT 3, the predicted query omits any tied entries beyond the first three rows, thus changing the intended logic of returning all top-three-ranked diagnoses (including ties). This is not a minor column typo or syntax fix but a fundamental flaw in the ranking strategy that spans the overall query structure. Therefore, it is a Global error.",
            "error_type": "Global: incorrect ranking method"
        },
        "2d0d2460ff714b2ed38ef17a": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What are the five most frequently prescribed medications for patients diagnosed with hypertension - hypertensive emergency/urgency previously within the same month, since 1 year ago?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypertension - hypertensive emergency/urgency' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT T2.drugname FROM diagnosis AS T1 JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.diagnosisname = 'hypertension - hypertensive emergency/urgency' AND datetime(T1.diagnosistime, 'start of month') = datetime(T2.drugstarttime, 'start of month') AND datetime(T1.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY T2.drugname ORDER BY COUNT(T2.drugname) DESC LIMIT 5",
            "gold_answer": "[['10 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['albuterol sulfate (2.5 mg/3ml) 0.083% in nebu'], ['alteplase 2 mg ij solr'], ['vancomycin hcl 1000 mg iv solr']]",
            "pred_answer": "[['10 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['2 ml : ondansetron hcl 4 mg/2ml iv soln'], ['amlodipine besylate 10 mg po tabs'], ['carvedilol 6.25 mg po tabs']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the critical condition ensuring that each medication\u2019s start time occurs after the diagnosis time (T1.diagnosistime < T2.drugstarttime). This missing temporal filter causes medications prescribed earlier in the same month to be incorrectly counted. The overall query structure (JOIN, GROUP BY, ORDER BY and LIMIT) remains intact; only a localized WHERE\u2010clause condition is missing.",
            "error_type": "Local: other-temporal error"
        },
        "47fc7d3548e30d33d281d558": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Please tell me the total number of patients who had a cl flush: introducer sheath ij r input since 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT intakeoutput.patientunitstayid FROM intakeoutput WHERE intakeoutput.celllabel = 'cl flush: introducer sheath ij r' AND intakeoutput.cellpath LIKE '%input%' AND strftime('%Y',intakeoutput.intakeoutputtime) >= '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT P.patientunitstayid) FROM patient AS P INNER JOIN intakeoutput AS IO ON P.patientunitstayid = IO.patientunitstayid WHERE IO.cellpath LIKE '%cl flush: introducer sheath ij r%' AND datetime(IO.intakeoutputtime) >= datetime('2100-01-01 00:00:00')",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted query makes localized mistakes in the SELECT and WHERE clauses without altering the overall query structure. Specifically: (1) It uses IO.cellpath LIKE '%cl flush\u2026%' instead of filtering on the correct column (celllabel) and misses the required input filter (cellpath LIKE '%input%'). (2) It counts DISTINCT patientunitstayid instead of DISTINCT patient.uniquepid. These are column/reference and filter errors confined to individual clauses, not a change in the join logic or overall query design.",
            "error_type": "Local: column/filter reference error"
        },
        "0c4056652a853e3a4d83a7ce": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "This year, how many patients were given cefazolin 2 gm in ns 100 ml ivpb within the same hospital visit after receiving a antiarrhythmics - class iii antiarrhythmic procedure?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'antiarrhythmics - class iii antiarrhythmic' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'cefazolin 2 gm in ns 100 ml ivpb' AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.treatmenttime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT T3.patienthealthsystemstayid) FROM medication AS T1 JOIN treatment AS T2 ON T1.patientunitstayid = T2.patientunitstayid JOIN patient AS T3 ON T1.patientunitstayid = T3.patientunitstayid WHERE T1.drugname = 'cefazolin 2 gm in ns 100 ml ivpb' AND T2.treatmentname = 'antiarrhythmics - class iii antiarrhythmic' AND datetime(T1.drugstarttime) > datetime(T2.treatmenttime) AND strftime('%Y', T1.drugstarttime) = '2100' AND T3.hospitaldischargetime IS NOT NULL AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: T1.patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL references T1.patienthealthsystemstayid, but the medication table (aliased as T1) does not have a patienthealthsystemstayid column. This is a simple column reference error within a single clause and does not affect the overall query structure or logic, fitting the definition of a local error.",
            "error_type": "Local: column reference error"
        },
        "839e80df768eb6c06c6601ce": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "On 05/11/2100, what was the maximum value of the heart rate for patient 003-11972?",
            "gold_sql": "SELECT MAX(vitalperiodic.heartrate) FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-11972' ) ) AND vitalperiodic.heartrate IS NOT NULL AND strftime('%Y-%m-%d',vitalperiodic.observationtime) = '2100-05-11'",
            "pred_sql": "MAX(V.heartrate) AS max_heart_rate FROM patient AS P JOIN vitalperiodic AS V ON P.patientunitstayid = V.patientunitstayid WHERE P.uniquepid = '003-11972' AND datetime(V.observationtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',V.observationtime) = '05-11'",
            "gold_answer": "[['84.0']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s mistake is confined to the date\u2010filtering predicate: it uses datetime(...,'start of year') plus a separate strftime('%m-%d') test rather than matching the full date (strftime('%Y-%m-%d') = '2100-05-11') as in the ground truth. Because of that incorrect temporal condition, no rows qualify and the query returns NULL. This error is localized entirely in the WHERE clause\u2019s date logic and does not change the overall join structure or relationships between tables.",
            "error_type": "Local: other\u2010temporal error"
        },
        "3f431d7d1d47504f2a86e31f": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What time was patient 002-12407 prescribed a drug for the last time on the last hospital visit?",
            "gold_sql": "SELECT medication.drugstarttime FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-12407' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(drugstoptime) FROM medication WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '002-12407' AND hospitaldischargetime IS NOT NULL ORDER BY hospitaladmittime DESC LIMIT 1 )",
            "gold_answer": "[['2100-03-05 00:00:40']]",
            "pred_answer": "[['2100-03-06 21:43:40']]",
            "is_correct": false,
            "reasoning": "The predicted SQL locally mis\u2010references the wrong time column: it uses MAX(drugstoptime) instead of retrieving medication.drugstarttime. This is confined to the SELECT expression and does not alter the overall query structure or join logic, so it\u2019s a localized column reference error.",
            "error_type": "Local: column reference error"
        },
        "9914665feeedfe52a91bea48": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What are the four most frequent drugs prescribed to male patients with an age of 60 or above within the same month after they are diagnosed with anemia - anemia of critical illness?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'anemia - anemia of critical illness' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.gender = 'male' AND patient.age >= 60 ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH AnemiaPatients AS ( SELECT DISTINCT p.patientunitstayid FROM patient p JOIN diagnosis d ON p.patientunitstayid = d.patientunitstayid WHERE p.gender = 'male' AND CAST(p.age AS INTEGER) >= 60 AND d.diagnosisname = 'anemia - anemia of critical illness' ), PrescribedDrugs AS ( SELECT m.drugname FROM medication m JOIN AnemiaPatients ap ON m.patientunitstayid = ap.patientunitstayid JOIN diagnosis d ON m.patientunitstayid = d.patientunitstayid WHERE d.diagnosisname = 'anemia - anemia of critical illness' AND datetime(d.diagnosistime, 'start of month') = datetime(m.drugstarttime, 'start of month') ) SELECT drugname FROM ( SELECT drugname, COUNT(*) as freq, DENSE_RANK() OVER (ORDER BY COUNT(*) DESC) as rnk FROM PrescribedDrugs GROUP BY drugname ) ranked_drugs WHERE rnk <= 4",
            "gold_answer": "[['albumin human 5%'], ['ativan'], ['dextrose 50% abboject'], ['haldol'], ['morphine'], ['normal saline flush']]",
            "pred_answer": "[['albumin human 5%'], ['ativan'], ['dextrose 50% abboject'], ['normal saline flush']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the crucial condition requiring the medication start time to occur after the diagnosis time (T1.diagnosistime < T2.drugstarttime). This is a missing WHERE\u2010clause filter rather than a flaw in the overall query structure, joins, or ranking logic. Adding the time-comparison condition back into the WHERE clause would align the predicted SQL with the intended logic, so the error is confined to a specific part of the query.",
            "error_type": "Local: missing time comparison filter"
        },
        "47d54fff12028659efa8b8b1": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "This year, what are the top three most common drugs prescribed within the same hospital visit to male patients aged 60 or above after being diagnosed with delirium?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'delirium' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.gender = 'male' AND patient.age >= 60 AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "WITH DeliriumPatients AS ( SELECT DISTINCT P.patientunitstayid, P.patienthealthsystemstayid FROM patient AS P INNER JOIN diagnosis AS D ON P.patientunitstayid = D.patientunitstayid WHERE P.gender = 'male' AND CAST(P.age AS INTEGER) >= 60 AND D.diagnosisname = 'delirium' AND datetime(D.diagnosistime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') ), PrescribedDrugs AS ( SELECT M.drugname FROM DeliriumPatients AS DP INNER JOIN medication AS M ON DP.patientunitstayid = M.patientunitstayid WHERE datetime(M.drugstarttime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND DP.patienthealthsystemstayid = (SELECT patienthealthsystemstayid FROM patient WHERE patientunitstayid = M.patientunitstayid) ) SELECT DISTINCT drugname FROM ( SELECT drugname, DENSE_RANK() OVER (ORDER BY COUNT(*) DESC) AS rank FROM PrescribedDrugs GROUP BY drugname ) AS RankedDrugs WHERE rank <= 3",
            "gold_answer": "[['dextrose 50% adult'], ['magnesium oxide'], ['sodium chloride 0.9%']]",
            "pred_answer": "[['dextrose 50% adult'], ['lorazepam'], ['sodium chloride 0.9%']]",
            "is_correct": false,
            "reasoning": "The predicted SQL builds two CTEs to identify male delirium patients and their prescriptions in the same year, then ranks the drugs. However, it never enforces that the drugstarttime occurs after the delirium diagnosistime. In the ground truth SQL, there is a WHERE clause T1.diagnosistime < T2.drugstarttime to ensure prescriptions happen after diagnosis. Omitting this temporal join condition fundamentally changes which drugs are counted and thus alters the intended result. This is not a simple typo or localized syntax issue but a missing logical constraint spanning the diagnosis\u2013medication relationship.",
            "error_type": "Global: missing temporal join condition"
        },
        "ce170c7abf96e8b47789c54d": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "When was patient 016-10564 first discharged from the hospital?",
            "gold_sql": "SELECT patient.hospitaldischargetime FROM patient WHERE patient.uniquepid = '016-10564' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaldischargetime ASC LIMIT 1",
            "pred_sql": "MIN(patient.hospitaldischargetime) AS first_discharge_time FROM patient WHERE patient.uniquepid = '016-10564' AND patient.hospitaldischargetime IS NOT NULL",
            "gold_answer": "[['2100-01-17 13:49:52']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword before the aggregate function, making it a localized syntax/SELECT clause error. The overall query structure (finding the earliest discharge time) is correct, but the missing SELECT renders it invalid. This is a local syntax error that can be fixed without changing the query\u2019s logic.",
            "error_type": "Local: syntax error"
        },
        "a08d68de4bba22b9d544a0e0": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the daily maximum level of patient 006-100338's paco2 in 2100?",
            "gold_sql": "SELECT MAX(lab.labresult) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-100338' ) ) AND lab.labname = 'paco2' AND strftime('%Y',lab.labresulttime) = '2100' GROUP BY strftime('%Y-%m-%d',lab.labresulttime)",
            "pred_sql": "SELECT strftime('%Y-%m-%d', labresulttime) AS date, MAX(labresult) AS max_paco2 FROM lab WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '006-100338' ) AND labname = 'paco2' AND strftime('%Y', labresulttime) = '2100' GROUP BY date",
            "gold_answer": "[['31.0'], ['35.0'], ['36.0'], ['37.0'], ['39.0'], ['41.0'], ['45.0']]",
            "pred_answer": "[['2100-09-08', '45.0'], ['2100-09-09', '41.0'], ['2100-09-10', '39.0'], ['2100-09-11', '37.0'], ['2100-09-12', '35.0'], ['2100-09-13', '36.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL incorrectly restricts lab records to a single patientunitstayid derived directly from uniquepid, whereas the ground truth uses the patienthealthsystemstayid to include all relevant unit stays for that patient. This mistake affects the core logic of how patient records are associated across tables, altering the intended dataset. Fixing it would require changing the join/filter strategy rather than a simple typo or minor clause adjustment.",
            "error_type": "Global: join relationship error"
        },
        "bb8a3797c26badc2dc4e226f": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "How many days have passed from the time when patient 012-10585 was admitted to the icu?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '012-10585' AND patient.unitdischargetime IS NULL",
            "pred_sql": "julianday('2100-12-31') - julianday(patient.unitadmittime) AS days_passed FROM patient WHERE patient.uniquepid = '012-10585'",
            "gold_answer": "[['4.351']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL is missing the SELECT keyword and does not apply the required filter on unitdischargetime IS NULL. The mistake is localized to the SELECT/WHERE clause syntax and does not alter the overall query structure or relationships between tables. Therefore, it is a local error.",
            "error_type": "Local: syntax error"
        },
        "0b64c8b521777103368b8d1f": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the number of times that patient 030-11672 visited the hospital in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.patienthealthsystemstayid ) FROM patient WHERE patient.uniquepid = '030-11672' AND strftime('%Y',patient.hospitaladmittime) = '2100'",
            "pred_sql": "COUNT(DISTINCT patienthealthsystemstayid) FROM patient WHERE uniquepid = '030-11672' AND strftime('%Y', hospitaladmittime) = '2100'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "null",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the SELECT keyword and the proper SELECT clause, making it a syntax/local error rather than a logical mistake in joining tables or query structure. The overall intention\u2014counting distinct hospital visits for the given patient in 2100\u2014is intact, but the missing SELECT renders the query invalid.",
            "error_type": "Local: syntax error"
        },
        "1c04274596c99433482a7a85": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What is the minimum total cost of hospitalization that includes the lactate laboratory test in 2100?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'lactate' ) ) AND strftime('%Y',cost.chargetime) = '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MIN(total_cost) AS min_total_cost FROM ( SELECT SUM(DISTINCT C.cost) AS total_cost FROM cost AS C JOIN lab AS L ON C.patienthealthsystemstayid = L.patientunitstayid WHERE L.labname = 'lactate' AND strftime('%Y', L.labresulttime) = '2100' AND C.eventtype IN ('diagnosis', 'treatment', 'lab', 'medication') GROUP BY C.patienthealthsystemstayid )",
            "gold_answer": "[['270.99']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": [
                "The predicted query attempts to link cost and lab tables directly by matching cost.patienthealthsystemstayid to lab.patientunitstayid, but these are different keys and should not be joined directly.",
                "This join error fundamentally alters the relationships between tables and returns no matching rows.",
                "Additionally, the predicted query filters lab events by labresulttime instead of summing costs by the charge time (cost.chargetime), deviating from the intended cost aggregation logic.",
                "These mistakes are not isolated to a single clause but affect the overall data associations and logic of the query."
            ],
            "error_type": "Global: incorrect join keys and filtering"
        },
        "d446acea3c3db0da8b178a5e": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Which drug was patient 029-10096 allergic to since 09/2100?",
            "gold_sql": "SELECT allergy.drugname FROM allergy WHERE allergy.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '029-10096' ) ) AND strftime('%Y-%m',allergy.allergytime) >= '2100-09'",
            "pred_sql": "SELECT DISTINCT drugname FROM allergy WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '029-10096' ) AND strftime('%Y-%m', allergytime) >= '2100-09'",
            "gold_answer": "[['lasix'], ['lasix'], ['sulfacetamide sod monohydrate'], ['sulfacetamide sod monohydrate']]",
            "pred_answer": "[['lasix'], ['sulfacetamide sod monohydrate']]",
            "is_correct": false,
            "reasoning": "The predicted query uses a single-level direct equality on patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '029-10096'), whereas the ground truth correctly links uniquepid \u2192 patienthealthsystemstayid \u2192 all patientunitstayid values to capture every ICU stay for that patient. The predicted SQL also uses '=' instead of 'IN', so it only returns allergies from one stay rather than all relevant stays. This misjoins the tables and breaks the intended patient\u2010to\u2010allergy relationship, requiring restructuring of the join logic rather than a simple fix in one clause.",
            "error_type": "Global: join error"
        },
        "25e1fa3607d0a4f426631379": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "What was the name of the medication that patient 003-10264 was prescribed within the same day after having received a stress ulcer prophylaxis - antacids procedure since 03/2100?",
            "gold_sql": "SELECT T2.drugname FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-10264' ) AND treatment.treatmentname = 'stress ulcer prophylaxis - antacids' AND strftime('%Y-%m',treatment.treatmenttime) >= '2100-03' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '003-10264' ) AND strftime('%Y-%m',medication.drugstarttime) >= '2100-03' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.drugstarttime AND datetime(T1.treatmenttime,'start of day') = datetime(T2.drugstarttime,'start of day')",
            "pred_sql": "SELECT DISTINCT T2.drugname FROM treatment AS T1 JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid JOIN patient AS T3 ON T1.patientunitstayid = T3.patientunitstayid WHERE T3.uniquepid = '003-10264' AND T1.treatmentname = 'stress ulcer prophylaxis - antacids' AND datetime(T1.treatmenttime) >= datetime('2100-03-01') AND datetime(T1.treatmenttime, 'start of day') = datetime(T2.drugstarttime, 'start of day')",
            "gold_answer": "[['fentanyl citrate inj']]",
            "pred_answer": "[['acetaminophen'], ['bisacodyl supp'], ['fentanyl citrate inj'], ['fentanyl citrate inj'], ['hydralazine inj'], [\"lactated ringer's 1,000 ml bag.\"], [\"lactated ringer's 1,000 ml bag.\"], [\"lactated ringer's 1,000 ml bag.\"], ['magnesium hydroxide'], ['ondansetron inj'], ['ondansetron inj'], ['ondansetron inj']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the necessary condition that the medication start time must be after the treatment time (T1.treatmenttime < T2.drugstarttime). It only enforces that they occur on the same day, so medications given earlier that day are erroneously included. This mistake is confined to the WHERE clause logic and does not change the overall query structure or table relationships.",
            "error_type": "Local: missing time order condition"
        },
        "9f2f892efa9cbefc44db2be8": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Count the number of patients who were diagnosed with hepatic dysfunction - with cirrhosis but didn't come back to the hospital within the same month since 1 year ago.",
            "gold_sql": "SELECT ( SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hepatic dysfunction - with cirrhosis' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 ) - ( SELECT COUNT( DISTINCT T2.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hepatic dysfunction - with cirrhosis' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 JOIN patient ON T2.uniquepid = patient.uniquepid WHERE T2.diagnosistime < patient.hospitaladmittime AND datetime(patient.hospitaladmittime) >= datetime('2100-12-31 23:59:00','-1 year') AND datetime(T2.diagnosistime,'start of month') = datetime(patient.hospitaladmittime,'start of month') )",
            "pred_sql": "SELECT COUNT(DISTINCT T1.patientunitstayid) FROM diagnosis AS T1 JOIN patient AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.diagnosisname = 'hepatic dysfunction - with cirrhosis' AND datetime(T1.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') AND NOT EXISTS ( SELECT 1 FROM patient AS T3 WHERE T3.uniquepid = T2.uniquepid AND datetime(T3.hospitaladmittime,'start of month') = datetime(T2.hospitaladmittime,'start of month') AND datetime(T3.hospitaladmittime) > datetime(T2.hospitaldischargetime) )",
            "gold_answer": "[['12.0']]",
            "pred_answer": "[['16.0']]",
            "is_correct": false,
            "reasoning": "1. The predicted SQL counts DISTINCT patientunitstayid instead of DISTINCT uniquepid, changing the aggregation from patients to unit stays.\n2. The NOT EXISTS subquery logic is fundamentally flawed: it compares future hospitaladmittime against the original admission\u2019s discharge and matches months on T2.hospitaladmittime rather than the diagnosis time, breaking the intended \"same month return\" check.\n3. These mistakes alter the overall query logic and patient-level scope, requiring restructuring beyond a simple fix in one clause.\n4. Therefore, this is a Global error affecting the core logic and structure of the query.",
            "error_type": "Global: incorrect join and aggregation logic"
        },
        "a9a5042d9f74ed9c9f7a7f53": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Since 1 year ago, what are the top four most frequently ordered laboratory tests for patients within 2 months after diagnosed with acute respiratory failure - drug related?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory failure - drug related' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.labresulttime AND datetime(T2.labresulttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT T2.labname FROM diagnosis AS T1 JOIN lab AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.diagnosisname = 'acute respiratory failure - drug related' AND datetime(T2.labresulttime) <= datetime(T1.diagnosistime, '+2 months') AND datetime(T1.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY T2.labname ORDER BY COUNT(T2.labname) DESC LIMIT 4",
            "gold_answer": "[['bedside glucose'], ['bicarbonate'], ['bun'], ['chloride'], ['creatinine'], ['glucose'], ['hct'], ['hgb'], ['mch'], ['mchc'], ['mcv'], ['platelets x 1000'], ['potassium'], ['rbc'], ['sodium'], ['wbc x 1000']]",
            "pred_answer": "[['bedside glucose'], ['potassium'], ['rbc'], ['wbc x 1000']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict lab events to those occurring after the diagnosis. It only applies an upper bound (labresulttime \u2264 diagnosis time + 2 months) but omits the lower bound (labresulttime \u2265 diagnosis time). This mistake is confined to the WHERE clause and can be corrected by adding that one temporal condition, without restructuring the overall query.",
            "error_type": "Local: missing time\u2010bound condition"
        },
        "447f96c8b5fb35865f80afac": {
            "db_id": "eicu",
            "generator_name": "dinsql",
            "question": "Calculate the total number of patients diagnosed with hypotension who didn't revisit the hospital within the same month since 1 year ago.",
            "gold_sql": "SELECT ( SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypotension' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 ) - ( SELECT COUNT( DISTINCT T2.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypotension' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 JOIN patient ON T2.uniquepid = patient.uniquepid WHERE T2.diagnosistime < patient.hospitaladmittime AND datetime(patient.hospitaladmittime) >= datetime('2100-12-31 23:59:00','-1 year') AND datetime(T2.diagnosistime,'start of month') = datetime(patient.hospitaladmittime,'start of month') )",
            "pred_sql": "SELECT COUNT(DISTINCT T1.uniquepid) FROM patient AS T1 JOIN diagnosis AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T2.diagnosisname = 'hypotension' AND datetime(T1.hospitaladmittime) >= datetime('2100-12-31 23:59:00', '-1 year') AND NOT EXISTS ( SELECT 1 FROM patient AS T3 WHERE T3.uniquepid = T1.uniquepid AND datetime(T3.hospitaladmittime, 'start of month') = datetime(T1.hospitaladmittime, 'start of month') AND T3.patientunitstayid != T1.patientunitstayid AND datetime(T3.hospitaladmittime) >= datetime('2100-12-31 23:59:00', '-1 year') )",
            "gold_answer": "[['68.0']]",
            "pred_answer": "[['59.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic across multiple clauses: it filters on patient.hospitaladmittime instead of diagnosis.diagnosistime, and its NOT EXISTS subquery checks for other hospital admissions in the same month rather than revisits based on diagnosis time. These errors involve the overall join strategy and core query structure rather than a single clause, so they require major restructuring to fix.",
            "error_type": "Global: incorrect logical structure"
        }
    },
    "deepseek": {
        "969495ca8e36a6df510d7273": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Please list the daily minimum volume of urine that was output by patient 022-10471 on the last hospital visit.",
            "gold_sql": "SELECT MIN(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-10471' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND intakeoutput.celllabel = 'urine' AND intakeoutput.cellpath LIKE '%output%' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT p.uniquepid, MIN(io.cellvaluenumeric) AS daily_min_urine_volume FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '022-10471' AND io.cellpath LIKE '%output (ml)|urine' AND p.hospitaldischargetime IS NOT NULL GROUP BY DATE(io.intakeoutputtime) ORDER BY DATE(io.intakeoutputtime) DESC LIMIT 1;",
            "gold_answer": "[['100.0'], ['200.0'], ['400.0']]",
            "pred_answer": "[['022-10471', '200.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the intended logic in multiple ways: it applies ORDER BY \u2026 DESC LIMIT 1, returning only the last day's minimum instead of all daily minima; it uses an incorrect LIKE pattern for urine output; and it fails to restrict to the patient\u2019s most recent hospital stay properly. These issues span multiple clauses (FROM/WHERE, GROUP BY, ORDER BY/LIMIT) and require restructuring the query beyond a single clause fix. Therefore, this is a global error.",
            "error_type": "Global: flawed query structure"
        },
        "0327353ac5ed15c9699d9ea9": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Is the value of mean blood pressure in patient 022-1011 from last measurement on the current icu visit less than its first measurement on the current icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.systemicmean FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-1011' ) AND patient.unitdischargetime IS NULL ) AND vitalperiodic.systemicmean IS NOT NULL ORDER BY vitalperiodic.observationtime DESC LIMIT 1 ) < ( SELECT vitalperiodic.systemicmean FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-1011' ) AND patient.unitdischargetime IS NULL ) AND vitalperiodic.systemicmean IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 )",
            "pred_sql": "SELECT (SELECT systemicmean FROM vitalperiodic WHERE patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '022-1011' AND hospitaldischargetime IS NULL) ORDER BY observationtime DESC LIMIT 1) < (SELECT systemicmean FROM vitalperiodic WHERE patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '022-1011' AND hospitaldischargetime IS NULL) ORDER BY observationtime ASC LIMIT 1) ;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses hospitaldischargetime to identify the current ICU visit and directly equates patientunitstayid from patient.uniquepid, whereas the ground truth correctly filters on patient.unitdischargetime IS NULL for the ICU visit via patienthealthsystemstayid and unitstay relationships. The predicted query thus misidentifies the visit and uses the wrong join/filter logic, fundamentally altering the intended semantics and resulting in no data. This is not a minor syntax or column naming issue but a core structural/logical error in how tables are joined and visits are identified.",
            "error_type": "Global: incorrect relationship error"
        },
        "59a090e63b9aecaa8ba090db": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How many patients were given #3: in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT intakeoutput.patientunitstayid FROM intakeoutput WHERE intakeoutput.celllabel = '#3:' AND intakeoutput.cellpath LIKE '%input%' AND strftime('%Y',intakeoutput.intakeoutputtime) = '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) FROM treatment WHERE treatmentid = 3 AND strftime('%Y', treatmenttime) = '2100';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the treatment table with condition treatmentid = 3 instead of querying the intakeoutput table for celllabel '#3:' and filtering on input events in 2100. It also omits the subquery against patientunitstayid and fails to count distinct patient.uniquepid as required. This misuse of the wrong table and columns fundamentally alters the query\u2019s logic and fails to capture the intended data source, so the error is not a minor syntactic mistake but a structural and logical flaw.",
            "error_type": "Global: incorrect table and logic"
        },
        "9349e897c6c87592db2b6b4d": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What would be the monthly average weight of patient 013-10332 since 2100?",
            "gold_sql": "SELECT AVG(patient.admissionweight) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10332' ) AND patient.admissionweight IS NOT NULL AND strftime('%Y',patient.unitadmittime) >= '2100' GROUP BY strftime('%Y-%m',patient.unitadmittime)",
            "pred_sql": "-- Unfortunately, the database schema does not contain periodic weight measurements beyond admission and discharge weights, so it's not possible to calculate the monthly average weight for the patient. SELECT admissionweight, dischargeweight FROM patient WHERE uniquepid = '013-10332';",
            "gold_answer": "[['74.8']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely fails to implement the required aggregation (AVG) and grouping by month, and it does not filter by the date or compute a monthly average at all. Instead, it merely selects admissionweight and dischargeweight for the patient, which is a fundamentally different query structure and logic. Fixing this would require rewriting the query to include the proper aggregation, date filtering, and grouping clauses, not just a minor localized correction.",
            "error_type": "Global: structural-flaw"
        },
        "b3a0ff53392263e54edf05b0": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "When was patient 005-10974's first antidepressant - trazodone (desyrel) treatment on the first hospital visit?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-10974' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND treatment.treatmentname = 'antidepressant - trazodone (desyrel)' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(m.drugstarttime) AS first_trazodone_time FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '005-10974' AND (m.drugname = 'trazodone' OR m.drugname = 'Desyrel') AND p.hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '005-10974' );",
            "gold_answer": "[['2100-09-19 01:14:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query uses the medication table and drugstarttime to find the first trazodone event, whereas the question and ground truth require the treatment table and treatmenttime for 'antidepressant - trazodone (desyrel)' specifically on the first completed hospital visit. This mistake of choosing the wrong table and column and misapplying the hospital admission logic affects the overall structure and intended semantics of the query, not just a localized condition or syntax.",
            "error_type": "Global: incorrect table usage"
        },
        "8d42b976f508ae3b52c0c22f": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Share the five most frequently performed procedures since 2100.",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM treatment WHERE strftime('%Y',treatment.treatmenttime) >= '2100' GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "WITH procedures AS ( SELECT 'diagnosis' AS type, diagnosisname AS procedure_name, cost.chargetime FROM cost JOIN diagnosis ON cost.eventid = diagnosis.diagnosisid AND cost.patientunitstayid = diagnosis.patientunitstayid WHERE cost.event_type = 'diagnosis' AND chargetime >= '2100-01-01' UNION ALL SELECT 'treatment' AS type, treatmentname AS procedure_name, cost.chargetime FROM cost JOIN treatment ON cost.eventid = treatment.treatmentid AND cost.patientunitstayid = treatment.patientunitstayid WHERE cost.event_type = 'treatment' AND chargetime >= '2100-01-01' UNION ALL SELECT 'lab' AS type, labname AS procedure_name, cost.chargetime FROM cost JOIN lab ON cost.eventid = lab.labid AND cost.patientunitstayid = lab.patientunitstayid WHERE cost.event_type = 'lab' AND chargetime >= '2100-01-01' UNION ALL SELECT 'medication' AS type, drugname AS procedure_name, cost.chargetime FROM cost JOIN medication ON cost.eventid = medication.medicationid AND cost.patientunitstayid = medication.patientunitstayid WHERE cost.event_type = 'medication' AND chargetime >= '2100-01-01' ) SELECT procedure_name, COUNT(*) AS frequency FROM procedures GROUP BY procedure_name ORDER BY frequency DESC LIMIT 5;",
            "gold_answer": "[['antiemetic - serotonin antagonist'], ['chest x-ray'], ['mechanical ventilation'], ['normal saline administration'], ['stress ulcer prophylaxis - pantoprazole']]",
            "pred_answer": "no such column: cost.event_type",
            "is_correct": false,
            "reasoning": "The predicted SQL refers to cost.event_type, but the actual column is named cost.eventtype. This is a simple column reference error and does not require restructuring the query\u2019s overall logic or tables.",
            "error_type": "Local: column reference error"
        },
        "e6c1ce3d1f2119c0c4efd410": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How many patients had antidepressant two or more times?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, COUNT(*) AS C1 FROM patient WHERE patient.patientunitstayid = ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'antidepressant' ) GROUP BY patient.uniquepid ) AS T1 WHERE T1.C1 >= 2",
            "pred_sql": "SELECT COUNT(DISTINCT m.patientunitstayid) AS count_patients FROM medication m WHERE m.drugname IN ('sertraline', 'fluoxetine', 'paroxetine', 'amitriptyline', 'duloxetine') GROUP BY m.patientunitstayid HAVING COUNT(DISTINCT m.medicationid) >= 2;",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and specific drug names (sertraline, fluoxetine, etc.) instead of using the treatment table and the generic 'antidepressant' treatmentname as specified. It also groups by patientunitstayid rather than uniquepid, thus altering the fundamental logic of which patients are counted and how. Fixing this would require changing the primary table, the grouping key, and the condition, which is more than a localized adjustment.",
            "error_type": "Global: wrong-table error"
        },
        "3a8fb984bbdae02fefa70866": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the name of the medication that patient 006-106259 received two or more times on the current hospital visit?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, COUNT( medication.drugstarttime ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106259' AND patient.hospitaldischargetime IS NULL ) ) GROUP BY medication.drugname ) AS T1 WHERE T1.C1 >= 2",
            "pred_sql": "SELECT DISTINCT T2.drugname FROM patient AS T1 INNER JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '006-106259' AND T1.hospitaldischargetime IS NULL -- current hospital visit GROUP BY T2.drugname, T2.routeadmin HAVING COUNT(T2.medicationid) >= 2;",
            "gold_answer": "[['duoneb 3 mg-0.5 mg/3 ml ud inh soln'], ['lisinopril 10 mg tab'], ['metoprolol tartrate 25 mg tab']]",
            "pred_answer": "[['azithromycin 500 mg in ns 250 ml iv'], ['clopidogrel 75 mg tab'], ['duoneb 3 mg-0.5 mg/3 ml ud inh soln'], ['duoneb 3 mg-0.5 mg/3 ml ud inh soln'], ['enoxaparin 40 mg/0.4 ml syr'], ['famotidine 20 mg tab'], ['lisinopril 10 mg tab'], ['lisinopril 10 mg tab'], ['methylprednisolone 40 mg inj'], ['metoprolol tartrate 25 mg tab'], ['metoprolol tartrate 25 mg tab'], ['prednisone 20 mg tab'], ['vancomycin 1 gm in ns 250 ml ivpb'], ['vancomycin 750 mg in ns 250 ml ivpb']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only differs in its GROUP BY clause: it groups by both drugname and routeadmin, then SELECTs only drugname (with DISTINCT). This splitting by route makes counts incorrect and duplicates appear, but it doesn\u2019t change the tables joined or the overall query structure. It\u2019s a localized mistake in the GROUP BY, so it\u2019s a local error.",
            "error_type": "Local: grouping error"
        },
        "b133ec5f24c3cd166147709c": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the 3-month survival rate for patients diagnosed with gi obstruction / ileus - small bowel obstruction?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'gi obstruction / ileus - small bowel obstruction' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "WITH diagnosed_patients AS ( SELECT p.uniquepid, p.hospitaldischargestatus, MIN(d.diagnosistime) AS first_diagnosis_time FROM patient p JOIN diagnosis d ON p.patientunitstayid = d.patientunitstayid WHERE d.diagnosisname = 'gi obstruction / ileus - small bowel obstruction' GROUP BY p.uniquepid, p.hospitaldischargestatus ) SELECT COUNT(CASE WHEN (hospitaldischargestatus = 'expired' AND datetime(hospitaldischargetime) <= datetime(first_diagnosis_time, '+91 days')) THEN NULL ELSE 1 END) / COUNT(1) AS survival_rate FROM diagnosed_patients;",
            "gold_answer": "[['0.833']]",
            "pred_answer": "no such column: hospitaldischargetime",
            "is_correct": false,
            "reasoning": "The predicted SQL references the column hospitaldischargetime in the outer SELECT, but that column is not selected in the diagnosed_patients CTE. This is a simple column reference error that can be fixed by including hospitaldischargetime in the CTE, without altering the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "e18271222fca09e96024c7ae": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "List the top four most frequent specimens that patients are tested within the same month after receiving glucocorticoid administration this year.",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'glucocorticoid administration' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.culturetakentime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.culturetakentime,'start of month') GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH ranked_specs AS ( SELECT l.labname, COUNT(*) AS count_specimen, DENSE_RANK() OVER (ORDER BY COUNT(*) DESC) AS rank_specimen FROM medication m JOIN lab l ON m.patientunitstayid = l.patientunitstayid WHERE m.drugname LIKE '%cortisone%' OR m.drugname LIKE '%prednisone%' OR m.drugname LIKE '%dexamethasone%' OR m.drugname LIKE '%hydrocortisone%' AND strftime('%Y-%m', m.drugstarttime) = strftime('%Y-%m', l.labresulttime) AND strftime('%Y', m.drugstarttime) = '2100' GROUP BY l.labname ) SELECT labname FROM ranked_specs WHERE rank_specimen <= 4;",
            "gold_answer": "[['sputum, tracheal specimen']]",
            "pred_answer": "[['bedside glucose'], ['creatinine'], ['glucose'], ['potassium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication and lab tables instead of the treatment and microlab tables, matches generic steroid drug names rather than the specific 'glucocorticoid administration' treatment name, and counts lab tests rather than culture specimens. It also misplaces the time relationship (using same-month but not ensuring culture occurs after treatment) and entirely alters the query\u2019s structure and intended relationships. This is not a simple typo or clause mistake but a fundamental change in tables, joins, and logic.",
            "error_type": "Global: incorrect tables and join logic"
        },
        "d83e7ab0c5e37663deb01e91": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "On the current hospital visit, how many hours have passed since the first time patient 025-10477 was prescribed 1000 ml : sodium chloride 0.9 % 0.9 % iv solp?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',medication.drugstarttime) ) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-10477' ) AND patient.hospitaldischargetime IS NULL ) AND medication.drugname = '1000 ml : sodium chloride 0.9 % 0.9 % iv solp' ORDER BY medication.drugstarttime ASC LIMIT 1",
            "pred_sql": "SELECT p.uniquepid, MIN(m.drugstarttime) AS first_prescription_time, ROUND((strftime('%s', '2100-12-31 23:59:00') - strftime('%s', MIN(m.drugstarttime))) / 3600, 0) AS hours_since_first_prescription FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '025-10477' AND p.hospitaldischargetime IS NULL AND m.drugname LIKE '%sodium chloride 0.9% 1000 ml iv soln%' GROUP BY p.uniquepid;",
            "gold_answer": "[['41.483']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses an incorrect LIKE pattern for the drugname, so no rows are returned. The mistake is localized to the WHERE clause\u2019s string matching of the drug name, and does not affect the overall query structure or logic.",
            "error_type": "Local: value parsing error"
        },
        "68d554a0eb8d6e33f7c18e04": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the patient count for 500 ml flex cont excel : sodium chloride 0.9 % iv soln prescription since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid = ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = '500 ml flex cont excel : sodium chloride 0.9 % iv soln' AND strftime('%Y',medication.drugstarttime) >= '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) AS patient_count FROM medication WHERE drugname = '500 ml flex cont excel : sodium chloride 0.9 % iv soln' AND drugstarttime >= '2100-01-01';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['5.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts distinct patientunitstayid directly from the medication table, whereas the ground truth counts distinct patient.uniquepid by first identifying the relevant patientunitstayid via a subquery on medication and then querying the patient table. This mistake changes the query\u2019s overall logic\u2014counting ICU/stay records instead of unique patients\u2014and requires restructuring the query (adding a join or subquery to map unit stays to unique patients). Therefore, it is not a localized syntax issue but a fundamental logical error in the query structure.",
            "error_type": "Global: aggregation-logic error"
        },
        "7e8eb77494306257f1f762c2": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How many hours have elapsed since the first time on the current hospital visit that patient 012-10585 was diagnosed with pneumonia?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) ) FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-10585' AND patient.hospitaldischargetime IS NULL ) ) AND diagnosis.diagnosisname = 'pneumonia' ORDER BY diagnosis.diagnosistime ASC LIMIT 1",
            "pred_sql": "SELECT ROUND((strftime('%s', '2100-12-31 23:59:00') - strftime('%s', (SELECT MIN(d.diagnosistime) FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '012-10585' AND d.diagnosisname = 'pneumonia' AND p.hospitaldischargetime IS NULL))) / 3600) AS hours_since_diagnosis;",
            "gold_answer": "[['97.367']]",
            "pred_answer": "[['97.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL follows the same overall logic\u2014finding the first pneumonia diagnosis for the current hospital stay of patient '012-10585' and computing the hours elapsed until the fixed current time. The only substantive difference is that it uses UNIX timestamps and ROUND to return an integer number of hours (97.0) rather than the fractional hours (97.367) produced by the ground\u2010truth\u2019s Julian day calculation. This is a localized mistake in how the time difference is formatted (rounding off the decimal part) rather than a flaw in the query\u2019s structure or joins.",
            "error_type": "Local: value rounding error"
        },
        "66093ba08255a2b508004b34": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Calculate the number of patients who were given sodium phosphate prescription within the same hospital visit following their exploratory laparotomy.",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'exploratory laparotomy' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'sodium phosphate' ) AS T2 WHERE T1.treatmenttime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT p.patientunitstayid) AS num_patients FROM patient p INNER JOIN diagnosis d ON p.patienthealthsystemstayid = d.patienthealthsystemstayid INNER JOIN medication m ON p.patienthealthsystemstayid = m.patienthealthsystemstayid WHERE d.diagnosisname LIKE '%exploratory laparotomy%' AND m.drugname LIKE '%sodium phosphate%' AND m.drugstarttime > d.diagnosistime;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: d.patienthealthsystemstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it refers to a non\u2010existent column d.patienthealthsystemstayid in the diagnosis table. This is a simple column reference error within the JOIN/WHERE clause and does not affect the overall query structure or logic beyond that misreference. Hence it is a local error.",
            "error_type": "Local: table/column reference error"
        },
        "52c3e4197877ebed571489ef": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the number of patients who were prescribed pneumococcal polysaccharides since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid = ( SELECT medication.patientunitstayid FROM medication WHERE medication.drugname = 'pneumococcal polysaccharides' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE m.drugname = 'pneumococcal polysaccharides' AND m.drugstarttime >= '2099-12-31 23:59:00';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground\u2010truth only in the WHERE clause\u2019s time condition: it hardcodes '2099-12-31 23:59:00' instead of using the required datetime expression datetime('2100-12-31 23:59:00','-1 year') as per the SQL assumptions. This is a localized mistake in the date literal/formatting and does not require reworking the JOINs or overall query structure.",
            "error_type": "Local: incorrect date literal"
        },
        "eda63f3824496fdde6aee946": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How long has it been in days since the last time 37.5 g tube : dextrose (diabetic use) 40 % po gel was prescribed to patient 016-10029 on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',medication.drugstarttime) ) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10029' ) AND patient.hospitaldischargetime IS NULL ) AND medication.drugname = '37.5 g tube : dextrose (diabetic use) 40 % po gel' ORDER BY medication.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', T1.drugstarttime)) / 86400 AS days_since_last_prescription FROM patient INNER JOIN medication AS T1 ON patient.patientunitstayid = T1.patientunitstayid WHERE patient.uniquepid = '016-10029' AND patient.hospitaldischargetime IS NULL AND T1.drugname = '37.5 g tube : dextrose (diabetic use) 40 % po gel' ORDER BY T1.drugstarttime DESC LIMIT 1;",
            "gold_answer": "[['6.089']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs only in how it computes the day difference: it uses UNIX-second timestamps divided by 86400, which truncates fractional days to an integer, rather than using Julian day difference (strftime('%J')) as in the ground truth. All other parts of the query (joins, filters, ordering, and limits) correctly target the same patient and drug on the current hospital visit. This is a localized mistake in the time-difference calculation and does not require restructuring the query\u2019s overall logic.",
            "error_type": "Local: other-temporal error"
        },
        "af68cfb7669d83903df2e7b1": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Tell me the total volume of input for patient 033-10044 on the current icu visit.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '033-10044' ) AND patient.unitdischargetime IS NULL ) AND intakeoutput.cellpath LIKE '%intake%'",
            "pred_sql": "SELECT SUM(DISTINCT io.cellvaluenumeric) AS total_input_volume FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '033-10044' AND p.unitdischargetime IS NULL AND io.cellpath LIKE '%intake%' AND io.cellpath NOT LIKE '%output%' ;",
            "gold_answer": "[['2170.0']]",
            "pred_answer": "[['1970.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the ground truth only in the SELECT clause by using SUM(DISTINCT io.cellvaluenumeric) instead of SUM(io.cellvaluenumeric). This change in aggregation is a localized mistake in the SELECT expression: it removes duplicate values before summation, leading to an incorrect total. The JOIN conditions, filtering for the current ICU stay, and the intake filter are all correct. Since the error is confined to the aggregate function in the SELECT clause and does not affect the overall query structure or table relationships, it is a local error.",
            "error_type": "Local: incorrect aggregation in SELECT"
        },
        "5fe8240c72712d70d057790d": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How many patients had a diagnosis of hypomagnesemia in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'hypomagnesemia' AND strftime('%Y',diagnosis.diagnosistime) = '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT p.patientunitstayid) AS number_of_patients FROM patient p JOIN diagnosis d ON p.patientunitstayid = d.patientunitstayid WHERE d.diagnosisname = 'hypomagnesemia' AND strftime('%Y', d.diagnosistime) = '2100';",
            "gold_answer": "[['22.0']]",
            "pred_answer": "[['24.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts DISTINCT p.patientunitstayid (unique stays) instead of DISTINCT p.uniquepid (unique patients). This is a column reference mistake in the SELECT clause that leads to counting stays rather than patients, resulting in an inflated count. The overall query structure and logic remain correct; only the referenced column needs to be changed.",
            "error_type": "Local: column reference error"
        },
        "81131ba93ea7e3e5e2d9bf82": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How many days has it been since patient 025-1000's last stay in ward 908 on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '025-1000' AND patient.wardid = 908 AND patient.hospitaldischargetime IS NULL ORDER BY patient.unitadmittime DESC LIMIT 1",
            "pred_sql": "SELECT (strftime('%J', '2100-12-31 23:59:00') - strftime('%J', p.unitdischargetime)) AS days_since_last_stay FROM patient p WHERE p.uniquepid = '025-1000' AND p.wardid = 908 ORDER BY p.unitadmittime DESC LIMIT 1;",
            "gold_answer": "[['9.574']]",
            "pred_answer": "[['6.167']]",
            "is_correct": false,
            "reasoning": "The predicted query fails to restrict to the current hospital visit (it never filters WHERE hospitaldischargetime IS NULL) and furthermore subtracts the Julian day of unitdischargetime instead of unitadmittime. These mistakes change the overall set of rows considered and the core date calculation, so fixing it requires altering both the WHERE clause logic and the SELECT expression. This is not a simple typo or local syntax fix but a fundamental logic error across clauses.",
            "error_type": "Global: incorrect filter and column usage"
        },
        "a75bc868e8e28198c8b93ff2": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the length of the first hospital stay in days for patient 022-101650?",
            "gold_sql": "SELECT strftime('%J',patient.hospitaldischargetime) - strftime('%J',patient.hospitaladmittime) FROM patient WHERE patient.uniquepid = '022-101650' AND patient.hospitaladmittime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%j', hospitaldischargetime) - strftime('%j', hospitaladmittime)) + 1 AS length_of_stay FROM patient WHERE uniquepid = '022-101650' AND hospitaldischargetime IS NOT NULL;",
            "gold_answer": "[['0.747']]",
            "pred_answer": "[['1.747']]",
            "is_correct": false,
            "reasoning": "The predicted SQL miscalculates the length of stay by using strftime('%j') (day\u2010of\u2010year) instead of strftime('%J') (Julian day number) and then arbitrarily adds +1. This is an error localized to the date arithmetic in the SELECT clause. The overall query structure (table, WHERE clause) remains intact.",
            "error_type": "Local: other\u2010temporal error"
        },
        "943bc16041b3fcf7d4976352": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the last ward that patient 002-10157 stayed in on the last hospital visit?",
            "gold_sql": "SELECT patient.wardid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10157' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ORDER BY patient.unitadmittime DESC LIMIT 1",
            "pred_sql": "SELECT wardid FROM patient WHERE uniquepid = '002-10157' AND hospitaladmittime = (SELECT MAX(hospitaladmittime) FROM patient WHERE uniquepid = '002-10157');",
            "gold_answer": "[['93.0']]",
            "pred_answer": "[['93.0'], ['93.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL picks rows where hospitaladmittime is the maximum for that patient, rather than first identifying the last completed hospital visit (using hospitaldischargetime) and then selecting the last ward within that visit (using unitadmittime). It fails to filter on hospitaldischargetime IS NOT NULL and does not retrieve the ward with the maximum unitadmittime for that specific visit. This is not a simple typo or single\u2010clause fix but a flaw in the overall query logic and structure, requiring reworking the visit identification and ward selection steps.",
            "error_type": "Global: incorrect visit and ward selection logic"
        },
        "131699dc7495ab5b40aa2d69": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the name of the specimen test that was last given to patient 025-10060 on the last hospital visit?",
            "gold_sql": "SELECT microlab.culturesite FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-10060' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) ORDER BY microlab.culturetakentime DESC LIMIT 1",
            "pred_sql": "SELECT lab.labname FROM lab WHERE lab.patientunitstayid = ( SELECT p.patientunitstayid FROM patient p WHERE p.uniquepid = '025-10060' ORDER BY p.hospitaladmittime DESC LIMIT 1 ) ORDER BY lab.labresulttime DESC LIMIT 1;",
            "gold_answer": "[['sputum, expectorated']]",
            "pred_answer": "[['paco2']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the lab table instead of the microlab table to retrieve the specimen test name, and it fails to enforce the discharge condition for selecting the last hospital visit. This is not a minor syntax or column reference fix but a fundamental misselection of the source table and join logic, altering the intended meaning of the query.",
            "error_type": "Global: join/table selection error"
        },
        "51f6daf8480d7c0ebaa6546b": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Keep count of how many times patient 027-101164 outputted urine since 02/2100.",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-101164' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine' AND strftime('%Y-%m',intakeoutput.intakeoutputtime) >= '2100-02'",
            "pred_sql": "SELECT COUNT(*) FROM intakeoutput JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.patient = '027-101164' AND celllabel = 'urine' AND datetime(intakeoutputtime) >= datetime('2100-02-01');",
            "gold_answer": "[['31.0']]",
            "pred_answer": "no such column: patient.patient",
            "is_correct": false,
            "reasoning": "The predicted SQL refers to a non-existent column patient.patient instead of using the correct column (e.g., patient.uniquepid or joining via patienthealthsystemstayid), causing a simple column reference error. This is localized to the WHERE clause and doesn\u2019t alter the overall query logic.",
            "error_type": "Local: table/column reference error"
        },
        "ec8b06d3d0d215017406de8d": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the maximum -monos value for patient 004-16896 last month?",
            "gold_sql": "SELECT MAX(lab.labresult) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-16896' ) ) AND lab.labname = '-monos' AND datetime(lab.labresulttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month')",
            "pred_sql": "SELECT MAX(v.systemicmean) AS max_monos FROM vitalperiodic v JOIN patient p ON v.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '004-16896' AND strftime('%Y-%m', v.observationtime) = '2100-11';",
            "gold_answer": "[['8.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally misinterprets the question by querying the vitalperiodic table for systemicmean rather than the lab table for the '-monos' lab result. It also applies an incorrect time filter (using strftime('%Y-%m') = '2100-11' instead of the specified start-of-month filter) and fails to link through the patienthealthsystemstayid hierarchy. These are not localized typos or minor clause fixes but a complete mis-structuring of the query logic, table selection, and time filtering.",
            "error_type": "Global: incorrect table join and logic"
        },
        "1f665d965c0a35901cd6f9f6": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Count the number of times that patient 007-10182 received the stress ulcer treatment procedure since 2100.",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10182' ) ) AND treatment.treatmentname = 'stress ulcer treatment' AND strftime('%Y',treatment.treatmenttime) >= '2100'",
            "pred_sql": "SELECT COUNT(t.treatmentid) AS count_stress_ulcer_treatments FROM patient p JOIN treatment t ON p.patientunitstayid = t.patientunitstayid WHERE p.uniquepid = '007-10182' AND t.treatmentname = 'stress ulcer treatment - omeprazole' AND t.treatmenttime >= '2100-01-01 00:00:00';",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses an incorrect treatment name filter ('stress ulcer treatment - omeprazole' instead of 'stress ulcer treatment'). The JOIN, date filter, and overall structure are correct and align with the intent, but the specific WHERE condition on treatmentname is wrong. This is a confined mistake in a single clause and does not affect the broader query logic.",
            "error_type": "Local: incorrect literal in WHERE clause"
        },
        "478c3255e0407d25b4d06849": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "In total, what was the input amount of zosyn that patient 005-10238 received on 03/26/this year?",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-10238' ) ) AND intakeoutput.celllabel = 'zosyn' AND intakeoutput.cellpath LIKE '%intake%' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '03-26'",
            "pred_sql": "SELECT SUM(CAST(SUBSTR(T2.dosage, 0, INSTR(T2.dosage, ' ') - 1) AS REAL)) AS total_zosyn_input FROM patient AS T1 INNER JOIN medication AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '005-10238' AND T2.drugname LIKE '%zosyn%' AND DATE(T2.drugstarttime) = '2100-03-26';",
            "gold_answer": "[['250.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL retrieves data from the medication table (joining patient to medication and using drugstarttime and dosage) rather than from the intakeoutput table with celllabel = 'zosyn' and cellpath LIKE '%intake%'. This is not a simple column or date formatting mistake; it fundamentally changes the source of data and the logic of the query. Fixing it requires restructuring the query to use intakeoutput instead of medication and applying the proper filters, so it is a global error.",
            "error_type": "Global: incorrect table/join error"
        },
        "91bea95ae8d28879a583b9d7": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the total cost for patient 011-10149's hospital stay?",
            "gold_sql": "SELECT SUM(cost.cost) FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '011-10149' )",
            "pred_sql": "SELECT SUM(DISTINCT c.cost) AS total_cost FROM patient p JOIN cost c ON p.patienthealthsystemstayid = c.patienthealthsystemstayid WHERE p.uniquepid = '011-10149';",
            "gold_answer": "[['530.59']]",
            "pred_answer": "[['355.51']]",
            "is_correct": false,
            "reasoning": "The predicted SQL incorrectly applies DISTINCT within the SUM aggregation, summing only unique cost values rather than all cost entries for the patient's stay. This mistake is confined to the SELECT clause's aggregate function and does not involve changes to the overall query structure or logic (joins and filters are correct). Hence, it is a localized error in the aggregate function.",
            "error_type": "Local: incorrect use of DISTINCT in SUM"
        },
        "74ea0cbd79ce583aa647a2d5": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Count the number of patients that were admitted to the hospital since 1 year ago.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE datetime(patient.hospitaladmittime) >= datetime('2100-12-31 23:59:00','-1 year')",
            "pred_sql": "SELECT COUNT(DISTINCT patienthealthsystemstayid) FROM patient WHERE hospitaladmittime >= datetime('2100-12-31 23:59:00', '-1 year');",
            "gold_answer": "[['1384.0']]",
            "pred_answer": "[['1542.0']]",
            "is_correct": false,
            "reasoning": "The predicted query uses COUNT(DISTINCT patienthealthsystemstayid) instead of COUNT(DISTINCT patient.uniquepid). This is simply the wrong column reference for distinct patients (it counts stays rather than unique patients) but doesn\u2019t alter the overall structure or logic of the query beyond that one column. Hence it\u2019s a local column reference error.",
            "error_type": "Local: column-reference error"
        },
        "6d7e48a3d6e297467b1e7db0": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the drug that was prescribed to patient 007-10111 within 2 days after the ercp on the first hospital visit?",
            "gold_sql": "SELECT T2.drugname FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10111' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) AND treatment.treatmentname = 'ercp' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10111' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.treatmenttime) AND datetime(T1.treatmenttime,'+2 day')",
            "pred_sql": "SELECT M.drugname FROM patient P JOIN treatment T ON P.patientunitstayid = T.patientunitstayid JOIN medication M ON P.patientunitstayid = M.patientunitstayid WHERE P.uniquepid = '007-10111' AND T.treatmentname LIKE '%erpc%' AND M.drugstarttime >= T.treatmenttime AND M.drugstarttime <= datetime(T.treatmenttime, '+2 days') AND P.hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '007-10111' );",
            "gold_answer": "[['albuterol'], ['albuterol'], ['aspart insulin'], ['colace'], ['colace'], ['dextrose 50%'], ['dextrose 50%'], ['dextrose 50%'], ['dextrose 50%'], ['dilaudid'], ['dilaudid'], ['dilaudid'], ['dilaudid'], ['dulcolax laxative'], ['fentanyl'], ['fentanyl'], ['glucagen'], ['glucagen'], ['lasix'], ['lasix'], ['lidocaine'], ['lidocaine'], ['milk of magnesia'], ['oxycodone'], ['oxycodone'], ['oxycodone'], ['oxycodone'], ['oxycodone'], ['phenylephrine'], ['phenylephrine'], ['piperacillin-tazobactam'], ['piperacillin-tazobactam'], ['piperacillin-tazobactam'], ['piperacillin-tazobactam'], ['piperacillin-tazobactam'], ['piperacillin-tazobactam'], ['propofol'], ['propofol'], ['rocuronium'], ['rocuronium'], ['succinylcholine'], ['succinylcholine'], ['tylenol'], ['vancomycin'], ['vancomycin'], ['vancomycin'], ['vancomycin'], ['vancomycin'], ['zofran']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally alters the intended logic in several places rather than just fixing a minor typo.  First, it joins treatment and medication on patientunitstayid instead of using the hospital\u2010level patienthealthsystemstayid, changing the scope from a hospital visit to an ICU stay.  Second, it filters the earliest visit by comparing hospitaladmittime only, omitting the hospitaldischargetime IS NOT NULL condition, which breaks the \u201cfirst completed hospital visit\u201d requirement.  Third, it uses a LIKE '%erpc%' filter (misspelling the treatment name) and even misuses the SQLite datetime modifier '+2 days' instead of '+2 day'.  All of these issues require restructuring the joins and filtering logic, so the error is global.",
            "error_type": "Global: join-relationship error"
        },
        "043d8bebfcf620d4a94036f0": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Since patient 022-1011's admission in the icu, how many hours have elapsed?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '022-1011' AND patient.unitdischargetime IS NULL",
            "pred_sql": "SELECT ROUND( ( strftime('%s', '2100-12-31 23:59:00') - strftime('%s', patient.unitadmittime) ) / 3600 ) AS hours_since_icu_admission FROM patient WHERE uniquepid = '022-1011';",
            "gold_answer": "[['787.333']]",
            "pred_answer": "[['787.0']]",
            "is_correct": false,
            "reasoning": "The predicted query omits the critical WHERE condition \"patient.unitdischargetime IS NULL\" that restricts to the current ICU admission. This missing filter changes the overall logic of the query (it could include past admissions or discharged records), and thus it is not a simple syntax or localized error but a global logic error.",
            "error_type": "Global: missing-current-admission-filter"
        },
        "f4edb21f87ce00914040c235": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "How many hours have passed since the first time patient 004-11678 underwent a procedure on the current hospital visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-11678' AND patient.hospitaldischargetime IS NULL ) ) ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT ROUND((strftime('%s', '2100-12-31 23:59:00') - strftime('%s', ( SELECT MIN(treatmenttime) FROM treatment WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '004-11678' AND hospitaldischargetime IS NULL ) )) / 3600) ) AS hours_since_first_procedure;",
            "gold_answer": "[['150.55']]",
            "pred_answer": "[['4132832563.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL is making a mistake solely in the arithmetic expression inside the SELECT clause \u2013 it divides only the second timestamp by 3600 instead of dividing the overall difference, and misplaces the parentheses. The table references, WHERE filtering and subqueries are otherwise correct for the current hospital visit. This is a localized error in the computation of hours, not a flaw in the overall query structure or joins. Therefore, it is a Local error.",
            "error_type": "Local: temporal arithmetic error"
        },
        "a63f998370bbc0b3359e838b": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "List the top four most frequent diagnoses that patients are diagnosed with within the same hospital visit after receiving inotropic agent - epinephrine > 0.1 micrograms/kg/min this year.",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'inotropic agent - epinephrine > 0.1 micrograms/kg/min' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.diagnosistime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT diagnosisname FROM diagnosis WHERE patientunitstayid IN ( SELECT m.patientunitstayid FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE m.drugname = 'inotropic agent - epinephrine' AND (CAST(SUBSTR(m.dosage, 1, INSTR(m.dosage, ' ') - 1) AS REAL) / p.admissionweight) > 0.1 AND STRFTIME('%Y', p.hospitaladmittime) = '2100' AND m.drugstarttime < diagnosistime ) GROUP BY diagnosisname ORDER BY COUNT(diagnosisname) DESC LIMIT 4;",
            "gold_answer": "[['s/p cabg < 7 days'], ['valve replacement < 7days - aortic']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic by using the medication table instead of the treatment table, miscomputing the dosage condition, filtering by hospital admission year rather than treatment/diagnosis times, and failing to join on the same patienthealthsystemstayid to ensure diagnoses occur within the same visit. These errors span multiple clauses and alter the intended data relationships, requiring a complete restructuring of the query logic rather than a localized fix.",
            "error_type": "Global: incorrect table usage and join logic"
        },
        "fb0def8c2f5978a67d16803e": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "When was the last time that patient 007-10459 was prescribed nacl 0.9% adv and vancomycin in 05/2100 at the same time?",
            "gold_sql": "SELECT T1.drugstarttime FROM ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10459' ) AND medication.drugname = 'vancomycin' AND strftime('%Y-%m',medication.drugstarttime) = '2100-05' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10459' ) AND medication.drugname = 'nacl 0.9% adv' AND strftime('%Y-%m',medication.drugstarttime) = '2100-05' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) ORDER BY T1.drugstarttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(m1.drugstarttime) AS last_prescription_time FROM patient JOIN medication m1 ON patient.patientunitstayid = m1.patientunitstayid JOIN medication m2 ON m1.patientunitstayid = m2.patientunitstayid WHERE patient.patientidentifier = '007-10459' AND m1.drugname = 'nacl 0.9% adv' AND m2.drugname = 'vancomycin' AND m1.drugstarttime < m2.drugstoptime AND m2.drugstarttime < m1.drugstoptime AND strftime('%Y-%m', m1.drugstarttime) = '2100-05' AND strftime('%Y-%m', m2.drugstarttime) = '2100-05';",
            "gold_answer": "[['2100-05-22 05:44:00']]",
            "pred_answer": "no such column: patient.patientidentifier",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references patient.patientidentifier, which does not exist in the schema (the correct column is patient.uniquepid). This is a simple column naming mistake localized to the WHERE clause and can be fixed without altering the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "7001d255e38191c3413f86a2": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Since patient 013-10167's first stay in ward 549 on the current hospital visit, how many hours have passed?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '013-10167' AND patient.wardid = 549 AND patient.hospitaldischargetime IS NULL ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', (SELECT MIN(unitadmittime) FROM patient WHERE uniquepid = '013-10167' AND wardid = 549))) / 3600 AS hours_passed ;",
            "gold_answer": "[['339.582']]",
            "pred_answer": "[['339.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict to the current hospital visit (hospitaldischargetime IS NULL) and to the first ward stay on that visit. Instead, it simply takes the global minimum unitadmittime for that patient and ward, ignoring the hospital discharge filter. This changes the overall query logic and requires restructuring beyond a single clause fix.",
            "error_type": "Global: logical-structure error"
        },
        "51ffc81f1b89c620543bf91b": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Among patients diagnosed with hypercoagulable state, what are the top five most common lab tests conducted within the same hospital visit since 1 year ago?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypercoagulable state' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime, patient.patienthealthsystemstayid FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.labresulttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT lab.labname FROM patient INNER JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid INNER JOIN lab ON patient.patientunitstayid = lab.patientunitstayid WHERE diagnosis.diagnosisname = 'hypercoagulable state' AND lab.labresulttime >= '2099-12-31 23:59:00' GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['anion gap'], ['bicarbonate'], ['bun'], ['calcium'], ['chloride'], ['creatinine'], ['glucose'], ['hct'], ['hgb'], ['mch'], ['mchc'], ['mcv'], ['platelets x 1000'], ['potassium'], ['ptt'], ['rdw'], ['sodium'], ['wbc x 1000']]",
            "pred_answer": "[['chloride'], ['creatinine'], ['glucose'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters labs by date and groups by labname, but it never restricts diagnoses to the 1-year window nor enforces that the lab occurred after the diagnosis. It also omits the datetime comparison between diagnosis.diagnosistime and lab.labresulttime. These omissions fundamentally change the query logic and results, requiring changes across WHERE and JOIN clauses rather than a simple localized fix.",
            "error_type": "Global: join and filter logic error"
        },
        "e978805c9c431a4af765f712": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the total number of patients who were discharged from the hospital this year?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NOT NULL AND datetime(patient.hospitaldischargetime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year')",
            "pred_sql": "SELECT COUNT(*) FROM patient WHERE STRFTIME('%Y', hospitaldischargetime) = '2100';",
            "gold_answer": "[['1367.0']]",
            "pred_answer": "[['1758.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses COUNT(*) instead of COUNT(DISTINCT patient.uniquepid) and does not explicitly check for hospitaldischargetime IS NOT NULL. This is a localized mistake in the aggregation and DISTINCT usage rather than a structural or multi-clause logic error. The overall query structure and filtering logic remain intact, but the aggregation is incorrect.",
            "error_type": "Local: aggregation error"
        },
        "40448499d12131f2f43e9143": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "On the last hospital visit, what was patient 016-10349's last weight measurement?",
            "gold_sql": "SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '016-10349' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) AND patient.admissionweight IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1",
            "pred_sql": "SELECT dischargeweight FROM patient WHERE uniquepid = '016-10349' ORDER BY hospitaladmittime DESC LIMIT 1;",
            "gold_answer": "[['121.56']]",
            "pred_answer": "[['121.6']]",
            "is_correct": false,
            "reasoning": "The predicted SQL selects the wrong column (dischargeweight) instead of the required admissionweight. This is a localized mistake in the SELECT clause\u2019s column reference and does not affect the overall query structure or logic.",
            "error_type": "Local: column reference error"
        },
        "7c21a831254af88eb13b28b7": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Can you get me the top three diagnoses that have the highest 6-month mortality rate?",
            "gold_sql": "SELECT T4.diagnosisname FROM ( SELECT T3.diagnosisname, DENSE_RANK() OVER ( ORDER BY T3.C2 ASC ) AS C2 FROM ( SELECT T2.diagnosisname, AVG(C1) AS C2 FROM ( SELECT T1.diagnosisname, ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 2 THEN 0 ELSE 1 END ) as C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 2 GROUP BY patient.uniquepid, diagnosis.diagnosisname HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid ) AS T2 GROUP BY T2.diagnosisname ) AS T3 ) AS T4 WHERE T4.C2 <= 3",
            "pred_sql": "WITH mortality AS ( SELECT d.diagnosisname, COUNT(CASE WHEN p.hospitaldischargestatus = 'expired' AND p.hospitaldischargetime <= DATE(d.diagnosistime, '+182 day') THEN 1 END) AS deaths, COUNT(*) AS total FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid GROUP BY d.diagnosisname ) SELECT diagnosisname, CAST(deaths AS REAL) / total AS mortality_rate FROM mortality ORDER BY mortality_rate DESC LIMIT 3;",
            "gold_answer": "[['anuria'], ['ards - pulmonary etiology'], ['av block - pacemaker in place, pacing and capturing'], ['bacteremia - gram negative rod'], ['bacteremia - respiratory source'], ['cardiac arrest - initial rhythm: pulseless electrical activity'], ['cardiac arrest - initial rhythm: ventricular tachycardia'], ['cardiac arrest - un-witnessed'], ['cholecystitis - acute'], ['dvt - left upper extremity'], ['dvt - right upper extremity'], ['encephalopathy - toxic'], ['facial bone fracture - maxillary fracture'], ['facial bone fracture - orbital fracture'], ['gastric ca'], ['hyperglycemia - corticosteroid related'], ['hypernatremia - moderate (146 - 155 meq/dl)'], ['hypokalemia - moderate ( 2.8 - 3.5 meq/dl)'], ['hypothermia'], ['liver ca'], ['melanoma - nodular'], ['mouth and jaw tumor - oral cavity squamous cell ca'], ['peripheral vascular ischemia - atherosclerotic thrombo-occlusion'], ['peripheral vascular ischemia - postoperative'], ['pleural effusion - due to heart failure'], ['pneumothorax - spontaneous'], ['seizures - from ischemia/infarction'], ['sepsis - sepsis with single organ dysfunction- circulatory system failure'], ['shock, etiology unclear'], ['valve repair >= 7 days - aortic / mitral'], ['vascular insufficiency of intestine - due to extrinsic compression'], ['ventricular tachycardia - with hemodynamic compromise']]",
            "pred_answer": "[['acute copd exacerbation - with baseline hypoxemia', '1.0'], ['anal ca', '1.0'], ['anuria', '1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the logic for computing 6-month mortality: it counts all diagnosis rows (not first diagnoses per patient), does not filter out diagnoses within the last six months (so some patients lack full follow-up), and aggregates raw counts of events rather than computing the patient-level survival rate as specified. It also returns both the rate and name and orders by deaths/total, rather than ranking by average survival and selecting the top three diagnoses. Fixing this requires reworking multiple clauses (subquery, filtering by time, grouping, ranking), not just a minor tweak. Therefore this is a global error.",
            "error_type": "Global: incorrect mortality calculation and grouping logic"
        },
        "6e9ba38f419c202ab212ef98": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Compared to yesterday, what new drugs are present in the prescription of patient 015-100025 today?",
            "gold_sql": "SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '015-100025' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day') EXCEPT SELECT medication.drugname FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.uniquepid = '015-100025' ) AND datetime(medication.drugstarttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-1 day')",
            "pred_sql": "SELECT DISTINCT m1.drugname FROM medication m1 JOIN patient p1 ON m1.patientunitstayid = p1.patientunitstayid WHERE p1.uniquepid = '015-100025' AND datetime(m1.drugstarttime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of day', '-0 day') AND m1.drugname NOT IN ( SELECT DISTINCT m2.drugname FROM medication m2 JOIN patient p2 ON m2.patientunitstayid = p2.patientunitstayid WHERE p2.uniquepid = '015-100025' AND datetime(m2.drugstarttime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of day', '-1 day') );",
            "gold_answer": "[['1 ml : heparin sodium (porcine) 5000 unit/ml ij soln'], ['1 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['100 ml flex cont : sodium chloride 0.9 % iv soln'], ['acetaminophen 325 mg po tabs'], ['alteplase 2 mg ij solr'], ['aspirin 81 mg po chew'], ['atorvastatin calcium 40 mg po tabs'], ['carvedilol 25 mg po tabs'], ['diphenhydramine hcl 25 mg po caps'], ['famotidine 20 mg po tabs'], ['nitroglycerin 0.4 mg sl subl'], ['oxycodone hcl 5 mg po tabs'], ['prednisone 10 mg po tabs'], ['prednisone 20 mg po tabs'], ['prednisone 5 mg po tabs'], ['sodium chloride 0.9 % ij soln']]",
            "pred_answer": "[['1 ml : heparin sodium (porcine) 5000 unit/ml ij soln'], ['1 ml vial : heparin sodium (porcine) 1000 unit/ml ij soln'], ['100 ml flex cont : sodium chloride 0.9 % iv soln'], ['100 ml flex cont : sodium chloride 0.9 % iv soln'], ['acetaminophen 325 mg po tabs'], ['alteplase 2 mg ij solr'], ['aspirin 81 mg po chew'], ['atorvastatin calcium 40 mg po tabs'], ['carvedilol 25 mg po tabs'], ['diphenhydramine hcl 25 mg po caps'], ['famotidine 20 mg po tabs'], ['nitroglycerin 0.4 mg sl subl'], ['oxycodone hcl 5 mg po tabs'], ['prednisone 10 mg po tabs'], ['prednisone 20 mg po tabs'], ['prednisone 5 mg po tabs'], ['sodium chloride 0.9 % ij soln']]",
            "is_correct": false,
            "reasoning": "The user\u2019s predicted SQL mirrors the ground\u2010truth logic (finding today\u2019s drugs not in yesterday\u2019s list) and even uses a NOT IN subquery instead of EXCEPT. The only discrepancy is a duplicate row in the output, indicating a missing or misapplied DISTINCT removal. This is a confined, clause\u2010level issue and does not alter the overall join or filtering logic of the query. Thus it is a local error.",
            "error_type": "Local: missing-distinct error"
        },
        "e7377d5873adc22bdb17fa78": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Count the number of patients who were tested in 2100 for glucose - csf.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'glucose - csf' AND strftime('%Y',lab.labresulttime) = '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) FROM lab WHERE labname = \"glucose - csf\" AND strftime('%Y', labresulttime) = \"2100\";",
            "gold_answer": "[['15.0']]",
            "pred_answer": "[['16.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts distinct patientunitstayid in the lab table, effectively counting unique visits where 'glucose - csf' was tested, rather than counting distinct patients. The ground truth joins through the patient table and counts DISTINCT patient.uniquepid, ensuring each patient is only counted once even if they had multiple unit stays. This mistake changes the fundamental logic of what is being counted (visits vs. patients) and cannot be fixed by a small localized edit\u2014it requires restructuring the query to join the patient table and count patient.uniquepid instead of patientunitstayid.",
            "error_type": "Global: wrong-entity-counting"
        },
        "9aa241d49a094b71909dfa84": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the total continuous infusion meds amount given for patient 011-13921 on the first icu visit?",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '011-13921' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.celllabel = 'continuous infusion meds' AND intakeoutput.cellpath LIKE '%intake%'",
            "pred_sql": "SELECT SUM(CAST(SUBSTR(m.dosage, 1, INSTR(m.dosage, ' ') - 1) AS REAL)) AS total_continuous_infusion_meds_amount FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '011-13921' AND m.routeadmin = 'iv' AND m.drugstarttime >= (SELECT p.unitadmittime FROM patient p WHERE p.uniquepid = '011-13921' ORDER BY p.unitadmittime ASC LIMIT 1) AND m.drugstarttime <= (SELECT p.unitdischargetime FROM patient p WHERE p.uniquepid = '011-13921' ORDER BY p.unitadmittime ASC LIMIT 1);",
            "gold_answer": "[['2254.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the data source and logic: it uses the medication table and parses the dosage field with an IV route filter, whereas the ground truth uses the intakeoutput table with celllabel 'continuous infusion meds' and cellpath LIKE '%intake%' restricted to the first ICU visit. This is not a minor syntax fix but a fundamentally different query structure and table selection, thus a global error.",
            "error_type": "Global: incorrect table usage"
        },
        "b0aec40fac3a41abe889d377": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What is the daily average of patient 005-10384's weight this year?",
            "gold_sql": "SELECT AVG(patient.admissionweight) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '005-10384' ) AND patient.admissionweight IS NOT NULL AND datetime(patient.unitadmittime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY strftime('%Y-%m-%d',patient.unitadmittime)",
            "pred_sql": "SELECT AVG(weight) AS daily_average_weight FROM vitalperiodic JOIN patient ON vitalperiodic.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '005-10384' AND datetime(vitalperiodic.observationtime, 'start of year') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year');",
            "gold_answer": "[['65.5']]",
            "pred_answer": "no such column: weight",
            "is_correct": false,
            "reasoning": "The predicted query references a column \"weight\" in the vitalperiodic table, but no such column exists in that table (it has temperature, sao2, heartrate, etc.). This is a straightforward column reference error and does not require restructuring the query\u2019s logic or joins.",
            "error_type": "Local: column reference error"
        },
        "6d83bd4ff59e92870efdc23a": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What number of hours has passed since patient 015-100025's last procedure on the current hospital visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '015-100025' AND patient.hospitaldischargetime IS NULL ) ) ORDER BY treatment.treatmenttime DESC LIMIT 1",
            "pred_sql": "SELECT ROUND( (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', ( SELECT MAX(treatmenttime) FROM treatment WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '015-100025' AND hospitaldischargetime IS NULL ) )) / 3600 ) AS hours_since_last_procedure ;",
            "gold_answer": "[['15.183']]",
            "pred_answer": "near \"AS\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL has a misplaced AS clause and mismatched parentheses around the ROUND function, leading to a syntax error near \"AS\". This is a localized syntax mistake in the SELECT expression and does not alter the overall logical structure of the query.",
            "error_type": "Local: syntax error"
        },
        "8b41023860c7ee88b1ce0979": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Tell me the minimum total hospital cost that includes hypertension - with renal failure since 1 year ago.",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'hypertension - with renal failure' ) ) AND datetime(cost.chargetime) >= datetime('2100-12-31 23:59:00','-1 year') GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "WITH relevant_patients AS ( SELECT DISTINCT p.patienthealthsystemstayid FROM patient p JOIN diagnosis d1 ON p.patientunitstayid = d1.patientunitstayid JOIN diagnosis d2 ON p.patientunitstayid = d2.patientunitstayid WHERE d1.diagnosisname = 'hypertension' AND d2.diagnosisname = 'renal failure' AND p.hospitaladmittime >= datetime('2100-12-31 23:59:00', '-1 year') ) SELECT MIN(total_cost) AS min_total_cost FROM ( SELECT p.patienthealthsystemstayid, SUM(DISTINCT c.cost) AS total_cost FROM patient p JOIN cost c ON p.patienthealthsystemstayid = c.patienthealthsystemstayid WHERE c.eventtype IN ('diagnosis', 'treatment', 'lab', 'medication') AND p.patienthealthsystemstayid IN (SELECT patienthealthsystemstayid FROM relevant_patients) GROUP BY p.patienthealthsystemstayid );",
            "gold_answer": "[['933.35']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic: it treats 'hypertension - with renal failure' as two separate diagnoses ('hypertension' AND 'renal failure') instead of one combined diagnosis name. It also filters on patient.hospitaladmittime rather than cost.chargetime, restricts to certain event types, and applies DISTINCT to costs, none of which align with the intended summation over all cost records since one year ago for the exact diagnosis. These changes affect multiple clauses and the overall meaning of the query.",
            "error_type": "Global: logical join and filter error"
        },
        "e77454c3e63ce2ee7641860d": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the duration in days of patient 010-10025's first stay in the icu?",
            "gold_sql": "SELECT strftime('%J',patient.unitdischargetime) - strftime('%J',patient.unitadmittime) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '010-10025' ) AND patient.unitadmittime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', unitdischargetime) - strftime('%s', unitadmittime)) / (86400) AS duration_days FROM patient WHERE uniquepid = '010-10025' ORDER BY unitadmittime ASC LIMIT 1;",
            "gold_answer": "[['4.454']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted query correctly identifies the patient\u2019s first ICU stay by ordering on unitadmittime and limiting to one record. The error lies solely in how the duration is calculated: using strftime('%s') and integer division by 86400 yields a truncated result of 4.0 days rather than the precise 4.454 days calculated by the ground truth\u2019s Julian day difference. This is a localized mistake in the temporal calculation, not a structural or logical join issue.",
            "error_type": "Local: other-temporal error"
        },
        "fe732f7c6bbbbe8bc019c631": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What was the last mch result for patient 007-10076 on the first hospital visit?",
            "gold_sql": "SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '007-10076' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND lab.labname = 'mch' ORDER BY lab.labresulttime DESC LIMIT 1",
            "pred_sql": "SELECT (SELECT MAX(labresult) FROM lab WHERE patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '007-10076' ORDER BY hospitaladmittime LIMIT 1) AND labname = 'mch') AS last_mch_result;",
            "gold_answer": "[['30.6']]",
            "pred_answer": "[['28.9']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic for identifying the patient\u2019s first hospital visit and the last \u201cmch\u201d result. Instead of: 1) filtering for a completed (discharged) first hospital visit via hospitaldischargetime IS NOT NULL and 2) ordering lab results by labresulttime, it simply picks the earliest patient.admission record (regardless of discharge) and uses MAX(labresult) (the highest numeric value) rather than the most recent by timestamp. These alterations span multiple clauses (the visit\u2010selection subquery and the aggregation of lab results) and thus require restructuring the overall query, not just a minor tweak within one clause.",
            "error_type": "Global: incorrect visit selection and aggregation logic"
        },
        "6ddde3148b0940760c8a3a29": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "What are the five most commonly received procedures for patients in their 60 or above since 2100?",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age >= 60 ) AND strftime('%Y',treatment.treatmenttime) >= '2100' GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "WITH procedures AS ( SELECT t.treatmentname AS procedure_name FROM treatment t INNER JOIN patient p ON t.patientunitstayid = p.patientunitstayid WHERE CAST(p.age AS INT) >= 60 AND datetime(t.treatmenttime) >= datetime('2100-01-01') UNION SELECT m.drugname AS procedure_name FROM medication m INNER JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE CAST(p.age AS INT) >= 60 AND datetime(m.drugstarttime) >= datetime('2100-01-01') ) SELECT procedure_name, COUNT(DISTINCT patientunitstayid) AS count FROM ( SELECT procedure_name, patientunitstayid FROM procedures ) AS combined GROUP BY procedure_name ORDER BY count DESC LIMIT 5;",
            "gold_answer": "[['antiplatelet agent - aspirin'], ['cardiology consultation'], ['chest x-ray'], ['mechanical ventilation'], ['stress ulcer prophylaxis - pantoprazole']]",
            "pred_answer": "no such column: patientunitstayid",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references patientunitstayid in the outer query, but the CTE \u201cprocedures\u201d only selects procedure_name (no patientunitstayid). This is a column reference error localized to the SELECT/CTE definition and can be fixed by including patientunitstayid in the CTE. It does not affect overall query structure or logic beyond this missing column.",
            "error_type": "Local: column reference error"
        },
        "9fe9bada749eb3c056c66c6a": {
            "db_id": "eicu",
            "generator_name": "deepseek",
            "question": "Show me the total amount of patient 021-101378's output on the first icu visit.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '021-101378' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND intakeoutput.cellpath LIKE '%output%'",
            "pred_sql": "SELECT SUM(io.cellvaluenumeric) AS total_output FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '021-101378' AND io.cellpath LIKE '%output%' AND io.intakeoutputtime >= p.unitadmittime AND io.intakeoutputtime <= p.unitdischargetime ORDER BY p.unitadmittime ASC LIMIT 1;",
            "gold_answer": "[['22735.0']]",
            "pred_answer": "[['3685.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes how the \u201cfirst ICU visit\u201d is identified and how the output records are selected. Instead of isolating exactly one patientunitstayid via a sub\u2010query that filters on unitdischargetime IS NOT NULL and orders by unitadmittime, it simply joins patient to intakeoutput and tries to bound on time conditions. This not only omits the IS NOT NULL filter but also misuses ORDER BY/LIMIT on an aggregated result, altering the intended logic of selecting the first ICU visit. Fixing this would require restructuring the query (correct sub\u2010query or join conditions), not just tweaking a single clause. Hence, it is a global error.",
            "error_type": "Global: incorrect join strategy"
        }
    },
    "o4-mini": {
        "c86225eed349bcb717e7dc8e": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Among patients diagnosed with agitation - moderate, what are the top four most common lab tests that followed within the same hospital visit?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'agitation - moderate' ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime, patient.patienthealthsystemstayid FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.labresulttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH agitation AS ( SELECT p.patienthealthsystemstayid, d.diagnosistime FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosisname = 'agitation - moderate' ) SELECT l.labname, COUNT(*) AS freq FROM lab l JOIN patient p_l ON l.patientunitstayid = p_l.patientunitstayid JOIN agitation a ON p_l.patienthealthsystemstayid = a.patienthealthsystemstayid AND l.labresulttime > a.diagnosistime GROUP BY l.labname ORDER BY freq DESC LIMIT 4;",
            "gold_answer": "[['anion gap'], ['bedside glucose'], ['bicarbonate'], ['bun'], ['calcium'], ['chloride'], ['creatinine'], ['glucose'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose', '133.0'], ['glucose', '47.0'], ['potassium', '70.0'], ['sodium', '40.0']]",
            "is_correct": false,
            "reasoning": "We compare the ground\u2010truth and predicted SQL. Both queries correctly restrict to \"agitation \u2013 moderate\" diagnoses, join on the same hospital visit (patienthealthsystemstayid), filter labs after the diagnosis time, group by labname, and order by count. The predicted SQL\u2019s overall structure and join logic are sound \u2013 the error lies only in the SELECT/ORDER BY/LIMIT clause. The question and assumptions require returning only the lab names (and using DENSE_RANK to include any ties), but the predicted SQL (1) returns an extra COUNT(*) column (freq) and (2) uses LIMIT 4 instead of a dense\u2010rank filter, thus omitting tied items and exposing the counts in the output. These are localized mistakes in the projection and ranking clause, not fundamental joins or logic flaws. Thus the error is Local.",
            "error_type": "Local: SELECT/projection error"
        },
        "dbb80bce2d56d862effb3fb3": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many days has it been since patient 021-10001's hospital admission?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.hospitaladmittime) ) FROM patient WHERE patient.uniquepid = '021-10001' AND patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT CAST(julianday('2100-12-31 23:59:00') - julianday(hospitaladmittime) AS INTEGER) AS days_since_admission FROM patient WHERE uniquepid = '021-10001';",
            "gold_answer": "[['4.513']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the filter patient.hospitaldischargetime IS NULL, so it computes days since the date of any admission rather than the current one. It also casts the difference to an integer, truncating the fractional days. Omitting the discharge-time condition changes the fundamental logic of the query (we no longer restrict to the current admission), which requires restructuring the WHERE clause. This is not a simple syntactic fix but alters the intended semantics across clauses.",
            "error_type": "Global: incorrect WHERE clause"
        },
        "f0a6c28d4198d7d12dff31f3": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many patients underwent a other test?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT microlab.patientunitstayid FROM microlab WHERE microlab.culturesite = 'other' )",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) AS num_patients FROM microlab m JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE m.organism = 'other';",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['21.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the wrong column in the WHERE clause: it filters on m.organism = 'other' instead of microlab.culturesite = 'other'. The join structure and overall logic remain correct, but the column reference is incorrect, leading to the wrong result.",
            "error_type": "Local: column reference error"
        },
        "63354d6c1558c315d8c2e34f": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What is the percentile tsh value of 0.05 among patients of the same age as patient 012-10585 on the current hospital visit?",
            "gold_sql": "SELECT DISTINCT T1.C1 FROM ( SELECT lab.labresult, PERCENT_RANK() OVER ( ORDER BY lab.labresult ) AS C1 FROM lab WHERE lab.labname = 'tsh' AND lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age = ( SELECT patient.age FROM patient WHERE patient.uniquepid = '012-10585' AND patient.hospitaldischargetime IS NULL ) ) ) AS T1 WHERE T1.labresult = 0.05",
            "pred_sql": "SELECT SUM(CASE WHEN lab.labresult <= 0.05 THEN 1 ELSE 0 END) * 1.0 / COUNT(*) AS percentile FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE lab.labname = 'tsh' AND patient.hospitaldischargetime IS NULL AND patient.age = ( SELECT age FROM patient WHERE uniquepid = '012-10585' AND hospitaldischargetime IS NULL );",
            "gold_answer": "[['0.111']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a SUM/COUNT approach to compute the percentile (cumulative distribution) instead of the PERCENT_RANK() window function as specified. This error is confined to the SELECT clause\u2019s percentile calculation logic and does not involve incorrect table references, joins, or overall query structure. Therefore, it\u2019s a local error in how the percentile is computed.",
            "error_type": "Local: percentile calculation error"
        },
        "bb0088a72f4862ae157b5887": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Can you provide me the daily minimum amount of intake, iv amount that patient 033-10289 received since 06/02/2100?",
            "gold_sql": "SELECT MIN(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '033-10289' ) ) AND intakeoutput.celllabel = 'intake, iv amount' AND intakeoutput.cellpath LIKE '%intake%' AND strftime('%Y-%m-%d',intakeoutput.intakeoutputtime) >= '2100-06-02' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT date(io.intakeoutputtime) AS day, MIN(io.cellvaluenumeric) AS min_iv_intake FROM intakeoutput io JOIN patient p ON io.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '033-10289' AND io.cellpath LIKE '%intake%' AND io.cellpath LIKE '%i.v.%' AND date(io.intakeoutputtime) >= '2100-06-02' GROUP BY date(io.intakeoutputtime) ORDER BY day;",
            "gold_answer": "[['453.0'], ['495.0'], ['671.0'], ['715.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses io.cellpath LIKE '%i.v.%' instead of filtering on celllabel = 'intake, iv amount'. This is a localized mistake in the WHERE clause pattern matching and does not alter the overall query structure or joins. The patient join is acceptable, but the incorrect condition on cellpath leads to no rows being returned.",
            "error_type": "Local: incorrect WHERE clause value pattern"
        },
        "9dc2faa762a87d534e0d1c11": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many days have elapsed since patient 012-10585 received his or her first antibacterials on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-10585' AND patient.hospitaldischargetime IS NULL ) ) AND treatment.treatmentname = 'antibacterials' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT CAST( julianday('2100-12-31 23:59:00') - julianday(MIN(m.drugstarttime)) AS INTEGER) AS days_elapsed FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '012-10585' AND p.hospitaldischargetime IS NULL AND ( LOWER(m.drugname) LIKE '%cillin%' OR LOWER(m.drugname) LIKE '%mycin%' OR LOWER(m.drugname) LIKE '%cef%' OR LOWER(m.drugname) LIKE '%floxacin%' OR LOWER(m.drugname) LIKE '%sulfa%' );",
            "gold_answer": "[['4.057']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted query sources the first antibacterial event from the medication table (using drugname patterns and drugstarttime) instead of the treatment table with treatmentname='antibacterials' as required by the question and ground truth. This mistake affects the overall logic and data source of the query, not just a minor syntax or column reference error. It changes which events are counted and how the patient\u2019s current hospital visit is identified, thus altering the intended meaning of the query. Consequently, this is a global error in the query structure and logic.",
            "error_type": "Global: incorrect table selection"
        },
        "746f97e945c295d0b4e02ffd": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the four most usual lab tests for patients in their 20s this year?",
            "gold_sql": "SELECT T1.labname FROM ( SELECT lab.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 20 AND 29 ) AND datetime(lab.labresulttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY lab.labname ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT lab.labname FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 20 AND 29 AND strftime('%Y', lab.labresulttime) = '2100' GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 4;",
            "gold_answer": "[['bedside glucose'], ['chloride'], ['creatinine'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose'], ['chloride'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted query uses ORDER BY COUNT(*) DESC LIMIT 4 instead of applying a DENSE_RANK filter to include ties at the 4th rank. This mistake is confined to the ranking/selection logic within the ORDER/GROUP BY clause and does not alter the tables joined or the overall structure of the query. Therefore it is a localized error in how the top-four labs are chosen, not a flaw in the global query logic.",
            "error_type": "Local: ranking error"
        },
        "e989ad2c573c923a5fa15813": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Since the first diagnosis of patient 027-105098 with sepsis - severe on the current hospital visit, how many days have passed?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) ) FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-105098' AND patient.hospitaldischargetime IS NULL ) ) AND diagnosis.diagnosisname = 'sepsis - severe' ORDER BY diagnosis.diagnosistime ASC LIMIT 1",
            "pred_sql": "SELECT CAST(julianday('2100-12-31 23:59:00') - julianday(MIN(d.diagnosistime)) AS INTEGER) AS days_passed FROM patient p JOIN diagnosis d ON p.patientunitstayid = d.patientunitstayid WHERE p.uniquepid = '027-105098' AND p.hospitaldischargetime IS NULL AND d.diagnosisname = 'sepsis - severe';",
            "gold_answer": "[['17.529']]",
            "pred_answer": "[['17.0']]",
            "is_correct": false,
            "reasoning": "The predicted query correctly identifies the first diagnosis on the current hospital visit and computes the day difference, so the overall structure and joins are sound. The discrepancy comes from casting the result to an INTEGER (truncating the fractional days) instead of preserving the decimal precision (and rounding to three decimals) as the ground truth does. This is a localized issue in the SELECT expression and output formatting, not a flaw in the join logic or overall query structure.",
            "error_type": "Local: value parsing/truncation error"
        },
        "2760d8fb8525ac6cc81c7d8e": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Tell me the lab test that was first given to patient 030-11183 since 06/2100?",
            "gold_sql": "SELECT lab.labname FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '030-11183' ) ) AND strftime('%Y-%m',lab.labresulttime) >= '2100-06' ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "WITH filtered_labs AS ( SELECT lab.labname, lab.labresulttime FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '030-11183' AND datetime(lab.labresulttime) >= datetime('2100-06-01','start of month') ), first_time AS ( SELECT MIN(labresulttime) AS ft FROM filtered_labs ) SELECT DISTINCT labname FROM filtered_labs WHERE labresulttime = (SELECT ft FROM first_time);",
            "gold_answer": "[['-lymphs']]",
            "pred_answer": "[['-bands'], ['-lymphs'], ['-monos'], ['-polys'], ['hct'], ['hgb'], ['mch'], ['mchc'], ['mcv'], ['platelets x 1000'], ['rbc'], ['rdw'], ['wbc x 1000']]",
            "is_correct": false,
            "reasoning": "The predicted query correctly filters lab records for the given patient since June 2100 and finds the earliest timestamp. However, instead of returning exactly one lab test (LIMIT 1), it returns all lab names recorded at that earliest time by using DISTINCT without a LIMIT. The mistake is localized to the final projection/selection logic; the overall query structure and joins are correct.",
            "error_type": "Local: projection error"
        },
        "aafda5799cef4cdbb1a8c0e0": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What's the count of current patients?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL",
            "pred_sql": "SELECT COUNT(*) AS current_patient_count FROM patient WHERE hospitaldischargetime IS NULL;",
            "gold_answer": "[['23.0']]",
            "pred_answer": "[['30.0']]",
            "is_correct": false,
            "reasoning": "The predicted query only counts rows (COUNT(*)) instead of counting unique patients (COUNT(DISTINCT patient.uniquepid)), thereby overcounting patients with multiple stays. This is a mistake in the SELECT aggregation clause (missing DISTINCT), and it doesn\u2019t require restructuring joins or filters\u2014just adding DISTINCT. Hence, it\u2019s a localized error.",
            "error_type": "Local: missing-distinct aggregation error"
        },
        "0ab92f68e27dbc8a5e3a463a": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Show me patient 027-104050's daily maximum weight since 10 months ago.",
            "gold_sql": "SELECT MAX(patient.admissionweight) FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-104050' ) AND patient.admissionweight IS NOT NULL AND datetime(patient.unitadmittime) >= datetime('2100-12-31 23:59:00','-10 month') GROUP BY strftime('%Y-%m-%d',patient.unitadmittime)",
            "pred_sql": "WITH weight_events AS ( SELECT date(hospitaladmittime) AS obs_date, admissionweight AS weight FROM patient WHERE uniquepid = '027-104050' AND hospitaladmittime >= datetime('2100-12-31 23:59:00', '-10 months') AND admissionweight IS NOT NULL UNION ALL SELECT date(hospitaldischargetime) AS obs_date, dischargeweight AS weight FROM patient WHERE uniquepid = '027-104050' AND hospitaldischargetime >= datetime('2100-12-31 23:59:00', '-10 months') AND dischargeweight IS NOT NULL ) SELECT obs_date, MAX(weight) AS daily_max_weight FROM weight_events GROUP BY obs_date ORDER BY obs_date;",
            "gold_answer": "[['61.9'], ['61.9'], ['63.95']]",
            "pred_answer": "[['2100-09-04', '63.95']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic of the original request. Instead of using only admission weights and grouping by the ICU admission time (unitadmittime) as in the ground truth, it introduces a UNION ALL with discharge weights, uses hospital admission/discharge times, and applies an incorrect time offset syntax (\u2018-10 months\u2019 rather than \u2018-10 month\u2019). These changes alter the intended meaning of the query and require a full restructuring rather than a simple fix in one clause.",
            "error_type": "Global: structural error"
        },
        "c05dacc0e794b065b0057789": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Among patients who received cardiac angiography , what are the top three most frequent medications that followed within the same month?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'cardiac angiography' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.drugstarttime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT med.drugname FROM treatment AS angio JOIN medication AS med ON angio.patientunitstayid = med.patientunitstayid WHERE angio.treatmentname LIKE '%cardiac angiography%' AND med.drugstarttime > angio.treatmenttime AND strftime('%Y-%m', med.drugstarttime) = strftime('%Y-%m', angio.treatmenttime) GROUP BY med.drugname ORDER BY COUNT(*) DESC LIMIT 3;",
            "gold_answer": "[['furosemide 10mg/ml sso'], ['potassium chloride'], ['potassium chloride tab cr'], ['sodium chloride 0.9%  sso']]",
            "pred_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['potassium chloride'], ['sodium chloride 0.9%  sso']]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly references existing tables and columns and uses valid SQLite functions, so there is no localized syntax or parsing issue. However, it alters the intended logic by joining and grouping on patientunitstayid rather than uniquepid. The ground truth query tracks unique patients across potentially multiple stays (using uniquepid), whereas the prediction counts per unit stay. This changes how frequencies are aggregated and thus the top\u20103 results differ. Fixing this requires changing the join key and aggregation logic\u2014i.e., restructuring the query\u2019s core logic\u2014so it is a global error.",
            "error_type": "Global: join-key error"
        },
        "fc3fa0924d7ccd7d27a6951a": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many patients this year were diagnosed with hypoglycemia within 2 months after the diagnosis of acute respiratory failure?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory failure' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypoglycemia' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.diagnosistime < T2.diagnosistime AND datetime(T2.diagnosistime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT COUNT(DISTINCT d1.patientunitstayid) AS patient_count FROM diagnosis d1 JOIN diagnosis d2 ON d1.patientunitstayid = d2.patientunitstayid AND d2.diagnosisname = 'hypoglycemia' AND datetime(d2.diagnosistime) BETWEEN datetime(d1.diagnosistime) AND datetime(d1.diagnosistime, '+2 months') WHERE d1.diagnosisname = 'acute respiratory failure' AND strftime('%Y', d1.diagnosistime) = '2100';",
            "gold_answer": "[['151.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL not only uses a different join key (patientunitstayid instead of uniquepid) but also fails to apply the same year filter to the hypoglycemia diagnosis. These mistakes change the overall logic\u2014linking events by stay rather than by patient and mis-filtering dates\u2014resulting in a fundamentally different result. This error spans multiple clauses (JOIN and WHERE) and requires restructuring the query rather than a simple fix in one clause.",
            "error_type": "Global: incorrect join key and filter logic"
        },
        "890c4c363cef0eeb6026ba30": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many patients were treated with carotid endarterectomy this year?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'carotid endarterectomy' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) AS num_patients FROM treatment t JOIN patient p ON t.patientunitstayid = p.patientunitstayid WHERE t.treatmentname LIKE '%carotid endarterectomy%' AND strftime('%Y', t.treatmenttime) = '2100';",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['6.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only errs in the WHERE clause by using a broad LIKE '%carotid endarterectomy%' match instead of the exact treatmentname = 'carotid endarterectomy'. This localized mistake overcounts patients without changing the query\u2019s overall structure or join logic. Hence it\u2019s a local error in the filtering condition.",
            "error_type": "Local: incorrect filter condition"
        },
        "78089756da598e878d999d58": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Which are the top three most frequent procedures patients had within the same hospital visit after being diagnosed with syncope?",
            "gold_sql": "SELECT T3.treatmentname FROM ( SELECT T2.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'syncope' ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmentname, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.treatmentname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "WITH syncope_diag AS ( SELECT p.patienthealthsystemstayid, MIN(d.diagnosistime) AS first_syncope_time FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosisname = 'syncope' GROUP BY p.patienthealthsystemstayid ) SELECT t.treatmentname FROM syncope_diag s JOIN patient p2 ON p2.patienthealthsystemstayid = s.patienthealthsystemstayid JOIN treatment t ON t.patientunitstayid = p2.patientunitstayid WHERE t.treatmenttime > s.first_syncope_time GROUP BY t.treatmentname ORDER BY COUNT(*) DESC LIMIT 3;",
            "gold_answer": "[['analgesics - narcotic analgesic'], ['antiemetic'], ['antihyperlipidemic agent - hmg-coa reductase inhibitor'], ['electrolyte administration'], ['foley catheter'], ['insulin'], ['oxygen therapy (< 40%)'], ['vte prophylaxis - compression boots']]",
            "pred_answer": "[['analgesics - narcotic analgesic'], ['oxygen therapy (< 40%)'], ['vte prophylaxis - compression boots']]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly identifies the first syncope time per hospital visit and joins treatments after that time. The only deviation is in the final selection of top procedures: it uses ORDER BY COUNT(*) DESC LIMIT 3, which drops procedures tied for third place, instead of using DENSE_RANK() to include all ties as specified in the ground truth. This mistake is confined to the LIMIT/selection logic and does not alter the overall query structure or joins.",
            "error_type": "Local: incorrect top-N implementation"
        },
        "b260d9b209ffbd72ff0df60d": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Since 1 year ago, what are the top four most frequently given diagnoses that patients received within the same month after being diagnosed with hypothyroidism?",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'hypothyroidism' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.diagnosistime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.diagnosistime,'start of month') GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT d.diagnosisname, COUNT(*) AS frequency FROM diagnosis d JOIN diagnosis h ON d.patientunitstayid = h.patientunitstayid AND h.diagnosisname = 'hypothyroidism' AND h.diagnosistime >= datetime('2100-12-31 23:59:00','-1 year') AND d.diagnosisid <> h.diagnosisid AND d.diagnosistime BETWEEN h.diagnosistime AND datetime(h.diagnosistime, '+1 month') WHERE d.diagnosisname <> 'hypothyroidism' GROUP BY d.diagnosisname ORDER BY frequency DESC LIMIT 4;",
            "gold_answer": "[['acute respiratory failure'], ['diabetes mellitus'], ['hypothyroidism'], ['metabolic acidosis']]",
            "pred_answer": "[['acute respiratory failure', '643.0'], ['diabetes mellitus', '646.0'], ['hypoxemia', '628.0'], ['metabolic acidosis', '633.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the core logic of the question in two ways: 1) it uses a BETWEEN h.diagnosistime AND datetime(h.diagnosistime, '+1 month') filter rather than matching diagnoses in the same calendar month (start of month equality), and 2) it explicitly excludes 'hypothyroidism' from the results, whereas the ground truth includes it if it recurs. These are not mere syntax or localized fixes but alter the intended time-window semantics and result set. Thus this requires restructuring the filtering logic, making it a global error.",
            "error_type": "Global: incorrect join/time-filter logic"
        },
        "c3c11e1cbbde15b360b8218e": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What is the number of patients who died after diagnosis of acute pulmonary edema within the same month since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT T2.uniquepid ) FROM ( SELECT T1.uniquepid, T1.diagnosistime FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute pulmonary edema' ) AS T1 GROUP BY T1.uniquepid HAVING MIN(T1.diagnosistime) = T1.diagnosistime AND strftime('%Y',T1.diagnosistime) >= '2100' ) AS T2 JOIN ( SELECT patient.uniquepid, patient.patienthealthsystemstayid, patient.hospitaldischargetime FROM patient WHERE patient.hospitaldischargestatus = 'expired' ) as T3 ON T2.uniquepid = T3.uniquepid AND datetime(T2.diagnosistime,'start of month') = datetime(T3.hospitaldischargetime,'start of month')",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) AS num_patients FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosisname = 'acute pulmonary edema' AND d.diagnosistime >= '2100-01-01' AND p.hospitaldischargestatus = 'expired' AND datetime(p.hospitaldischargetime) > datetime(d.diagnosistime) AND strftime('%Y-%m', d.diagnosistime) = strftime('%Y-%m', p.hospitaldischargetime');",
            "gold_answer": "[['3.0']]",
            "pred_answer": "unrecognized token: \"');\"",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to parse due to an extra/mismatched quote and parenthesis in the WHERE clause (unrecognized token \"');\"). This is a localized syntax issue that can be fixed without changing the overall logic or join structure.",
            "error_type": "Local: syntax error"
        },
        "8c3bf289979d474499b2aa49": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many days have elapsed since patient 025-1000 stayed in ward 908 for the first time on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',patient.unitadmittime) ) FROM patient WHERE patient.uniquepid = '025-1000' AND patient.wardid = 908 AND patient.hospitaldischargetime IS NULL ORDER BY patient.unitadmittime ASC LIMIT 1",
            "pred_sql": "WITH current_hospital AS ( SELECT patienthealthsystemstayid FROM patient WHERE uniquepid = '025-1000' AND hospitaldischargetime IS NULL LIMIT 1 ), first_ward AS ( SELECT MIN(unitadmittime) AS first_time FROM patient WHERE patienthealthsystemstayid = (SELECT patienthealthsystemstayid FROM current_hospital) AND wardid = 908 ) SELECT CAST(julianday('2100-12-31 23:59:00') - julianday(first_time) AS INTEGER) AS days_elapsed FROM first_ward;",
            "gold_answer": "[['9.574']]",
            "pred_answer": "[['9.0']]",
            "is_correct": false,
            "reasoning": "The only difference between the two queries lies in how they compute the day difference. The ground truth uses strftime('%J',\u2026) to get the Julian day number (including fractional days), yielding a precise value (9.574). The predicted SQL uses julianday(\u2026) and then CASTs the result to INTEGER, truncating it to 9.0 and losing the fractional component. All other logic (filtering on current visit, selecting the first ward admission) is correct. This is a localized mistake in the date-difference calculation, not a flaw in the overall query structure.",
            "error_type": "Local: other-temporal error"
        },
        "f605d9fb2fedb46a1785bdd7": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What is the average total hospital cost that includes a procedure named folate in 2100?",
            "gold_sql": "SELECT AVG(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'folate' ) ) AND strftime('%Y',cost.chargetime) = '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "WITH folate_stays AS ( SELECT DISTINCT p.patienthealthsystemstayid FROM lab l JOIN patient p ON l.patientunitstayid = p.patientunitstayid WHERE l.labname LIKE '%folate%' AND strftime('%Y', l.labresulttime) = '2100' ), stay_costs AS ( SELECT c.patienthealthsystemstayid, SUM(c.cost) AS total_cost FROM cost c WHERE c.patienthealthsystemstayid IN (SELECT patienthealthsystemstayid FROM folate_stays) GROUP BY c.patienthealthsystemstayid ) SELECT AVG(total_cost) AS average_total_hospital_cost FROM stay_costs;",
            "gold_answer": "[['7410.78']]",
            "pred_answer": "[['4516.97']]",
            "is_correct": false,
            "reasoning": "The predicted query identifies stays by looking for lab records with labname LIKE '%folate%' in the lab table, whereas the question refers to a procedure named folate, which is stored in the treatment table. This error affects the overall logic of how relevant patient stays are selected and requires restructuring the query to use the treatment table instead of lab. Thus it is not a localized syntax mistake but a fundamental logical error in table usage and joins.",
            "error_type": "Global: join/table selection error"
        },
        "cb3541829199c9ac184de2b0": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Find out how many patients were admitted to the hospital.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient",
            "pred_sql": "SELECT COUNT(DISTINCT patienthealthsystemstayid) AS num_hospital_admissions FROM patient WHERE hospitaladmittime IS NOT NULL;",
            "gold_answer": "[['1384.0']]",
            "pred_answer": "[['1542.0']]",
            "is_correct": false,
            "reasoning": "The predicted query counts distinct patienthealthsystemstayid (hospital admissions) rather than distinct uniquepid (patients), fundamentally altering the metric and misinterpreting the question. This is not a simple syntax or reference fix but a change in the core logic/aggregation of the query.",
            "error_type": "Global: incorrect aggregation column"
        },
        "1b72b914302d1dce0efd4293": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Find the number of current patients in the 60 or above age group.",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.hospitaldischargetime IS NULL AND patient.age >= 60",
            "pred_sql": "SELECT COUNT(*) AS num_current_patients_60_plus FROM patient WHERE hospitaldischargetime IS NULL AND age >= 60;",
            "gold_answer": "[['14.0']]",
            "pred_answer": "[['20.0']]",
            "is_correct": false,
            "reasoning": "The predicted query counts all rows (COUNT(*)) rather than counting distinct patients. According to the assumptions, when counting patients you must use COUNT(DISTINCT patient.uniquepid). This is a localized mistake in the SELECT clause aggregate and does not alter the overall query structure or logic beyond missing the DISTINCT keyword.",
            "error_type": "Local: missing DISTINCT"
        },
        "3ad2a55fd673d7cc2caa8aca": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What is the 6-month survival rate of patients who received 1 ml vial : diphenhydramine hcl 50 mg/ml ij soln treatment following a s/p embolectomy diagnosis?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 2 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 's/p embolectomy' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 2 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = '1 ml vial : diphenhydramine hcl 50 mg/ml ij soln' GROUP BY patient.uniquepid HAVING MAX(medication.drugstarttime) = medication.drugstarttime ) AS T2 ON T1.uniquepid = T2.uniquepid JOIN patient ON T1.uniquepid = patient.uniquepid WHERE T1.diagnosistime < T2.drugstarttime GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "WITH first_embo AS ( SELECT patientunitstayid, MIN(diagnosistime) AS first_diag_time FROM diagnosis WHERE diagnosisname = 's/p embolectomy' GROUP BY patientunitstayid ), med_after_embo AS ( SELECT DISTINCT e.patientunitstayid, e.first_diag_time FROM first_embo e JOIN medication m ON m.patientunitstayid = e.patientunitstayid AND m.drugname = '1 ml - diphenhydramine hcl 50 mg/ml ij soln' AND m.drugstarttime >= e.first_diag_time ), survival_calc AS ( SELECT m.patientunitstayid, p.hospitaldischargetime, p.hospitaldischargestatus, m.first_diag_time, CASE WHEN p.hospitaldischargestatus = 'expired' AND datetime(p.hospitaldischargetime) <= datetime(m.first_diag_time, '+183 days') THEN 0 ELSE 1 END AS survived FROM med_after_embo m JOIN patient p ON p.patientunitstayid = m.patientunitstayid ) SELECT AVG(survived) AS six_month_survival_rate FROM survival_calc;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to match any medication records because the drug name literal in the WHERE clause is incorrect ('1 ml - diphenhydramine...' instead of '1 ml vial : diphenhydramine...'), leading to no rows in the CTE and ultimately NULL for the average. This is a localized mistake in the WHERE condition\u2019s string literal and can be corrected without changing the overall query structure or logic.",
            "error_type": "Local: value parsing error"
        },
        "3162159f1b6f94c9ef55cdaf": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Among the patients who are prescribed mag/alum hydroxide w/simeth, what are the five most frequently prescribed drugs at the same time since 2100?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'mag/alum hydroxide w/simeth' AND strftime('%Y',medication.drugstarttime) >= '2100' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid AND strftime('%Y',medication.drugstarttime) >= '2100' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT med2.drugname FROM medication AS med1 JOIN medication AS med2 ON med1.patientunitstayid = med2.patientunitstayid AND med1.drugname = 'mag/alum hydroxide w/simeth' AND med2.drugname <> 'mag/alum hydroxide w/simeth' AND med1.drugstarttime >= '2100-01-01 00:00:00' AND med2.drugstarttime >= '2100-01-01 00:00:00' AND med1.drugstarttime <= med2.drugstoptime AND med2.drugstarttime <= med1.drugstoptime GROUP BY med2.drugname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['hydralazine'], ['mag/alum hydroxide w/simeth'], ['morphine'], ['ondansetron (pf)'], ['oxycodone']]",
            "pred_answer": "[['amiodarone'], ['morphine'], ['oxycodone'], ['pantoprazole'], ['potassium chloride']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic of how \u201cat the same time\u201d is determined. Instead of matching exact drugstarttime timestamps between mag/alum hydroxide w/simeth prescriptions and other drugs (as in the ground truth), it uses an interval overlap condition (med1.drugstarttime <= med2.drugstoptime AND med2.drugstarttime <= med1.drugstoptime). This alters the join relationship and thus the intended meaning of \u201cat the same time.\u201d Fixing this requires rewriting the join condition, not just correcting a column or alias, so it is a global error in join strategy.",
            "error_type": "Global: join strategy error"
        },
        "cbe78f4e084965ff31d7fb0b": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many hours have gone by since the first instance patient 033-10044 had a intake, oral amount input on the current icu visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',intakeoutput.intakeoutputtime) ) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '033-10044' ) AND patient.unitdischargetime IS NULL ) AND intakeoutput.celllabel = 'intake, oral amount' AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', (SELECT MIN(io.intakeoutputtime) FROM intakeoutput io JOIN patient p ON io.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '033-10044' AND p.unitdischargetime IS NULL AND io.cellpath LIKE '%intake%' AND io.celllabel = 'p.o.' ) )) / 3600.0 AS hours_since;",
            "gold_answer": "[['16.483']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses the wrong celllabel value ('p.o.') instead of the correct 'intake, oral amount'. This is a localized mistake in the WHERE clause literal, causing no rows to match. The overall query structure\u2014joining intakeoutput to patient, filtering for current ICU stay, selecting the minimum time, and computing the hour difference\u2014is otherwise correct according to the question. Hence, this is a local error confined to a specific value mismatch in the query.",
            "error_type": "Local: value parsing error"
        },
        "26cc7b020c66234c64fc04de": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "Since 2100, how many patients died after having been diagnosed with mouth and jaw tumor - oral cavity squamous cell ca within the same month?",
            "gold_sql": "SELECT COUNT( DISTINCT T2.uniquepid ) FROM ( SELECT T1.uniquepid, T1.diagnosistime FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'mouth and jaw tumor - oral cavity squamous cell ca' ) AS T1 GROUP BY T1.uniquepid HAVING MIN(T1.diagnosistime) = T1.diagnosistime AND strftime('%Y',T1.diagnosistime) >= '2100' ) AS T2 JOIN ( SELECT patient.uniquepid, patient.patienthealthsystemstayid, patient.hospitaldischargetime FROM patient WHERE patient.hospitaldischargestatus = 'expired' ) as T3 ON T2.uniquepid = T3.uniquepid AND datetime(T2.diagnosistime,'start of month') = datetime(T3.hospitaldischargetime,'start of month')",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) AS num_patients FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosistime >= '2100-01-01' AND d.diagnosisname = 'mouth and jaw tumor - oral cavity squamous cell ca' AND p.hospitaldischargestatus = 'expired' AND p.hospitaldischargetime > d.diagnosistime AND strftime('%Y-%m', d.diagnosistime) = strftime('%Y-%m', p.hospitaldischargetime');",
            "gold_answer": "[['1.0']]",
            "pred_answer": "unrecognized token: \"');\"",
            "is_correct": false,
            "reasoning": "The failure \u201cunrecognized token: \"');\"\u201d indicates a small syntax mistake (an extra or misplaced quote/parenthesis) in the predicted SQL\u2019s WHERE clause, specifically around the strftime call. The underlying logic (joining diagnosis to patient, filtering by date, expired status, same month) is intact; only a local syntax/parsing error prevents execution. Therefore this is a Local error.",
            "error_type": "Local: syntax error"
        },
        "c408e0d5803d34c692a5b804": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the five most frequent lab tests that patients had within 2 months after receiving therapeutic antibacterials - empiric antibacterial coverage?",
            "gold_sql": "SELECT T3.labname FROM ( SELECT T2.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'therapeutic antibacterials - empiric antibacterial coverage' ) AS T1 JOIN ( SELECT patient.uniquepid, lab.labname, lab.labresulttime FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.labresulttime AND datetime(T2.labresulttime) BETWEEN datetime(T1.treatmenttime) AND datetime(T1.treatmenttime,'+2 month') GROUP BY T2.labname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT lab.labname, COUNT(*) AS frequency FROM treatment JOIN lab ON treatment.patientunitstayid = lab.patientunitstayid AND datetime(lab.labresulttime) > datetime(treatment.treatmenttime) AND datetime(lab.labresulttime) <= datetime(treatment.treatmenttime, '+2 months') WHERE treatment.treatmentname = 'therapeutic antibacterials - empiric antibacterial coverage' GROUP BY lab.labname ORDER BY frequency DESC LIMIT 5;",
            "gold_answer": "[['bedside glucose'], ['bicarbonate'], ['bun'], ['calcium'], ['chloride'], ['creatinine'], ['glucose'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose', '374.0'], ['creatinine', '113.0'], ['glucose', '113.0'], ['potassium', '128.0'], ['sodium', '113.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly filters for the treatment name, joins lab records, and applies the two-month time window. However, it returns both the lab name and its frequency count, whereas the question (and the assumptions) require only the lab names for the top five tests, excluding their counts. This is a confined issue in the SELECT clause that doesn\u2019t alter the overall logic of the query.",
            "error_type": "Local: wrong select columns"
        },
        "4f6b31be61ebcdb2cc215e06": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the top four most frequent medications prescribed within 2 months to patients in their 30s after they are diagnosed with pre-eclampsia/ eclampsia?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'pre-eclampsia/ eclampsia' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 30 AND 39 ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH first_diag AS ( SELECT patientunitstayid, MIN(diagnosistime) AS diag_time FROM diagnosis WHERE LOWER(diagnosisname) LIKE '%pre-eclampsia%' OR LOWER(diagnosisname) LIKE '%eclampsia%' GROUP BY patientunitstayid ) SELECT m.drugname FROM first_diag fd JOIN patient p ON p.patientunitstayid = fd.patientunitstayid JOIN medication m ON m.patientunitstayid = fd.patientunitstayid WHERE p.age BETWEEN 30 AND 39 AND m.drugstarttime >= fd.diag_time AND m.drugstarttime <= DATETIME(fd.diag_time, '+2 months') GROUP BY m.drugname ORDER BY COUNT(*) DESC LIMIT 4;",
            "gold_answer": "[['1000 ml : lactated ringers iv soln'], ['alprazolam 0.5 mg po tabs'], ['diphenhydramine hcl 25 mg po caps'], ['diphenhydramine hcl 50 mg/ml ij soln'], ['metoclopramide hcl 5 mg/ml ij soln'], ['naloxone hcl 0.4 mg/ml ij soln'], ['ondansetron hcl 4 mg po tabs'], ['ondansetron hcl 4 mg/2ml ij soln'], ['oxycodone-acetaminophen 5-325 mg po tabs'], ['sennosides-docusate sodium 8.6-50 mg po tabs'], ['sodium chloride 0.9 % ij soln'], ['zolpidem tartrate 5 mg po tabs']]",
            "pred_answer": "[['diphenhydramine hcl 25 mg po caps'], ['diphenhydramine hcl 50 mg/ml ij soln'], ['ondansetron hcl 4 mg/2ml ij soln'], ['sennosides-docusate sodium 8.6-50 mg po tabs']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes how the top medications are selected: it uses LIMIT 4 rather than a DENSE_RANK() window to include ties, and it groups by patientunitstayid rather than uniquepid. These are not simple syntax fixes but alter the overall logic and result set. Therefore, this is a structural, global error in the query\u2019s ranking and grouping logic.",
            "error_type": "Global: incorrect ranking logic"
        },
        "fd64d6670cf4d3da09d342f3": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many times did patient 004-1262 have clonidine?",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-1262' ) ) AND treatment.treatmentname = 'clonidine'",
            "pred_sql": "SELECT COUNT(*) AS clonidine_count FROM medication m JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '004-1262' AND m.drugname LIKE '%clonidine%';",
            "gold_answer": "[['5.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and joins on patientuniquepid, but the intent is to count treatment events (treatment table) for clonidine. This is not a simple column or syntax mistake\u2014it fundamentally changes the query logic by querying the wrong table and association. Fixing it would require rewriting the entire FROM/JOIN clause to use the treatment table instead of medication, so it is a global error.",
            "error_type": "Global: incorrect join"
        },
        "d202e3cc28a5d8b7e342ebe9": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the five most frequent procedures for patients who are in their 30s?",
            "gold_sql": "SELECT T1.treatmentname FROM ( SELECT treatment.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 30 AND 39 ) GROUP BY treatment.treatmentname ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT t.treatmentname FROM treatment t JOIN patient p ON t.patientunitstayid = p.patientunitstayid WHERE CAST(p.age AS INTEGER) BETWEEN 30 AND 39 GROUP BY t.treatmentname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['antiemetic - serotonin antagonist'], ['chest x-ray'], ['cultures - blood'], ['mechanical ventilation'], ['normal saline administration'], ['stress ulcer prophylaxis - pantoprazole']]",
            "pred_answer": "[['antiemetic - serotonin antagonist'], ['cultures - blood'], ['mechanical ventilation'], ['normal saline administration'], ['stress ulcer prophylaxis - pantoprazole']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a simple ORDER BY ... LIMIT 5 approach instead of the required DENSE_RANK() method to handle ties properly. This is a mistake in the ranking logic within the ORDER BY/LIMIT clause\u2014it does not involve join conditions, table references, or the overall structure of the query. It's a localized error in how the top N results are selected.",
            "error_type": "Local: ranking error"
        },
        "3ae1a558a87d4de503e658ec": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many patients were treated with antidepressant - amitriptyline two times since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, COUNT(*) AS C1 FROM patient WHERE patient.patientunitstayid = ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'antidepressant - amitriptyline' AND strftime('%Y',treatment.treatmenttime) >= '2100' ) GROUP BY patient.uniquepid ) AS T1 WHERE T1.C1 = 2",
            "pred_sql": "SELECT COUNT(*) FROM ( SELECT p.uniquepid FROM patient p JOIN treatment t ON p.patientunitstayid = t.patientunitstayid WHERE t.treatmentname = 'antidepressant - amitriptyline' AND t.treatmenttime >= '2100-01-01' GROUP BY p.uniquepid HAVING COUNT(*) >= 2 ) AS sub;",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in the HAVING clause: it uses COUNT(*) >= 2 to include patients treated two or more times, whereas the ground truth requires exactly two treatments (COUNT = 2). This is a localized mistake within the HAVING clause and does not affect the overall query structure or table relationships.",
            "error_type": "Local: having-clause error"
        },
        "3a9accf430c593518ab84181": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "How many days have passed since the last time patient 027-100843 was given nimodipine on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100843' AND patient.hospitaldischargetime IS NULL ) ) AND treatment.treatmentname = 'nimodipine' ORDER BY treatment.treatmenttime DESC LIMIT 1",
            "pred_sql": "SELECT CAST( julianday('2100-12-31 23:59:00') - julianday(MAX(m.drugstarttime)) AS INTEGER) AS days_since_last_nimodipine FROM medication m JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE p.patienthealthsystemstayid = ( SELECT patienthealthsystemstayid FROM patient WHERE uniquepid = '027-100843' AND hospitaldischargetime IS NULL LIMIT 1 ) AND m.drugname = 'nimodipine';",
            "gold_answer": "[['6.125']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query uses the medication table and drugstarttime instead of the treatment table and treatmenttime specified in the ground truth. This is not a simple typo or syntax mistake\u2014it changes the data source and the join logic, fundamentally altering how the patient\u2019s nimodipine event is retrieved. As a result, it fails to capture the correct event from the treatment table for the current hospital visit.",
            "error_type": "Global: incorrect table/join"
        },
        "cb7daad13bef3b54aa70357d": {
            "db_id": "eicu",
            "generator_name": "o4-mini",
            "question": "What are the top five most frequent medications prescribed within the same month to the patients in their 20s after they are diagnosed with stroke - ischemic stroke?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'stroke - ischemic stroke' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 20 AND 29 ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T1.diagnosistime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT m.drugname FROM patient p JOIN diagnosis d ON p.patientunitstayid = d.patientunitstayid JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.age BETWEEN 20 AND 29 AND d.diagnosisname = 'stroke - ischemic stroke' AND m.drugstarttime >= d.diagnosistime AND strftime('%Y-%m', m.drugstarttime) = strftime('%Y-%m', d.diagnosistime) GROUP BY m.drugname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['5 ml vial : metoprolol tartrate 1 mg/ml iv soln'], ['acetaminophen 325 mg po tabs'], ['atorvastatin calcium 40 mg po tabs'], ['metoprolol tartrate 25 mg po tabs'], ['metoprolol tartrate 50 mg po tabs'], ['potassium chloride 20 meq po pack'], ['warfarin sodium 5 mg po tabs'], ['warfarin sodium 7.5 mg po tabs']]",
            "pred_answer": "[['acetaminophen 325 mg po tabs'], ['metoprolol tartrate 25 mg po tabs'], ['potassium chloride 20 meq po pack'], ['warfarin sodium 5 mg po tabs'], ['warfarin sodium 7.5 mg po tabs']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses a simple ORDER BY \u2026 LIMIT 5 instead of applying DENSE_RANK() to include ties at the 5th rank as required by the \u201ctop N\u201d ranking assumption. All joins, filters, and groupings are otherwise correct\u2014the mistake is confined to the ranking logic in the SELECT/GROUP BY clause. This is a localized error that can be fixed by replacing LIMIT with DENSE_RANK(), without restructuring the query.",
            "error_type": "Local: ranking error"
        }
    },
    "llm2sql": {
        "a46876eb34d469b9a1e86ad1": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "How many patients were prescribed the medicine fentanyl (pf) 50 mcg/1 ml 2 ml syr within 2 months after a diagnosis of acute respiratory distress since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory distress' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'fentanyl (pf) 50 mcg/1 ml 2 ml syr' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT COUNT(DISTINCT medication.patientunitstayid) FROM diagnosis JOIN medication ON diagnosis.patientunitstayid = medication.patientunitstayid WHERE diagnosis.diagnosisname = 'acute respiratory distress' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') AND medication.drugname = 'fentanyl (pf) 50 mcg/1 ml 2 ml syr' AND datetime(medication.drugstarttime) > diagnosis.diagnosistime AND datetime(medication.drugstarttime) <= datetime(diagnosis.diagnosistime, '+2 months');",
            "gold_answer": "[['42.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL makes several localized mistakes that do not require a full rewrite of the query structure: 1) It counts DISTINCT medication.patientunitstayid instead of DISTINCT patient.uniquepid, so it\u2019s counting stays rather than patients. 2) It never restricts medication.drugstarttime to within one year ago, omitting the datetime(...) >= datetime('2100-12-31 23:59:00','-1 year') filter on the medication side. 3) It joins diagnosis and medication directly on patientunitstayid without involving the patient table, rather than using the two subqueries that separately filter by time. Each of these is a local reference or filter error in a specific clause, not a structural or multi-clause logical flaw.",
            "error_type": "Local: column reference/filter error"
        },
        "a590830e328017841d0ab99c": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Count the number of medicines that patient 017-100989 was prescribed last month.",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100989' ) ) AND datetime(medication.drugstarttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month')",
            "pred_sql": "SELECT COUNT(DISTINCT drugname) FROM medication WHERE patientunitstayid = (SELECT patientunitstayid FROM patient WHERE uniquepid = '017-100989') AND strftime('%Y-%m', drugstarttime) = '2100-11';",
            "gold_answer": "[['13.0']]",
            "pred_answer": "[['10.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the meaning of the original request. It only looks at a single patientunitstayid instead of all stays for that patient (missing multiple admissions), and it counts DISTINCT drugname rather than counting all prescriptions. These are not minor syntax mistakes but alter the core logic of which records are counted and how, so this is a global error.",
            "error_type": "Global: incorrect aggregation and join logic"
        },
        "274ba7a0a86a8577f1f612d2": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Since 1 year ago, how many patients received drug levels - serum drug levels within 2 months after being diagnosed with drug overdose- general?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'drug overdose- general' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'drug levels - serum drug levels' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 WHERE T1.diagnosistime < T2.treatmenttime AND datetime(T2.treatmenttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month')",
            "pred_sql": "SELECT COUNT(DISTINCT diagnosis.patientunitstayid) FROM diagnosis JOIN lab ON diagnosis.patientunitstayid = lab.patientunitstayid WHERE diagnosis.diagnosisname = 'drug overdose- general' AND diagnosis.diagnosistime >= datetime('2100-12-31 23:59:00', '-1 year') AND lab.labname = 'drug levels - serum' AND lab.labresulttime BETWEEN diagnosis.diagnosistime AND datetime(diagnosis.diagnosistime, '+2 months');",
            "gold_answer": "[['21.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the lab table and lab.labname to capture 'drug levels - serum' events, but the question and ground truth specify using the treatment table for 'drug levels - serum drug levels'. This mismatch in table selection and joins changes the overall logic\u2014lab and treatment are different event sources, resulting in incorrect data associations. Correcting this requires replacing the entire source and join logic, not just fixing a column or alias. Hence, it is a global error.",
            "error_type": "Global: join/table selection error"
        },
        "a81f17dbf22eeeeb8037c6b5": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "When was the first occasion that patient 004-10029 underwent a enteral feeds - oral feeds procedure?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-10029' ) ) AND treatment.treatmentname = 'enteral feeds - oral feeds' ORDER BY treatment.treatmenttime ASC LIMIT 1",
            "pred_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput JOIN patient ON intakeoutput.patientunitstayid = patient.patientunitstayid WHERE patient.uniquepid = '004-10029' AND intakeoutput.cellpath LIKE '%enteral feeds - oral feeds%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1;",
            "gold_answer": "[['2100-09-19 12:57:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the intakeoutput table and filters on intakeoutput.cellpath, whereas the correct query should use the treatment table and filter on treatment.treatmentname. This is not a minor typo or single-clause fix\u2014it fundamentally alters the source of data and the logic of the query, requiring a complete restructuring to reference the proper table and column.",
            "error_type": "Global: incorrect table reference"
        },
        "61a5db677312c21b1d6f74a1": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "This year, what are the top five most frequent procedures that patients received within 2 months after being diagnosed with obtundation?",
            "gold_sql": "SELECT T3.treatmentname FROM ( SELECT T2.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'obtundation' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmentname, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.treatmenttime AND datetime(T2.treatmenttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.treatmentname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT treatment.treatmentname, COUNT(treatment.treatmentid) AS procedure_count FROM diagnosis JOIN treatment ON diagnosis.patientunitstayid = treatment.patientunitstayid WHERE diagnosis.diagnosisname = 'obtundation' AND strftime('%Y', diagnosis.diagnosistime) = '2100' AND datetime(treatment.treatmenttime) BETWEEN datetime(diagnosis.diagnosistime) AND datetime(diagnosis.diagnosistime, '+2 months') GROUP BY treatment.treatmentname ORDER BY procedure_count DESC LIMIT 5;",
            "gold_answer": "[['enteral feeds - tube feeding'], ['foley catheter'], ['mechanical ventilation'], ['mechanical ventilation - pressure support'], ['stress ulcer prophylaxis - famotidine'], ['treatment of hypernatremia - free water administration']]",
            "pred_answer": "[['enteral feeds - tube feeding', '120.0'], ['foley catheter', '105.0'], ['mechanical ventilation - pressure support', '98.0'], ['stress ulcer prophylaxis - famotidine', '119.0'], ['treatment of hypernatremia - free water administration', '113.0']]",
            "is_correct": false,
            "reasoning": "The predicted query uses a simple ORDER BY ... LIMIT 5 rather than applying a DENSE_RANK() and selecting all treatments whose rank is <= 5, so it will drop tied procedures beyond the fifth position and fail to include all items with equal frequency (as the ground\u2010truth does). This isn\u2019t just a typo or missing column\u2014it undercuts the ranking logic and changes the intended result set. Therefore this is a global error in the overall query logic around ranking.",
            "error_type": "Global: ranking logic error"
        },
        "c4b4ffc15f3431f9c9be0382": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What does a esr lab test typically cost?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'lab' AND cost.eventid IN ( SELECT lab.labid FROM lab WHERE lab.labname = 'esr' )",
            "pred_sql": "SELECT DISTINCT cost FROM cost WHERE eventtype = 'lab';",
            "gold_answer": "[['8.88']]",
            "pred_answer": "[['10.03'], ['10.04'], ['10.06'], ['10.13'], ['10.17'], ['10.19'], ['10.26'], ['10.3'], ['10.4'], ['10.42'], ['10.45'], ['10.5'], ['10.57'], ['10.61'], ['10.62'], ['10.7'], ['10.79'], ['10.82'], ['10.98'], ['11.13'], ['11.14'], ['11.15'], ['11.5'], ['11.66'], ['6.23'], ['6.81'], ['6.91'], ['7.05'], ['7.38'], ['7.46'], ['7.55'], ['7.71'], ['7.72'], ['7.73'], ['7.75'], ['7.77'], ['7.82'], ['7.84'], ['7.9'], ['7.98'], ['8.08'], ['8.11'], ['8.13'], ['8.17'], ['8.2'], ['8.22'], ['8.23'], ['8.25'], ['8.27'], ['8.29'], ['8.3'], ['8.31'], ['8.34'], ['8.35'], ['8.37'], ['8.38'], ['8.47'], ['8.48'], ['8.51'], ['8.52'], ['8.59'], ['8.61'], ['8.63'], ['8.65'], ['8.66'], ['8.74'], ['8.75'], ['8.77'], ['8.78'], ['8.86'], ['8.88'], ['8.91'], ['8.92'], ['8.94'], ['8.95'], ['9.0'], ['9.01'], ['9.08'], ['9.11'], ['9.13'], ['9.14'], ['9.16'], ['9.21'], ['9.22'], ['9.24'], ['9.27'], ['9.28'], ['9.29'], ['9.32'], ['9.33'], ['9.37'], ['9.38'], ['9.44'], ['9.45'], ['9.47'], ['9.48'], ['9.5'], ['9.54'], ['9.56'], ['9.57']]",
            "is_correct": false,
            "reasoning": "The predicted query omits the filter that restricts the cost rows to those for the specific 'esr' lab (the subquery on lab.labid). Instead, it returns all lab costs by only checking eventtype='lab'. This is a localized mistake in the WHERE clause (a missing condition) and does not require restructuring the query\u2019s overall logic or joins.",
            "error_type": "Local: missing filter in WHERE clause"
        },
        "8df73cbaa10a750ff09381e3": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the 3-month survival rate for patients living with a bacteremia diagnosis?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'bacteremia' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "SELECT (CAST(SUM(CASE WHEN patient.hospitaldischargestatus = 'alive' AND datetime(patient.hospitaldischargetime) <= datetime(diagnosis.diagnosistime, '+91 days') THEN 1 ELSE 0 END) AS REAL) / COUNT(DISTINCT patient.patientunitstayid)) AS survival_rate FROM patient JOIN diagnosis ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname LIKE '%bacteremia%'",
            "gold_answer": "[['0.833']]",
            "pred_answer": "[['4.2']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally miscalculates the 3-month survival rate. It uses patientunitstayid instead of uniquepid, never filters out patients diagnosed less than three months ago, and incorrectly interprets survival by checking for \"alive\" and discharge within 91 days rather than survival beyond 3 months or expiration within that window. These issues span the cohort selection, date logic, grouping, and numerator/denominator calculation, altering the query\u2019s intended meaning and requiring structural changes across clauses.",
            "error_type": "Global: flawed survival calculation"
        },
        "d050f7add43df6e757dd7add": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Tell me the percentile of mch 30.1 among all patients of the same age as patient 006-104411 on the last hospital visit?",
            "gold_sql": "SELECT DISTINCT T1.C1 FROM ( SELECT lab.labresult, PERCENT_RANK() OVER ( ORDER BY lab.labresult ) AS C1 FROM lab WHERE lab.labname = 'mch' AND lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age = ( SELECT patient.age FROM patient WHERE patient.uniquepid = '006-104411' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) ) AS T1 WHERE T1.labresult = 30.1",
            "pred_sql": "WITH AgePatient AS ( SELECT age FROM patient WHERE uniquepid = '006-104411' ), LastVisitPatients AS ( SELECT patientunitstayid FROM patient WHERE age = (SELECT age FROM AgePatient) AND hospitaldischargetime IS NOT NULL AND patientunitstayid IN ( SELECT patientunitstayid FROM patient ORDER BY hospitaladmittime DESC ) ), MCHValues AS ( SELECT lab.labresult AS mch_value FROM lab WHERE lab.labname LIKE '%mch%' AND lab.patientunitstayid IN (SELECT patientunitstayid FROM LastVisitPatients) ), RankedMCH AS ( SELECT mch_value, NTILE(100) OVER(ORDER BY mch_value) AS percentile FROM MCHValues ) SELECT percentile FROM RankedMCH WHERE mch_value = 30.1;",
            "gold_answer": "[['0.504']]",
            "pred_answer": "[['23.0'], ['23.0'], ['23.0'], ['23.0'], ['24.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates fundamentally from the intended logic in multiple ways. First, it uses NTILE(100) instead of PERCENT_RANK(), which completely changes how the percentile is calculated (NTILE buckets results into integer groups rather than computing a 0\u20131 rank). Second, its CTE for \u2018LastVisitPatients\u2019 is wrong: it filters on hospitaldischargetime IS NOT NULL but then uses \u201cIN (SELECT patientunitstayid FROM patient ORDER BY hospitaladmittime DESC)\u201d without limiting to the most recent visit per patient, so it ends up including all visits rather than each patient\u2019s last one. Third, it matches labname with LIKE '%mch%' instead of exactly 'mch', potentially pulling unrelated tests. These issues span multiple clauses and alter the overall structure and semantics of the query, requiring a rewrite rather than a simple fix in one clause.",
            "error_type": "Global: incorrect ranking and visit-selection logic"
        },
        "dceb8374d4d0a4d482941c77": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "On the last hospital visit, what was the daily maximum dose of oral for patient 017-106093?",
            "gold_sql": "SELECT MAX(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-106093' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND intakeoutput.celllabel = 'oral' AND intakeoutput.cellpath LIKE '%intake%' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT MAX(total_daily_dose) AS max_daily_dose FROM ( SELECT date(m.drugstarttime) AS drug_date, SUM(CAST(dosage AS REAL)) AS total_daily_dose FROM patient p JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '017-106093' AND m.routeadmin = 'po' AND p.hospitaldischargetime IS NOT NULL ORDER BY p.hospitaladmittime DESC LIMIT 1 GROUP BY date(m.drugstarttime));",
            "gold_answer": "[['500.0']]",
            "pred_answer": "near \"GROUP\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL not only has a syntax error (ORDER BY and LIMIT before GROUP BY) but more fundamentally it uses the medication table instead of intakeoutput and sums dosage rather than intake volumes. This changes the overall logic and structure of the query\u2014joining the wrong table and misplacing clauses\u2014so a simple local fix won\u2019t suffice; the query needs to be restructured to follow the intended logic.",
            "error_type": "Global: incorrect table usage/structure error"
        },
        "04c45f5a7f141e001d812299": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What proportion of patients with a diagnosis of metabolic acidosis - drug induced survive over a 3-month period?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'metabolic acidosis - drug induced' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "SELECT 1.0 * SUM(CASE WHEN DATE(patient.hospitaldischargetime) <= DATE(diagnosis.diagnosistime, '+91 days') AND patient.hospitaldischargestatus = 'alive' THEN 1 ELSE 0 END) / COUNT(DISTINCT patient.patientunitstayid) FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'metabolic acidosis - drug induced';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally alters the survival calculation logic and overall structure. It uses DATE arithmetic instead of Julian day differences, applies the wrong survival condition (checks for 'alive' status instead of handling 'expired' within 3 months), fails to filter patients with sufficient follow-up time, and divides by patientunitstayid rather than uniquepid. These issues go beyond a simple localized fix and require reworking the query\u2019s core logic and grouping, classifying it as a global error.",
            "error_type": "Global: logic error"
        },
        "e42699f7b9f2da1b9e49877f": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What was the number of ct scan - with contrast procedures performed since 2100?",
            "gold_sql": "SELECT COUNT(*) FROM treatment WHERE treatment.treatmentname = 'ct scan - with contrast' AND strftime('%Y',treatment.treatmenttime) >= '2100'",
            "pred_sql": "SELECT COUNT(*) FROM treatment WHERE treatmentname = 'CT scan - with contrast' AND datetime(treatmenttime, 'start of year') >= datetime('2100-01-01 00:00:00')",
            "gold_answer": "[['24.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it uses the treatment name literal 'CT scan - with contrast' (uppercase \u2018CT\u2019) instead of the exact string 'ct scan - with contrast' as stored in the table. This is a simple value\u2010matching error that does not change the query\u2019s overall structure or logic. All other parts of the query remain correct\u2014the date condition still filters on events since 2100\u2014so the mistake is localized to the literal value comparison.",
            "error_type": "Local: value parsing error"
        },
        "7ee2887a56faa82c0b200471": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Tell me the top five most commonly prescribed medications within the same hospital visit to patients in their 40s who are diagnosed with obstructive sleep apnea since 1 year ago.",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'obstructive sleep apnea' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.age BETWEEN 40 AND 49 AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT M.drugname, COUNT(*) AS cnt FROM patient AS P JOIN diagnosis AS D ON P.patientunitstayid = D.patientunitstayid JOIN medication AS M ON P.patientunitstayid = M.patientunitstayid WHERE P.age BETWEEN 40 AND 49 AND D.diagnosisname = 'obstructive sleep apnea' AND D.diagnosistime >= datetime('2100-12-31 23:59:00', '-1 year') GROUP BY M.drugname ORDER BY cnt DESC LIMIT 5;",
            "gold_answer": "[['acetaminophen'], ['azithromycin'], ['dextrose 50%-water'], ['glucagon'], ['glucose'], ['hydrocodone 5 mg-acetaminophen 325 mg tablet'], ['magnesium sulfate 2 gram/50 ml iv piggy back 50 ml flex cont'], ['methylprednisolone sod suc(pf)'], ['tramadol']]",
            "pred_answer": "[['albuterol concentrated 0.5%', '20.0'], ['azithromycin', '17.0'], ['dextrose 50%-water', '25.0'], ['methylprednisolone sod suc(pf)', '25.0'], ['tramadol', '10.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the intended logic in several fundamental ways: 1) It joins diagnosis and medication only on patientunitstayid rather than patienthealthsystemstayid, thus not ensuring the same hospital visit. 2) It fails to enforce that the medication start time occurs after the diagnosis time (D.diagnosistime < M.drugstarttime). 3) It does not restrict medication events to within the past year. These omissions affect the overall query structure and data relationships, altering the core semantics of \"top five medications prescribed after diagnosis during the same hospital visit within one year.\" Fixing this would require adding join conditions and WHERE clauses that span multiple parts of the query, not just a minor tweak in a single clause.",
            "error_type": "Global: join-logic error"
        },
        "b2b0fd03fe9d704dfbe25030": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Pull up the ids of patients who were diagnosed with bradycardia - complete heart block.",
            "gold_sql": "SELECT DISTINCT patient.uniquepid FROM patient WHERE patient.patientunitstayid IN ( SELECT diagnosis.patientunitstayid FROM diagnosis WHERE diagnosis.diagnosisname = 'bradycardia - complete heart block' )",
            "pred_sql": "SELECT DISTINCT patientunitstayid FROM diagnosis WHERE diagnosisname = 'bradycardia - complete heart block';",
            "gold_answer": "[['012-11288'], ['021-101289'], ['027-100581'], ['031-11538']]",
            "pred_answer": "[['1254957.0'], ['2215881.0'], ['2778278.0'], ['3154626.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL selects diagnosis.patientunitstayid directly rather than retrieving patient.uniquepid from the patient table. The overall query structure (filtering by diagnosis name and deduplication) is correct, but the wrong column is returned. This is a localized mistake in the SELECT clause rather than a structural or multi-clause logical error.",
            "error_type": "Local: table/column reference error"
        },
        "2185bdc78a815e3114fbcbce": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What are the top three drugs that are prescribed to patients within 2 months after they are prescribed clopidogrel bisulfate 75 mg po tabs in 2100?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'clopidogrel bisulfate 75 mg po tabs' AND strftime('%Y',medication.drugstarttime) = '2100' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE strftime('%Y',medication.drugstarttime) = '2100' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.drugstarttime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.drugstarttime) AND datetime(T1.drugstarttime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "WITH clopidogrel_prescriptions AS ( SELECT DISTINCT patientunitstayid, drugstarttime FROM medication WHERE drugname = 'clopidogrel bisulfate 75 mg po tabs' AND strftime('%Y', drugstarttime) = '2100' ), subsequent_drugs AS ( SELECT m.drugname, m.patientunitstayid FROM medication m INNER JOIN clopidogrel_prescriptions c ON m.patientunitstayid = c.patientunitstayid WHERE m.drugstarttime > c.drugstarttime AND m.drugstarttime <= datetime(c.drugstarttime, '+2 months') AND m.drugname != 'clopidogrel bisulfate 75 mg po tabs' ) SELECT drugname FROM subsequent_drugs GROUP BY drugname ORDER BY COUNT(drugname) DESC LIMIT 3;",
            "gold_answer": "[['1000 ml flex cont : sodium chloride 0.9 % iv soln'], ['4 ml vial : furosemide 10 mg/ml ij soln'], ['potassium chloride crys er 20 meq po tbcr']]",
            "pred_answer": "[['4 ml vial : furosemide 10 mg/ml ij soln'], ['famotidine 20 mg po tabs'], ['vancomycin hcl 1000 mg iv solr']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses patientunitstayid instead of patient.uniquepid, causing it to count drug prescriptions per unit stay rather than per unique patient. This changes the intended logic of ranking drugs by the number of patients receiving them within two months after clopidogrel. The error affects the core aggregation and grouping logic of the query, requiring restructuring beyond a single clause.",
            "error_type": "Global: incorrect grouping/aggregation logic"
        },
        "f36aeace3637e368c0ee332f": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "For patients that are given glucagon 1 mg (1 unit) inj since 1 year ago, what are the top three drugs that they are prescribed afterwards within the same month?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'glucagon 1 mg (1 unit) inj' AND datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.drugstarttime < T2.drugstarttime AND datetime(T1.drugstarttime,'start of month') = datetime(T2.drugstarttime,'start of month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT drugname FROM medication WHERE medicationid IN (SELECT DISTINCT subsequent.medicationid FROM medication AS initial JOIN medication AS subsequent ON initial.patientunitstayid = subsequent.patientunitstayid WHERE initial.drugname = 'glucagon 1 mg (1 unit) inj' AND datetime(initial.drugstarttime) >= datetime('2100-12-31 23:59:00', '-1 year') AND datetime(initial.drugstarttime, 'start of month') = datetime(subsequent.drugstarttime, 'start of month') AND subsequent.drugname <> 'glucagon 1 mg (1 unit) inj') GROUP BY drugname ORDER BY COUNT(*) DESC LIMIT 3;",
            "gold_answer": "[['fentanyl (pf) 50 mcg/1 ml 2 ml inj'], ['insulin-glargine *unit* inj'], ['magnesium sulfate 2 gm/50 ml ivpb']]",
            "pred_answer": "[['dextrose 50% 25 gram/50 ml syr'], ['glucose 15 gram/60 ml bq liq'], ['sodium chloride 0.9% 1000 ml lvp']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the requirement that the \u201csubsequent\u201d drug event must occur after the initial glucagon administration (i.e. initial.drugstarttime < subsequent.drugstarttime). This is a missing condition in the WHERE clause/join logic but does not alter the overall structure of the query. It is a localized error in the temporal condition, so it is classified as a Local error.",
            "error_type": "Local: other-temporal error"
        },
        "e01c792f66d80f91b861252e": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "For patients who underwent cpap/peep therapy - 10-15 cm h2o since 1 year ago, what are the four most common diagnoses within the same month?",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'cpap/peep therapy - 10-15 cm h2o' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.diagnosistime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.diagnosistime,'start of month') GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH RecentTreatments AS ( SELECT patientunitstayid, treatmenttime FROM treatment WHERE treatmentname LIKE '%cpap/peep therapy%' AND treatmenttime >= datetime('2100-12-31 23:59:00', '-1 year') AND treatmentname LIKE '%10-15 cm h2o%' ) SELECT d.diagnosisname FROM diagnosis d JOIN RecentTreatments rt ON d.patientunitstayid = rt.patientunitstayid WHERE strftime('%Y-%m', d.diagnosistime) = strftime('%Y-%m', rt.treatmenttime) GROUP BY d.diagnosisname ORDER BY COUNT(*) DESC LIMIT 4",
            "gold_answer": "[['acute coronary syndrome - myocardial ischemia'], ['acute respiratory failure'], ['ards'], ['atrial fibrillation'], ['bladder ca'], ['hematological effect of infection - bandemia'], ['hematological effect of infection - leukocytosis'], ['lower urinary tract infection'], ['septic shock']]",
            "pred_answer": "[['hematological effect of infection - bandemia'], ['hematological effect of infection - leukocytosis'], ['lower urinary tract infection'], ['septic shock']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic by (1) joining diagnosis and treatment on patientunitstayid instead of patient.uniquepid (thus tying events to the same ICU stay rather than the same patient) and (2) omitting the required condition that the treatment time precede the diagnosis time. These are not isolated syntax mistakes but core logical flaws spanning multiple clauses (JOIN and WHERE). Hence, this is a Global error.",
            "error_type": "Global: join logic error"
        },
        "602b90586b2027249be814c5": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the monthly average volume of urine that patient 012-10772 had on the first hospital visit?",
            "gold_sql": "SELECT AVG(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-10772' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND intakeoutput.celllabel = 'urine' AND intakeoutput.cellpath LIKE '%output%' GROUP BY strftime('%Y-%m',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT SUM(io.cellvaluenumeric) / (JULIANDAY(p.hospitaldischargetime) - JULIANDAY(p.hospitaladmittime)) * 30 AS monthly_average FROM intakeoutput io INNER JOIN patient p ON io.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '012-10772' AND io.cellpath LIKE '%urine%' AND p.hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '012-10772' );",
            "gold_answer": "[['156.667'], ['97.5']]",
            "pred_answer": "[['12297.987']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the aggregation logic: instead of grouping by month and averaging monthly totals (as required), it sums all urine outputs over the first stay and divides by the length of stay to estimate a monthly rate. It also uses io.cellpath LIKE '%urine%' instead of filtering on celllabel = 'urine'. These errors alter the core structure and intended meaning of the query, not just a minor clause fix.",
            "error_type": "Global: incorrect aggregation and filtering logic"
        },
        "718699d9458da53c8e30bbaa": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "How many hours have passed since the last time patient 012-10585 got the antibacterials on the current hospital visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',treatment.treatmenttime) ) FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '012-10585' AND patient.hospitaldischargetime IS NULL ) ) AND treatment.treatmentname = 'antibacterials' ORDER BY treatment.treatmenttime DESC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', MAX(m.drugstoptime))) / 3600 AS hours_since_last_antibacterial FROM medication m JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '012-10585' AND p.hospitaldischargetime IS NULL AND m.drugname LIKE '%antibacterial%';",
            "gold_answer": "[['97.367']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and drugstoptime (filtered by drugname LIKE '%antibacterial%') instead of the treatment table and treatmenttime with treatmentname = 'antibacterials'. This is not a local typo or minor syntax issue\u2014it fundamentally changes which events are considered and from which table, altering the query\u2019s logic and intended meaning. Therefore, this is a global error.",
            "error_type": "Global: wrong table/column usage"
        },
        "e8121858a0141075cd31178d": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What are the charges for a procedure called pulmonary resection?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'treatment' AND cost.eventid IN ( SELECT treatment.treatmentid FROM treatment WHERE treatment.treatmentname = 'pulmonary resection' )",
            "pred_sql": "SELECT DISTINCT cost FROM cost WHERE eventtype = 'treatment'",
            "gold_answer": "[['8.39']]",
            "pred_answer": "[['10.01'], ['4.17'], ['4.33'], ['4.39'], ['4.4'], ['4.64'], ['4.74'], ['4.79'], ['4.8'], ['4.82'], ['4.88'], ['4.92'], ['4.98'], ['5.04'], ['5.06'], ['5.11'], ['5.13'], ['5.14'], ['5.15'], ['5.16'], ['5.17'], ['5.19'], ['5.28'], ['5.29'], ['5.3'], ['5.31'], ['5.32'], ['5.33'], ['5.34'], ['5.35'], ['5.45'], ['5.47'], ['5.48'], ['5.51'], ['5.52'], ['5.55'], ['5.56'], ['5.57'], ['5.58'], ['5.61'], ['5.62'], ['5.64'], ['5.65'], ['5.66'], ['5.69'], ['5.7'], ['5.71'], ['5.72'], ['5.73'], ['5.74'], ['5.75'], ['5.76'], ['5.78'], ['5.79'], ['5.8'], ['5.83'], ['5.84'], ['5.85'], ['5.87'], ['5.88'], ['5.89'], ['5.9'], ['5.91'], ['5.93'], ['5.94'], ['5.96'], ['5.97'], ['5.98'], ['6.0'], ['6.01'], ['6.02'], ['6.03'], ['6.04'], ['6.05'], ['6.06'], ['6.07'], ['6.08'], ['6.09'], ['6.1'], ['6.11'], ['6.12'], ['6.13'], ['6.14'], ['6.15'], ['6.17'], ['6.18'], ['6.19'], ['6.21'], ['6.22'], ['6.23'], ['6.24'], ['6.25'], ['6.26'], ['6.27'], ['6.28'], ['6.29'], ['6.3'], ['6.31'], ['6.32'], ['6.33']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the filter linking cost.eventid to the treatment table for 'pulmonary resection'. It simply selects all treatment costs without constraining to the specific procedure. This is a localized mistake in the WHERE clause (a missing filter) and does not require altering the overall query structure or joins.",
            "error_type": "Local: missing WHERE condition"
        },
        "62dc915b80b2af835e9f281f": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Since 1 year ago, what are the top four most common specimens tested on patients within 2 months after the diagnosis of peritonitis - spontaneous bacterial?",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'peritonitis - spontaneous bacterial' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.culturetakentime AND datetime(T2.culturetakentime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT T2.culturesite, COUNT(*) as NumTests FROM diagnosis AS T1 JOIN microlab AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.diagnosisname = 'peritonitis - spontaneous bacterial' AND datetime(T1.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') AND datetime(T2.culturetakentime) <= datetime(T1.diagnosistime, '+2 months') GROUP BY T2.culturesite ORDER BY NumTests DESC LIMIT 4;",
            "gold_answer": "[['nasopharynx']]",
            "pred_answer": "[['blood, venipuncture', '12.0'], ['nasopharynx', '6.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only applies an upper bound on microlab.culturetakentime (<= diagnosis time + 2 months) but omits the lower bound (>= diagnosis time). This mistake is confined to the WHERE clause filters and does not require restructuring joins or the overall query logic. It is a localized error in the condition logic.",
            "error_type": "Local: incorrect WHERE clause filter"
        },
        "ab74a84f2dac454c1858fb2c": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "When did patient 031-10510's first microbiological test occur on the first hospital visit?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10510' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) ORDER BY microlab.culturetakentime ASC LIMIT 1",
            "pred_sql": "SELECT T2.culturetakentime FROM patient AS T1 INNER JOIN microlab AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '031-10510' ORDER BY T1.hospitaladmittime ASC LIMIT 1;",
            "gold_answer": "[['2100-05-20 17:15:00']]",
            "pred_answer": "[['2100-05-30 22:27:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins patient and microlab directly and orders only by the patient admission time, without filtering for the first completed hospital visit (hospitaldischargetime IS NOT NULL) or ordering by the test time within that visit. This changes the overall logic of the query\u2014it does not properly identify the first hospital encounter nor the earliest microbiological test within that encounter. Fixing this would require restructuring the query (adding subqueries or additional filters and ordering by microlab.culturetakentime), not just tweaking a single clause.",
            "error_type": "Global: flawed join and ordering logic"
        },
        "9850b09854dcbb18771ddd9c": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What were the number of patients who received a ptt ratio test since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'ptt ratio' AND datetime(lab.labresulttime) >= datetime('2100-12-31 23:59:00','-1 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT patientunitstayid) FROM lab WHERE labname = 'ptt ratio' AND datetime(labresulttime) >= datetime('2100-12-31 23:59:00', '-1 year')",
            "gold_answer": "[['20.0']]",
            "pred_answer": "[['22.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL counts DISTINCT patientunitstayid directly from the lab table, effectively counting distinct ICU stays rather than distinct patients. The ground truth SQL first identifies patientunitstayid values from the lab table and then counts DISTINCT patient.uniquepid in the patient table, ensuring that the result is the number of unique patients. By omitting the patient table join and using the wrong field for counting, the predicted query fundamentally alters the query\u2019s intended meaning\u2014counting stays instead of patients.",
            "error_type": "Global: join error"
        },
        "017a9b0a55f8e7958d82ef86": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the number of days since patient 002-10122 was first diagnosed with acute respiratory failure on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) ) FROM diagnosis WHERE diagnosis.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-10122' AND patient.hospitaldischargetime IS NULL ) ) AND diagnosis.diagnosisname = 'acute respiratory failure' ORDER BY diagnosis.diagnosistime ASC LIMIT 1",
            "pred_sql": "SELECT ROUND((julianday('2100-12-31 23:59:00') - julianday(D1.diagnosistime)), 0) AS days_since_diagnosis FROM patient AS P INNER JOIN diagnosis AS D1 ON P.patientunitstayid = D1.patientunitstayid WHERE P.uniquepid = '002-10122' AND D1.diagnosisname = 'acute respiratory failure' AND P.hospitaldischargetime IS NULL ORDER BY D1.diagnosistime ASC LIMIT 1",
            "gold_answer": "[['2.255']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates only in the SELECT clause by using ROUND(..., 0) on the day difference, producing an integer value with one decimal (\u20182.0\u2019) instead of the more precise float rounded to three decimals (\u20182.255\u2019) as required. The join logic, table references, and WHERE filters correctly identify the current hospital visit and diagnosis, so the structural and logical flow remains intact. The only mistake is the local rounding of the numerical result.",
            "error_type": "Local: rounding error"
        },
        "e9326e10e6866dba320fa072": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What's the rdw change of patient 032-10133 last measured on the last hospital visit compared to the second to last value measured on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '032-10133' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'rdw' ORDER BY lab.labresulttime DESC LIMIT 1 ) - ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '032-10133' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'rdw' ORDER BY lab.labresulttime DESC LIMIT 1 OFFSET 1 )",
            "pred_sql": "WITH cte_last_hospital_visit AS ( SELECT patientunitstayid FROM patient WHERE uniquepid = '032-10133' AND hospitaldischargetime IS NOT NULL ORDER BY hospitaladmittime DESC LIMIT 1 ), rdw_values AS ( SELECT lab.labresult as rdw_value, lab.labresulttime FROM lab JOIN cte_last_hospital_visit ON lab.patientunitstayid = cte_last_hospital_visit.patientunitstayid WHERE lab.labname = 'rdw' ORDER BY lab.labresulttime DESC ) SELECT rdw_value AS last_value FROM rdw_values LIMIT 1 UNION ALL SELECT rdw_value FROM rdw_values LIMIT 1 OFFSET 1;",
            "gold_answer": "[['-0.3']]",
            "pred_answer": "LIMIT clause should come after UNION ALL not before",
            "is_correct": false,
            "reasoning": "The predicted SQL misuses the LIMIT clause by placing it before the UNION ALL, leading to a syntax error. This is a localized mistake in clause ordering and does not involve changes to the overall query logic or table relationships.",
            "error_type": "Local: syntax error"
        },
        "9fd4b99007cf93788de4e605": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the maximum total cost for the hospital when a troponin - i lab test is involved since 2100?",
            "gold_sql": "SELECT MAX(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.patientunitstayid IN ( SELECT lab.patientunitstayid FROM lab WHERE lab.labname = 'troponin - i' ) ) AND strftime('%Y',cost.chargetime) >= '2100' GROUP BY cost.patienthealthsystemstayid ) AS T1",
            "pred_sql": "SELECT MAX(total_cost) AS max_total_cost FROM (SELECT SUM(cost.cost) AS total_cost FROM cost JOIN lab ON cost.patientunitstayid = lab.patientunitstayid WHERE lab.labname = 'troponin - i' AND datetime(lab.labresulttime) >= datetime('2100-01-01') GROUP BY cost.patienthealthsystemstayid);",
            "gold_answer": "[['25887.21']]",
            "pred_answer": "[['176405.04']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes how costs are associated with troponin - i labs by joining cost and lab on patientunitstayid instead of linking via patienthealthsystemstayid (and filtering cost.chargetime rather than lab.labresulttime). This incorrect join and grouping logic alters the intended mapping between cost records and lab events, producing a completely different result. Such an error spans multiple clauses and breaks the core relationship between tables, requiring a structural fix rather than a minor tweak.",
            "error_type": "Global: incorrect join error"
        },
        "810edfc3207a29bef5ac27c2": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What is the number of times that patient 013-10029 had a urine event on 10/07/this year?",
            "gold_sql": "SELECT COUNT(*) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10029' ) ) AND intakeoutput.cellpath LIKE '%output%' AND intakeoutput.celllabel = 'urine' AND datetime(intakeoutput.intakeoutputtime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') AND strftime('%m-%d',intakeoutput.intakeoutputtime) = '10-07'",
            "pred_sql": "SELECT COUNT(*) FROM intakeoutput WHERE patientunitstayid IN (SELECT patientunitstayid FROM patient WHERE uniquepid = '013-10029') AND cellpath LIKE '%urine%' AND datetime(intakeoutputtime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of year', '-0 year') AND strftime('%m-%d', intakeoutputtime) = '10-07'",
            "gold_answer": "[['4.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL has multiple mistakes confined to its WHERE clause: it filters cellpath with '%urine%' instead of checking cellpath LIKE '%output%' and celllabel = 'urine', it compares datetime(intakeoutputtime, 'start of day') to a 'start of year' timestamp (so the date\u2010filter is wrong), and it simplifies the patientunitstayid lookup incorrectly (omitting the patienthealthsystemstayid subquery). All of these issues are localized to specific conditions rather than the overall query structure or logic.",
            "error_type": "Local: temporal and filter condition errors"
        },
        "616d4bc79f0d39ba25a8112d": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What are the five most frequently ordered medications that female patients aged 60 or above are prescribed within 2 months after they are diagnosed with bone fracture(s) - left upper extremity this year?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'bone fracture(s) - left upper extremity' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.gender = 'female' AND patient.age >= 60 AND datetime(medication.drugstarttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 month') GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT medication.drugname FROM patient JOIN diagnosis ON patient.patientunitstayid = diagnosis.patientunitstayid JOIN medication ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.gender = 'female' AND CAST(patient.age AS INTEGER) >= 60 AND diagnosis.diagnosisname = 'bone fracture(s) - left upper extremity' AND strftime('%Y', diagnosis.diagnosistime) = '2100' AND datetime(medication.drugstarttime) BETWEEN datetime(diagnosis.diagnosistime) AND datetime(diagnosis.diagnosistime, '+2 months') GROUP BY medication.drugname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['acetaminophen 650mg rect supp'], ['albumin 5% 500 ml inj'], ['albuterol 2.5 mg/3 ml ud inh soln'], ['carvedilol 3.125 mg tab'], ['ceftriaxone 1 gram in ns 50 ml ivpb'], ['diphenhydramine 50 mg/1 ml 1 ml inj'], ['folic acid 1 mg tab'], ['lactated ringers 1000 ml lvp'], ['levofloxacin 750 mg in d5w 150ml'], ['metoprolol 1 mg/ml 5ml sdv inj'], ['naloxone 0.4 mg/1 ml sdv inj'], ['ondansetron 2 mg/1 ml 2ml sdv inj'], ['percocet 5/325 tab'], ['potassium chloride 20 meq tr tab'], ['senokot-s tab']]",
            "pred_answer": "[['albumin 5% 500 ml inj'], ['carvedilol 3.125 mg tab'], ['ceftriaxone 1 gram in ns 50 ml ivpb'], ['levofloxacin 750 mg in d5w 150ml'], ['metoprolol 1 mg/ml 5ml sdv inj']]",
            "is_correct": false,
            "reasoning": "The predicted SQL is structurally similar to the ground\u2010truth: it still joins patient, diagnosis, and medication, applies the same gender/age/diagnosis filters, enforces the 2-month window, groups by drugname, and limits to the top\u20105. The only substantive deviation is that it never restricts medication start times to the current year (as required by the assumptions and as done in the ground\u2010truth\u2019s T2 subquery). This is a missing WHERE\u2010clause filter (a localized temporal condition), not a flaw in the overall logic or join strategy. Therefore, the error is local.",
            "error_type": "Local: missing temporal filter for medication events"
        },
        "b6aa0837ace2e0c90b15be92": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Tell me the top four most frequent procedures that patients received within the same hospital visit after being diagnosed with encephalitis - viral.",
            "gold_sql": "SELECT T3.treatmentname FROM ( SELECT T2.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'encephalitis - viral' ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmentname, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.treatmentname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "SELECT T.treatmentname, COUNT(*) as frequency FROM diagnosis D JOIN treatment T ON D.patientunitstayid = T.patientunitstayid WHERE D.diagnosisname = 'encephalitis - viral' AND T.treatmenttime > D.diagnosistime GROUP BY T.treatmentname ORDER BY frequency DESC LIMIT 4;",
            "gold_answer": "[['anticonvulsant - levetiracetam'], ['antiviral therapy - acyclovir'], ['eeg'], ['electrolyte administration - intravenous'], ['electrolyte administration - oral'], ['electrolyte administration - potassium'], ['foley catheter'], ['head ct scan'], ['insulin - continuous infusion'], ['lumbar puncture'], ['mri - head'], ['normal saline administration'], ['oxygen therapy (< 40%) - nasal cannula'], ['vasodilating agent - iv - nicardipine'], ['vte prophylaxis - compression boots'], ['vte prophylaxis - conventional heparin therapy']]",
            "pred_answer": "[['insulin - continuous infusion', '9.0'], ['lumbar puncture', '9.0'], ['oxygen therapy (< 40%) - nasal cannula', '9.0'], ['vte prophylaxis - compression boots', '9.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins diagnosis and treatment on patientunitstayid, but the question asks for procedures within the same hospital visit (patienthealthsystemstayid). By using the wrong key, it fundamentally alters the data association and scope of the query. This is not a simple column typo\u2014it changes the join logic and requires restructuring the query to use patienthealthsystemstayid, so it is a global logic error.",
            "error_type": "Global: incorrect join key"
        },
        "90fc8fa81b2c8abb424a1228": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What are the four most frequently prescribed medications for patients in their 20s?",
            "gold_sql": "SELECT T1.drugname FROM ( SELECT medication.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 20 AND 29 ) GROUP BY medication.drugname ) AS T1 WHERE T1.C1 <= 4",
            "pred_sql": "SELECT medication.drugname, COUNT(medication.medicationid) AS frequency FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE CAST(patient.age AS INTEGER) BETWEEN 20 AND 29 GROUP BY medication.drugname ORDER BY frequency DESC LIMIT 4;",
            "gold_answer": "[['100 ml flex cont : sodium chloride 0.9 % iv soln'], ['acetaminophen 325 mg po tabs'], ['ativan'], ['potassium chloride'], ['sodium chloride 0.9 % ij soln'], ['sodium chloride 0.9 % iv : 1000 ml']]",
            "pred_answer": "[['100 ml flex cont : sodium chloride 0.9 % iv soln', '17.0'], ['ativan', '22.0'], ['potassium chloride', '18.0'], ['sodium chloride 0.9 % iv : 1000 ml', '15.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL correctly joins medication with patient and filters ages 20\u201329, and it groups and orders by prescription count. However, it uses ORDER BY \u2026 LIMIT 4 instead of applying DENSE_RANK() to include ties for the fourth rank, and it returns both drug names and their counts rather than only the drug names. These are errors localized to the SELECT and ranking logic without altering table relationships or the overall query structure.",
            "error_type": "Local: top-N ranking and projection error"
        },
        "ee5ae34a56ec77cfa4217ecd": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What are the top four most frequent diagnoses that patients are given within the same hospital visit after being diagnosed with ventricular premature beats since 1 year ago?",
            "gold_sql": "SELECT T3.diagnosisname FROM ( SELECT T2.diagnosisname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'ventricular premature beats' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.diagnosistime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.diagnosisname ) AS T3 WHERE T3.C1 <= 4",
            "pred_sql": "WITH initial_diagnosis AS ( SELECT D1.patientunitstayid, D1.diagnosistime FROM diagnosis AS D1 WHERE D1.diagnosisname = 'ventricular premature beats' AND datetime(D1.diagnosistime) >= datetime('2100-12-31 23:59:00', '-1 year') ), subsequent_diagnoses AS ( SELECT D2.diagnosisname FROM initial_diagnosis AS ID INNER JOIN diagnosis AS D2 ON ID.patientunitstayid = D2.patientunitstayid WHERE datetime(D2.diagnosistime) > datetime(ID.diagnosistime) AND D2.diagnosisname <> 'ventricular premature beats' ) SELECT D2.diagnosisname, COUNT(D2.diagnosisname) AS frequency FROM subsequent_diagnoses AS D2 GROUP BY D2.diagnosisname ORDER BY frequency DESC LIMIT 4",
            "gold_answer": "[['atrial flutter'], ['bipolar disorder'], ['breast ca'], ['cardiomyopathy'], ['coagulopathy - coumadin administration'], ['congestive heart failure'], ['copd'], ['coronary artery disease - known'], ['hyperlipidemia'], ['obstructive sleep apnea'], ['ventricular fibrillation'], ['ventricular tachycardia']]",
            "pred_answer": "[['congestive heart failure', '13.0'], ['obstructive sleep apnea', '13.0'], ['ventricular fibrillation', '13.0'], ['ventricular tachycardia', '13.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to enforce the \u201csame hospital visit\u201d requirement by joining only on patientunitstayid rather than patienthealthsystemstayid, fundamentally altering which diagnoses are grouped together. It also introduces a COUNT in the final SELECT, violating the assumption that only the diagnosis names should be returned for a top-N list. These issues go beyond a simple typo or syntax mistake in one clause and change the overall logic of the query, requiring significant restructuring to correct.",
            "error_type": "Global: incorrect join and output structure"
        },
        "2791f3d7ba24deb3fd9b5d0b": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "On the first hospital visit, when did patient 031-10095 receive the first nasopharynx microbiology test?",
            "gold_sql": "SELECT microlab.culturetakentime FROM microlab WHERE microlab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '031-10095' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) AND microlab.culturesite = 'nasopharynx' ORDER BY microlab.culturetakentime ASC LIMIT 1",
            "pred_sql": "SELECT MIN(T2.culturetakentime) AS first_microbiology_test FROM patient AS T1 INNER JOIN microlab AS T2 ON T1.patientunitstayid = T2.patientunitstayid WHERE T1.uniquepid = '031-10095' AND T1.hospitaldischargetime IS NOT NULL ORDER BY T1.hospitaladmittime ASC LIMIT 1 AND T2.culturesite = 'nasopharynx'",
            "gold_answer": "[['2100-02-09 15:50:00']]",
            "pred_answer": "no such column: T2.culturesite",
            "is_correct": false,
            "reasoning": "The predicted query misplaces the filter on T2.culturesite after the LIMIT clause, causing SQLite to interpret it as a column reference in the LIMIT/ORDER BY context. This is a localized syntax/column reference error that can be fixed by moving AND T2.culturesite = 'nasopharynx' into the WHERE clause and properly ordering the ORDER BY and LIMIT clauses. The overall query logic and join structure remain intact.",
            "error_type": "Local: table/column reference error"
        },
        "f551c3dec5e7817a5dee59e7": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "Among patients who are prescribed with lactated ringers injection 1,000 ml, what are the top three most frequently prescribed drugs at the same time?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'lactated ringers injection 1,000 ml' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT other_med.drugname, COUNT(*) AS prescription_count FROM medication AS lr_med JOIN medication AS other_med ON lr_med.patientunitstayid = other_med.patientunitstayid AND lr_med.drugstarttime <= other_med.drugstoptime AND lr_med.drugstoptime >= other_med.drugstarttime WHERE lr_med.drugname = 'lactated ringers injection 1,000 ml' AND other_med.drugname <> 'lactated ringers injection 1,000 ml' GROUP BY other_med.drugname ORDER BY prescription_count DESC LIMIT 3;",
            "gold_answer": "[['dilaudid'], ['fentanyl'], ['lactated ringers injection 1,000 ml']]",
            "pred_answer": "[['dilaudid', '20.0'], ['fentanyl', '43.0'], ['zofran', '26.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the join condition from matching identical start times (as required to find drugs prescribed at the exact same time) to an interval-overlap condition (lr_med.drugstarttime <= other_med.drugstoptime AND lr_med.drugstoptime >= other_med.drugstarttime). This alters the core logic of how co-prescribed drugs are identified, affecting the overall meaning and results of the query. The error spans the JOIN strategy and requires restructuring beyond a simple fix in a single clause.",
            "error_type": "Global: incorrect join logic"
        },
        "8b621dd46769f8f16098888e": {
            "db_id": "eicu",
            "generator_name": "llm2sql",
            "question": "What was the change in chloride in patient 021-105581 last measured on the last hospital visit compared to the second to last value measured on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '021-105581' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'chloride' ORDER BY lab.labresulttime DESC LIMIT 1 ) - ( SELECT lab.labresult FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '021-105581' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1 ) ) AND lab.labname = 'chloride' ORDER BY lab.labresulttime DESC LIMIT 1 OFFSET 1 )",
            "pred_sql": "SELECT MAX(LAB2.LABRESULT) - MIN(LAB2.LABRESULT) AS chloride_change FROM (SELECT LAB.labresult FROM lab LAB JOIN patient PAT ON LAB.patientunitstayid = PAT.patientunitstayid WHERE PAT.uniquepid = '021-105581' AND PAT.hospitaldischargetime IS NOT NULL AND LAB.labname = 'chloride' ORDER BY LAB.labresulttime DESC LIMIT 2) AS LAB2;",
            "gold_answer": "[['-1.0']]",
            "pred_answer": "[['1.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL pulls the two most recent chloride values but then uses MAX() - MIN(), which computes an absolute difference rather than \u201cmost recent minus second most recent.\u201d This is a mistake confined to the SELECT clause\u2019s aggregation logic and does not alter joins or overall query structure. Hence, it\u2019s a local error.",
            "error_type": "Local: aggregate misuse"
        }
    },
    "qwen3": {
        "2288358aa2f90ce1ea419f03": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What are the five most frequently ordered lab tests this year for patients of age 40s?",
            "gold_sql": "SELECT T1.labname FROM ( SELECT lab.labname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age BETWEEN 40 AND 49 ) AND datetime(lab.labresulttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') GROUP BY lab.labname ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT lab.labname FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid WHERE patient.age >= '40' AND patient.age <= '49' AND strftime('%Y', lab.labresulttime) = '2100' GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['bedside glucose'], ['glucose'], ['hct'], ['hgb'], ['potassium'], ['sodium']]",
            "pred_answer": "[['bedside glucose'], ['glucose'], ['hct'], ['hgb'], ['potassium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL is structurally similar to the ground truth: it correctly joins lab to patient, filters ages 40\u201349, restricts to this year, groups by labname, and orders by COUNT(*) DESC. The only difference is that the ground truth uses DENSE_RANK() to capture ties at the fifth position (including 'sodium'), whereas the predicted query uses LIMIT 5 and thus omits any tied 5th-rank items. This mistake is confined to the top-N ranking logic and does not require altering joins, filters, or the overall query structure.",
            "error_type": "Local: ranking error"
        },
        "f45ca3219aafadeec48edf98": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Among those who are prescribed with ultram, what are the three most commonly prescribed drugs at the same time?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = 'ultram' ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE datetime(T1.drugstarttime) = datetime(T2.drugstarttime) GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT drugname FROM ( SELECT DISTINCT m.patientunitstayid, m.drugname FROM medication m WHERE m.patientunitstayid IN ( SELECT DISTINCT patientunitstayid FROM medication WHERE drugname LIKE '%ultram%' ) AND m.drugname NOT LIKE '%ultram%' ) GROUP BY drugname ORDER BY COUNT(*) DESC LIMIT 3;",
            "gold_answer": "[['milk of magnesia'], ['narcan'], ['norco'], ['ultram'], ['zofran']]",
            "pred_answer": "[['klor-con'], ['lasix'], ['sodium chloride 0.9 % iv : 1000 ml']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the critical join on drugstarttime to ensure co\u2010prescriptions occur \u201cat the same time.\u201d Instead, it simply finds all other drugs prescribed at any time during the patient\u2019s stay and ranks them. This fundamentally changes the query\u2019s logic and output, since it no longer restricts to simultaneous prescriptions of ultram. Fixing this would require restructuring the query to join medication records on matching drugstarttime, not just filtering by patientunitstayid. Hence, the error is not a simple typo or minor clause fix but a core logical/structural flaw in how the tables are combined.",
            "error_type": "Global: join-strategy error"
        },
        "05ba864d3e4a7ee0d0933a8d": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "When did patient 017-100600 come for the last time to the hospital?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '017-100600' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(hospitaldischargetime) AS last_visit FROM patient WHERE uniquepid = '017-100600' AND hospitaldischargetime IS NOT NULL;",
            "gold_answer": "[['2100-08-09 22:05:00']]",
            "pred_answer": "[['2100-08-13 19:27:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses MAX(hospitaldischargetime) instead of retrieving the last hospitaladmittime. This is a simple column reference mistake (using the discharge time rather than the admit time) and can be fixed by selecting MAX(hospitaladmittime) or by ordering and limiting on hospitaladmittime. It does not require restructuring the query\u2019s joins or logic beyond correcting the column name.",
            "error_type": "Local: column reference error"
        },
        "5b7e59064a534ba9cf05d2cd": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many days have elapsed since the first time on the current hospital visit patient 004-10202 received a lab test for alt (sgpt)?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',lab.labresulttime) ) FROM lab WHERE lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '004-10202' AND patient.hospitaldischargetime IS NULL ) ) AND lab.labname = 'alt (sgpt)' ORDER BY lab.labresulttime ASC LIMIT 1",
            "pred_sql": "SELECT CAST((julianday('2100-12-31 23:59:00') - julianday(earliest_lab_time)) AS INTEGER) AS days_elapsed FROM ( SELECT MIN(labresulttime) AS earliest_lab_time FROM lab WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '004-10202' AND hospitaldischargetime IS NULL ) AND (labname = 'alt' OR labname = 'sgpt') );",
            "gold_answer": "[['4.02']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL incorrectly splits the lab name filter into labname = 'alt' OR labname = 'sgpt' instead of matching the single value 'alt (sgpt)'. This is a localized mistake in the WHERE clause value filter and can be fixed by correcting the literal without altering the overall query structure.",
            "error_type": "Local: value parsing error"
        },
        "1a00dd0718094715b48766e9": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many patients had antithyroid therapy - methimazole done since 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT patient.uniquepid ) FROM patient WHERE patient.patientunitstayid IN ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'antithyroid therapy - methimazole' AND strftime('%Y',treatment.treatmenttime) >= '2100' )",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM medication m JOIN patient p ON m.patientunitstayid = p.patientunitstayid WHERE m.drugname LIKE '%methimazole%' AND datetime(m.drugstarttime) >= '2100-01-01 00:00:00';",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication table and filters on m.drugname and m.drugstarttime, whereas the correct logic requires querying the treatment table for treatmentname = 'antithyroid therapy - methimazole'. This is not a minor syntax mistake but a fundamental misuse of tables and relationships, altering the intended semantics of the query. To fix it would require restructuring the query to target the treatment table rather than a simple local correction within a clause.",
            "error_type": "Global: incorrect table usage"
        },
        "ae12d280809717b148037f25": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many times was ondansetron hcl last month prescribed to patient 025-17363?",
            "gold_sql": "SELECT COUNT(*) FROM medication WHERE medication.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '025-17363' ) ) AND medication.drugname = 'ondansetron hcl' AND datetime(medication.drugstarttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month')",
            "pred_sql": "SELECT COUNT(*) AS count FROM patient JOIN medication ON patient.patientunitstayid = medication.patientunitstayid WHERE patient.uniquepid = '025-17363' AND medication.drugname LIKE '%ondansetron hcl%' AND strftime('%Y-%m', medication.drugstarttime) = strftime('%Y-%m', datetime('2100-12-31 23:59:00', '-1 month'));",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s structure (JOIN vs nested IN) is fine and doesn\u2019t break the overall logic. The mistake lies in the WHERE clause\u2019s filtering of the prescription date: it uses strftime('%Y-%m', \u2026) against datetime('\u2026','-1 month') (which yields \u20182100-11-30 23:59:00\u2019, giving \u20182100-11\u2019) instead of matching the start\u2010of\u2010month as required by the spec. This localized date\u2010filtering error causes the predicate to fail and return 0 instead of 1. No other cross\u2010clause logic or joins need changing\u2014only the date condition does.",
            "error_type": "Local: date filter error"
        },
        "489c1ea5bdaeef4ed2659b45": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many hours have passed since patient 015-100025's first hemodialysis intake (ml) input on the current icu visit?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J',intakeoutput.intakeoutputtime) ) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '015-100025' ) AND patient.unitdischargetime IS NULL ) AND intakeoutput.celllabel = 'hemodialysis intake (ml)' AND intakeoutput.cellpath LIKE '%intake%' ORDER BY intakeoutput.intakeoutputtime ASC LIMIT 1",
            "pred_sql": "SELECT (strftime('%s', '2100-12-31 23:59:00') - strftime('%s', MIN(io.intakeoutputtime))) / 3600 AS hours_passed FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '015-100025' AND p.unitdischargetime IS NULL AND io.cellpath LIKE '%intake%' AND io.cellpath LIKE '%hemodialysis%';",
            "gold_answer": "[['2.8']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fails to restrict on the exact \u2018celllabel = \\'hemodialysis intake (ml)\\'\u2019 and instead uses io.cellpath LIKE '%hemodialysis%', so it pulls a different (earlier) intake time. This is a mistake confined to the WHERE clause filters and does not alter the overall query structure or joins.",
            "error_type": "Local: incorrect filter in WHERE clause"
        },
        "9e4e34508b9eabf0b0fc4fbe": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What is the cost of a sepsis - sepsis with single organ dysfunction- circulatory system failure diagnosis?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.eventtype = 'diagnosis' AND cost.eventid IN ( SELECT diagnosis.diagnosisid FROM diagnosis WHERE diagnosis.diagnosisname = 'sepsis - sepsis with single organ dysfunction- circulatory system failure' )",
            "pred_sql": "SELECT SUM(cost.cost) AS total_cost FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid JOIN cost ON patient.patienthealthsystemstayid = cost.patienthealthsystemstayid WHERE diagnosis.diagnosisname = 'sepsis - sepsis with single organ dysfunction- circulatory system failure' AND cost.eventtype = 'diagnosis' AND cost.eventid = diagnosis.diagnosisid;",
            "gold_answer": "[['6.76']]",
            "pred_answer": "[['87.88']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the intent of the query by joining through the patient table and summing all diagnosis event costs across multiple patients. The ground truth simply retrieves the single cost for the specified diagnosis event (using DISTINCT on cost.cost). The predicted version\u2019s use of SUM and additional joins changes the overall logic and structure\u2014it\u2019s not a localized syntax mistake but a global restructuring that aggregates across unintended rows.",
            "error_type": "Global: incorrect join/aggregation strategy"
        },
        "18553a06c553cf15ca7bf4a2": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Is the value of sao2 of patient 006-106843 last measured on the last icu visit less than the value second to last measured on the last icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.sao2 FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106843' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND vitalperiodic.sao2 IS NOT NULL ORDER BY vitalperiodic.observationtime DESC LIMIT 1 ) < ( SELECT vitalperiodic.sao2 FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '006-106843' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime DESC LIMIT 1 ) AND vitalperiodic.sao2 IS NOT NULL ORDER BY vitalperiodic.observationtime DESC LIMIT 1 OFFSET 1 )",
            "pred_sql": "WITH last_icu_stay AS ( SELECT patientunitstayid FROM patient WHERE uniquepid = '006-106843' ORDER BY unitdischargetime DESC LIMIT 1 ), ranked_vitals AS ( SELECT sao2, ROW_NUMBER() OVER (ORDER BY observationtime DESC) AS rn FROM vitalperiodic WHERE patientunitstayid = (SELECT patientunitstayid FROM last_icu_stay) ) SELECT (SELECT sao2 FROM ranked_vitals WHERE rn = 1) < (SELECT sao2 FROM ranked_vitals WHERE rn = 2) AS is_less;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to filter out NULL sao2 values before ranking, so its first row can be NULL and the comparison yields NULL (None) instead of a boolean. The mistake is a missing WHERE clause condition (vitalperiodic.sao2 IS NOT NULL) in the ranked_vitals CTE. This is a localized WHERE\u2010clause error that doesn\u2019t change the overall query structure or table relationships.",
            "error_type": "Local: missing non-null filter in WHERE clause"
        },
        "1bef54d89c07bec88a7d7fef": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many patients were diagnosed with upper urinary tract infection within the same hospital visit since 1 year ago after electrolyte administration - intravenous.",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'electrolyte administration - intravenous' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'upper urinary tract infection' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 WHERE T1.treatmenttime < T2.diagnosistime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM diagnosis d JOIN treatment t ON d.patientunitstayid = t.patientunitstayid JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE d.diagnosisname = 'upper urinary tract infection' AND t.treatmentname = 'electrolyte administration - intravenous' AND datetime(t.treatmenttime) <= datetime(d.diagnosistime, '-1 year');",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally misrepresents the question\u2019s logic in multiple clauses. It joins diagnosis and treatment on patientunitstayid rather than patienthealthsystemstayid, so it conflates ICU stays with hospital visits. It also applies the time filter incorrectly\u2014comparing treatment time to one year before each diagnosis instead of requiring both events to have occurred within the last year relative to today and ensuring treatment precedes diagnosis. These errors span joins and WHERE logic and cannot be fixed by tweaking a single clause.",
            "error_type": "Global: incorrect join and time logic"
        },
        "e634a2c2d4fe2d94757686eb": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What is the 3-month survival rate for cardiac arrest - witnessed, < 15 minutes cpr patients who were prescribed 20.3 ml cup : acetaminophen 160 mg/5ml po soln after the diagnosis?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'cardiac arrest - witnessed, < 15 minutes cpr' AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE medication.drugname = '20.3 ml cup : acetaminophen 160 mg/5ml po soln' GROUP BY patient.uniquepid HAVING MAX(medication.drugstarttime) = medication.drugstarttime ) AS T2 ON T1.uniquepid = T2.uniquepid JOIN patient ON T1.uniquepid = patient.uniquepid WHERE T1.diagnosistime < T2.drugstarttime GROUP BY patient.uniquepid HAVING MAX(patient.hospitaldischargetime) = patient.hospitaldischargetime )",
            "pred_sql": "WITH eligible_patients AS ( SELECT DISTINCT p.patientunitstayid, d.diagnosistime FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid JOIN treatment t ON p.patientunitstayid = t.patientunitstayid JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE d.diagnosisname = 'cardiac arrest - witnessed' AND t.treatmentname LIKE '%CPR%' AND t.treatmenttime >= d.diagnosistime AND t.treatmenttime <= datetime(d.diagnosistime, '+15 minutes') AND m.drugname = '20.3 ml cup : acetaminophen 160 mg/5ml po soln' AND m.drugstarttime > d.diagnosistime ) SELECT (COUNT(*) - SUM(CASE WHEN p.hospitaldischargestatus = 'expired' AND datetime(p.hospitaldischargetime) <= datetime(ep.diagnosistime, '+91.25 days') THEN 1 ELSE 0 END)) * 1.0 / COUNT(*) AS survival_rate FROM eligible_patients ep JOIN patient p ON ep.patientunitstayid = p.patientunitstayid;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally alters the logic by introducing a JOIN on the treatment table (filtering by CPR treatment time) rather than relying on the diagnosis name that already encodes \u201c< 15 minutes cpr.\u201d It also mismatches diagnosis names, misuses treatment conditions, and computes the time window differently. These changes affect the entire query structure and intended patient cohort selection, so the error is not a localized typo or syntax mistake but a global logical/join error.",
            "error_type": "Global: incorrect join/logic error"
        },
        "1244ff6a6a69b74074964f0a": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "When was patient 035-10028's nutrition total input the last time on this month/22?",
            "gold_sql": "SELECT intakeoutput.intakeoutputtime FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '035-10028' ) ) AND intakeoutput.cellpath LIKE '%intake%' AND intakeoutput.celllabel = 'nutrition total' AND datetime(intakeoutput.intakeoutputtime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') AND strftime('%d',intakeoutput.intakeoutputtime) = '22' ORDER BY intakeoutput.intakeoutputtime DESC LIMIT 1",
            "pred_sql": "SELECT i.intakeoutputtime FROM intakeoutput i JOIN patient p ON i.patientunitstayid = p.patientunitstayid WHERE p.uniquepid = '035-10028' AND i.cellpath LIKE '%intake%' AND datetime(i.intakeoutputtime, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') AND strftime('%d', i.intakeoutputtime) = '22' ORDER BY i.intakeoutputtime DESC LIMIT 1;",
            "gold_answer": "[['2100-12-22 18:00:00']]",
            "pred_answer": "[['2100-12-22 23:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in its WHERE clause: it omits the condition AND i.celllabel = 'nutrition total'. As a result, it picks up any intake event on the 22nd of the month rather than specifically the \u201cnutrition total\u201d input. This is a localized mistake in the WHERE clause filters and does not require restructuring the joins or overall query logic.",
            "error_type": "Local: missing-filter error"
        },
        "78e443fce3a9afcc620fcb1d": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What is patient 009-10046's difference in weight from the second value measured on the first hospital visit compared to the first value measured on the first hospital visit?",
            "gold_sql": "SELECT ( SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '009-10046' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) AND patient.admissionweight IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 OFFSET 1 ) - ( SELECT patient.admissionweight FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '009-10046' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) AND patient.admissionweight IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 )",
            "pred_sql": "SELECT (dischargeweight - admissionweight) AS weight_difference FROM patient WHERE uniquepid = '009-10046' AND hospitaladmittime = ( SELECT MIN(hospitaladmittime) FROM patient WHERE uniquepid = '009-10046' ) AND admissionweight IS NOT NULL AND dischargeweight IS NOT NULL;",
            "gold_answer": "[['-19.7']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic by using a single patient row\u2019s dischargeweight and admissionweight instead of comparing the first and second admissionweight measurements within the first hospital visit. It ignores the requirement to identify the first hospital visit\u2019s unit stays and select the two admissionweight values in chronological order. This is not a simple typo or missing alias\u2014it alters the entire approach to retrieving and comparing the correct records, so it is a global logical error.",
            "error_type": "Global: logical error"
        },
        "7c73804551fbdd9ef9889a18": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many people were given oxygen therapy (> 60%) - >90% two or more times in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, COUNT(*) AS C1 FROM patient WHERE patient.patientunitstayid = ( SELECT treatment.patientunitstayid FROM treatment WHERE treatment.treatmentname = 'oxygen therapy (> 60%) - >90%' AND strftime('%Y',treatment.treatmenttime) = '2100' ) GROUP BY patient.uniquepid ) AS T1 WHERE T1.C1 >= 2",
            "pred_sql": "SELECT COUNT(*) AS count FROM ( SELECT p.uniquepid FROM vitalperiodic v JOIN patient p ON v.patientunitstayid = p.patientunitstayid WHERE v.sao2 > 90 AND strftime('%Y', v.observationtime) = '2100' GROUP BY p.uniquepid HAVING COUNT(*) >= 2 ) AS subquery;",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['1327.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL entirely changes the logic by using the vitalperiodic table and checking soh2 > 90 instead of looking for the specific treatment 'oxygen therapy (> 60%) - >90%' in the treatment table. This is not a minor fix in a single clause but a fundamental change in which table and condition define the event, thus altering the intended meaning of the query. It requires restructuring the query\u2019s core logic, so this is a global error.",
            "error_type": "Global: incorrect table and logic"
        },
        "502d5227ec779976f20ab9a0": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Could you fetch the top five most common specimens tested in 2100 for me?",
            "gold_sql": "SELECT T1.culturesite FROM ( SELECT microlab.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM microlab WHERE strftime('%Y',microlab.culturetakentime) = '2100' GROUP BY microlab.culturesite ) AS T1 WHERE T1.C1 <= 5",
            "pred_sql": "SELECT labname FROM lab WHERE strftime('%Y', labresulttime) = '2100' GROUP BY labname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['blood, venipuncture'], ['nasopharynx'], ['sputum, tracheal specimen'], ['urine, catheter specimen'], ['urine, voided specimen']]",
            "pred_answer": "[['bedside glucose'], ['chloride'], ['glucose'], ['potassium'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the lab table and labname column, whereas the question and ground truth refer to specimen sites in the microlab table (culturesite). This is not a minor syntax or alias issue but a fundamental misuse of the wrong table and column, which changes the entire meaning of the query.",
            "error_type": "Global: wrong table used"
        },
        "bd60c97129317d3f97c71815": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Can you list the top five most frequent procedures that patients received within the same hospital visit after having systemic glucocorticoid in 2100?",
            "gold_sql": "SELECT T3.treatmentname FROM ( SELECT T2.treatmentname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'systemic glucocorticoid' AND strftime('%Y',treatment.treatmenttime) = '2100' ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmentname, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE strftime('%Y',treatment.treatmenttime) = '2100' ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.treatmentname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT t.treatmentname FROM medication m JOIN patient p1 ON m.patientunitstayid = p1.patientunitstayid JOIN patient p2 ON p1.patienthealthsystemstayid = p2.patienthealthsystemstayid JOIN treatment t ON t.patientunitstayid = p2.patientunitstayid WHERE m.drugname LIKE '%glucocorticoid%' AND strftime('%Y', m.drugstarttime) = '2100' AND t.treatmenttime > m.drugstarttime GROUP BY t.treatmentname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['anticonvulsant - gabapentin'], ['antihyperlipidemic agent - hmg-coa reductase inhibitor'], ['chemotherapy'], ['cultures - sputum'], ['intravenous diuretic - iv furosemide'], ['oxygen therapy (> 60%) - non-rebreather mask'], ['stress ulcer prophylaxis - pantoprazole'], ['systemic glucocorticoid'], ['therapeutic antibacterials - penicillins']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query filters on medication.drugname and joins medication to two patient aliases before finally pulling treatments. The original question asked about \u2018systemic glucocorticoid\u2019 in the treatment table. The predicted SQL\u2019s error is entirely in the FROM/JOIN clause (it uses the wrong table for the initial glucocorticoid event and incorrect patient joins), but the overall structure (grouping, ordering, limit) remains intact. This is a localized table reference/join mistake, not a broader logical restructuring error.",
            "error_type": "Local: incorrect-table/join error"
        },
        "818d2b11247df11000ce8ce0": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What are the top three most frequent specimens ordered for patients after being diagnosed with bacteremia within the same hospital visit this year?",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'bacteremia' AND datetime(diagnosis.diagnosistime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime, patient.patienthealthsystemstayid FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.culturetakentime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "WITH BacteremiaDiagnoses AS ( SELECT patientunitstayid, MIN(diagnosistime) AS first_diagnosistime FROM diagnosis WHERE diagnosisname = 'bacteremia' AND strftime('%Y', diagnosistime) = '2100' GROUP BY patientunitstayid ) SELECT ml.culturesite FROM microlab ml INNER JOIN BacteremiaDiagnoses bd ON ml.patientunitstayid = bd.patientunitstayid AND ml.culturetakentime > bd.first_diagnosistime GROUP BY ml.culturesite ORDER BY COUNT(*) DESC LIMIT 3;",
            "gold_answer": "[['blood, venipuncture'], ['csf'], ['sputum, expectorated']]",
            "pred_answer": "[['blood, venipuncture'], ['nasopharynx'], ['sputum, expectorated']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters diagnoses to this year but does not restrict microlab records to this year, nor does it enforce the \u2018same hospital visit\u2019 requirement via patient.patienthealthsystemstayid. Instead it joins on patientunitstayid, which ties to individual ICU/unit stays rather than the overall hospital encounter. This incorrect join key and missing filter change the core logic of the query, leading to different top specimens.",
            "error_type": "Global: incorrect join/key relationship"
        },
        "5e88f3adc2224af386b15188": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many patients underwent cardiology consultation within the same hospital visit after normal saline solution?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'normal saline solution' ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'cardiology consultation' ) AS T2 WHERE T1.treatmenttime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM treatment t JOIN patient p ON t.patientunitstayid = p.patientunitstayid WHERE t.treatmentname = 'normal saline administration' AND EXISTS ( SELECT 1 FROM diagnosis d JOIN patient p2 ON d.patientunitstayid = p2.patientunitstayid WHERE p2.patienthealthsystemstayid = p.patienthealthsystemstayid AND d.diagnosisname = 'cardiology consultation' AND d.diagnosistime > t.treatmenttime );",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the logic by querying the diagnosis table for 'cardiology consultation' instead of the treatment table and even uses the wrong treatment name 'normal saline administration'. This is not a localized typo or minor syntax issue but a structural error that alters which tables and relationships are used, thus requiring a significant rewrite of the query logic.",
            "error_type": "Global: incorrect table/join usage"
        },
        "79b2a1c645f45cee560dd09b": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What was the daily average input of p.o. for patient 002-1185 on the current hospital visit?",
            "gold_sql": "SELECT AVG(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '002-1185' AND patient.hospitaldischargetime IS NULL ) ) AND intakeoutput.celllabel = 'p.o.' AND intakeoutput.cellpath LIKE '%intake%' GROUP BY strftime('%Y-%m-%d',intakeoutput.intakeoutputtime)",
            "pred_sql": "SELECT SUM(io.cellvaluenumeric) / (julianday('2100-12-31 23:59:00') - julianday(p.unitadmittime)) AS daily_avg_p_o FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '002-1185' AND p.hospitaldischargetime IS NULL AND io.cellpath LIKE '%p.o.%';",
            "gold_answer": "[['260.0'], ['333.333']]",
            "pred_answer": "[['2331.114']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the intended logic. Instead of computing a per-day average by grouping intake values by date (as in the ground truth), it sums all p.o. inputs and divides by the time since admission, producing a single aggregate rather than daily averages. It also misuses cellpath for filtering \u2018p.o.\u2019 instead of using celllabel and omits the GROUP BY on the intake date. These errors require restructuring the aggregation and grouping logic across multiple clauses, not a localized fix.",
            "error_type": "Global: aggregation logic error"
        },
        "b11dccba6b0fa27a522c37c7": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What drug was patient 013-10215 prescribed with after the diagnosis of bone fracture(s) - left lower extremity within 2 days this month?",
            "gold_sql": "SELECT T2.drugname FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10215' ) AND diagnosis.diagnosisname = 'bone fracture(s) - left lower extremity' AND datetime(diagnosis.diagnosistime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '013-10215' ) AND datetime(medication.drugstarttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND datetime(T2.drugstarttime) BETWEEN datetime(T1.diagnosistime) AND datetime(T1.diagnosistime,'+2 day')",
            "pred_sql": "SELECT DISTINCT m.drugname FROM patient p JOIN diagnosis d ON p.patientunitstayid = d.patientunitstayid JOIN medication m ON p.patientunitstayid = m.patientunitstayid WHERE p.uniquepid = '013-10215' AND d.diagnosisname = 'bone fracture(s) - left lower extremity' AND strftime('%Y-%m', d.diagnosistime) = '2100-12' AND m.drugstarttime >= d.diagnosistime AND m.drugstarttime <= datetime(d.diagnosistime, '+2 days') AND strftime('%Y-%m', m.drugstarttime) = '2100-12' AND d.diagnosistime = ( SELECT MIN(diagnosistime) FROM diagnosis WHERE patientunitstayid = p.patientunitstayid AND diagnosisname = 'bone fracture(s) - left lower extremity' AND strftime('%Y-%m', diagnosistime) = '2100-12' );",
            "gold_answer": "[['bisacodyl'], ['bisacodyl'], ['bisacodyl'], ['bisacodyl'], ['cefazolin'], ['diphenhydramine'], ['diphenhydramine'], ['docusate sodium'], ['docusate sodium'], ['enoxaparin'], ['enoxaparin'], ['enoxaparin'], ['flumazenil'], ['hydrocodone-acetaminophen'], ['hydrocodone-acetaminophen'], ['hydrocodone-acetaminophen'], ['hydrocodone-acetaminophen'], ['hydrocodone-acetaminophen'], ['hydrocodone-acetaminophen'], ['hydromorphone'], ['hydromorphone'], ['hydromorphone'], ['ipratropium-albuterol'], ['naloxone'], ['naloxone'], ['naloxone'], ['ondansetron'], ['ondansetron'], ['ondansetron'], ['pantoprazole']]",
            "pred_answer": "[['bisacodyl'], ['bisacodyl'], ['cefazolin'], ['diphenhydramine'], ['docusate sodium'], ['enoxaparin'], ['hydrocodone-acetaminophen'], ['hydrocodone-acetaminophen'], ['naloxone'], ['ondansetron'], ['pantoprazole']]",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces a filter limiting the diagnosis time to the earliest (\u2018MIN(diagnosistime)\u2019) within the month, whereas the ground truth considers all diagnosis events in that month and all corresponding medications within two days of each. This change alters the overall logic\u2014omitting drugs tied to later diagnoses\u2014and is not a simple typo or localized syntax issue but a structural/logical difference across clauses.",
            "error_type": "Global: incorrect logical filter on diagnosis time"
        },
        "51480a6db604cb44753b4aa9": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "How many patients received a bronchodilator procedure within the same hospital visit after having a non-invasive ventilation procedure this year?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.uniquepid ) FROM ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'non-invasive ventilation' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT patient.uniquepid, treatment.treatmenttime, patient.patienthealthsystemstayid FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'bronchodilator' AND datetime(treatment.treatmenttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 WHERE T1.treatmenttime < T2.treatmenttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid",
            "pred_sql": "SELECT COUNT(DISTINCT p.uniquepid) FROM treatment t1 JOIN treatment t2 ON t1.patientunitstayid = t2.patientunitstayid AND t2.treatmenttime > t1.treatmenttime JOIN patient p ON t1.patientunitstayid = p.patientunitstayid WHERE t1.treatmentname LIKE '%non-invasive ventilation%' AND t2.treatmentname LIKE '%bronchodilator%' AND strftime('%Y', t1.treatmenttime) = '2100';",
            "gold_answer": "[['10.0']]",
            "pred_answer": "[['23.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to restrict the bronchodilator events to the current year and furthermore joins treatments on patientunitstayid rather than patienthealthsystemstayid (hospital visit). This changes the query\u2019s core logic for \u201csame hospital visit\u201d and miscounts patients. These are not simple typos but fundamental join and filtering mistakes that require restructuring the query, so it is a global error.",
            "error_type": "Global: incorrect join and filter logic"
        },
        "ead4af74ff9f344c2ee4482b": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "On the first hospital visit, what was patient 017-100472's last procedure time?",
            "gold_sql": "SELECT treatment.treatmenttime FROM treatment WHERE treatment.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '017-100472' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) ORDER BY treatment.treatmenttime DESC LIMIT 1",
            "pred_sql": "WITH first_admission AS ( SELECT patientunitstayid, hospitaladmittime, hospitaldischargetime FROM patient WHERE uniquepid = '017-100472' ORDER BY hospitaladmittime ASC LIMIT 1 ) SELECT MAX(event_time) AS last_procedure_time FROM ( SELECT treatmenttime AS event_time FROM treatment WHERE patientunitstayid = (SELECT patientunitstayid FROM first_admission) AND treatmenttime BETWEEN (SELECT hospitaladmittime FROM first_admission) AND (SELECT hospitaldischargetime FROM first_admission) UNION ALL SELECT labresulttime AS event_time FROM lab WHERE patientunitstayid = (SELECT patientunitstayid FROM first_admission) AND labresulttime BETWEEN (SELECT hospitaladmittime FROM first_admission) AND (SELECT hospitaldischargetime FROM first_admission) UNION ALL SELECT drugstarttime AS event_time FROM medication WHERE patientunitstayid = (SELECT patientunitstayid FROM first_admission) AND drugstarttime BETWEEN (SELECT hospitaladmittime FROM first_admission) AND (SELECT hospitaldischargetime FROM first_admission) UNION ALL SELECT drugstoptime AS event_time FROM medication WHERE patientunitstayid = (SELECT patientunitstayid FROM first_admission) AND drugstoptime BETWEEN (SELECT hospitaladmittime FROM first_admission) AND (SELECT hospitaldischargetime FROM first_admission) UNION ALL SELECT culturetakentime AS event_time FROM microlab WHERE patientunitstayid = (SELECT patientunitstayid FROM first_admission) AND culturetakentime BETWEEN (SELECT hospitaladmittime FROM first_admission) AND (SELECT hospitaldischargetime FROM first_admission) ) AS all_events;",
            "gold_answer": "[['2100-02-16 07:45:00']]",
            "pred_answer": "[['2100-02-20 17:47:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic in two major ways. First, its CTE for the first admission does not enforce that the visit be completed (hospitaldischargetime IS NOT NULL), so it may pick the wrong stay. Second, it reinterprets \u201cprocedure\u201d to include labs, medications, and microlabs by unioning multiple tables and taking the max timestamp, rather than returning the last treatment time alone. These changes span multiple clauses and restructure the query\u2019s intended meaning, making this a global error.",
            "error_type": "Global: incorrect query logic"
        },
        "acc3a9c211f42e9d6d154a20": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What are the top five diagnoses associated with the highest 3-month mortality rate?",
            "gold_sql": "SELECT T4.diagnosisname FROM ( SELECT T3.diagnosisname, DENSE_RANK() OVER ( ORDER BY T3.C2 ASC ) AS C2 FROM ( SELECT T2.diagnosisname, AVG(C1) AS C2 FROM ( SELECT T1.diagnosisname, ( CASE WHEN (patient.hospitaldischargestatus = 'expired') AND(strftime('%J',patient.hospitaldischargetime) - strftime('%J',T1.diagnosistime)) < 365 / 4 THEN 0 ELSE 1 END ) as C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosisname, diagnosis.diagnosistime FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnosis.diagnosistime) >= 365 / 4 GROUP BY patient.uniquepid, diagnosis.diagnosisname HAVING MIN(diagnosis.diagnosistime) = diagnosis.diagnosistime ) AS T1 JOIN patient ON T1.uniquepid = patient.uniquepid ) AS T2 GROUP BY T2.diagnosisname ) AS T3 ) AS T4 WHERE T4.C2 <= 5",
            "pred_sql": "SELECT d.diagnosisname FROM diagnosis d JOIN patient p ON d.patientunitstayid = p.patientunitstayid WHERE p.hospitaldischargestatus IS NOT NULL AND p.hospitaldischargetime IS NOT NULL GROUP BY d.diagnosisname ORDER BY SUM(CASE WHEN p.hospitaldischargestatus = 'expired' AND julianday(p.hospitaldischargetime) <= julianday(d.diagnosistime) + 91.25 THEN 1 ELSE 0 END) * 1.0 / COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['acute copd exacerbation - with baseline hypoxemia'], ['acute lung injury'], ['acute renal failure - due to sepsis'], ['acute renal failure - etiology unknown'], ['anuria'], ['ards - pulmonary etiology'], ['arterial thromboembolism'], ['arterial thromboembolism - kidney'], ['av block - pacemaker in place, pacing and capturing'], ['bacteremia - gram negative rod'], ['bacteremia - respiratory source'], ['biliary obstruction - cholelithiasis'], ['bone fracture(s) - right upper extremity'], ['cardiac arrest - initial rhythm: asystole'], ['cardiac arrest - initial rhythm: pulseless electrical activity'], ['cardiac arrest - initial rhythm: ventricular tachycardia'], ['cardiac arrest - un-witnessed'], ['cellulitis - abdomen/pelvis'], ['cerebral subdural hematoma - secondary to anticoagulation'], ['cholecystitis - acute'], ['congestive heart failure - left-sided'], ['dvt - left upper extremity'], ['dvt - right lower extremity'], ['dvt - right upper extremity'], ['encephalopathy - post-anoxic'], ['encephalopathy - toxic'], ['enteritis - colitis, presumed infectious'], ['facial bone fracture - maxillary fracture'], ['facial bone fracture - orbital fracture'], ['gastric ca'], ['gi obstruction / ileus'], ['hepatic encephalopathy'], ['hyperglycemia - corticosteroid related'], ['hypernatremia - severe (> 155 meq/dl)'], ['hypochloremia'], ['hypothermia'], ['hypovolemic shock - hemorrhagic'], ['intracranial injury'], ['liver ca'], ['melanoma - nodular'], ['mouth and jaw tumor - oral cavity squamous cell ca'], ['myopathy - malignant hyperthermia'], ['neck tumor'], ['necrotizing fasciitis - abdomen/pelvis'], ['peripheral vascular ischemia - atherosclerotic thrombo-occlusion'], ['peripheral vascular ischemia - postoperative'], ['pleural effusion - due to heart failure'], ['pneumothorax - spontaneous'], ['s/p aneurysm resection/repair abdominal aorta'], ['seizures - from etoh withdrawal'], ['seizures - from ischemia/infarction'], ['sepsis - sepsis with multi-organ dysfunction'], ['sepsis - sepsis with single organ dysfunction- circulatory system failure'], ['septic shock - cultures pending'], ['shock, etiology unclear'], ['thrombocytopenia - primary hematologic malignancy'], ['valve repair >= 7 days - aortic / mitral'], ['vascular insufficiency of intestine - due to extrinsic compression'], ['ventricular tachycardia - with hemodynamic compromise']]",
            "pred_answer": "[['thrombocytopenia - primary hematologic malignancy'], ['valve repair >= 7 days - aortic / mitral'], ['vascular insufficiency of intestine'], ['vascular insufficiency of intestine - due to extrinsic compression'], ['ventricular tachycardia - with hemodynamic compromise']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the logic for computing 3-month mortality. Instead of using each patient\u2019s first diagnosis and ensuring at least 3 months of follow-up, it simply aggregates over all diagnosis rows, fails to filter out diagnoses occurring within the last 3 months, and uses COUNT(*) of diagnosis records rather than distinct patients as the denominator. These mistakes span multiple clauses (WHERE, GROUP BY, ORDER BY) and change the intended meaning of the query. Fixing this would require restructuring the query to first select one diagnosis per patient and enforce the follow-up window, not merely tweaking a single clause.",
            "error_type": "Global: flawed mortality rate calculation"
        },
        "8698359fd57df45989fcd9a0": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What are the five most commonly prescribed drugs for patients diagnosed with chronic kidney disease previously within the same hospital visit, since 1 year ago?",
            "gold_sql": "SELECT T3.drugname FROM ( SELECT T2.drugname, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, diagnosis.diagnosistime, patient.patienthealthsystemstayid FROM diagnosis JOIN patient ON diagnosis.patientunitstayid = patient.patientunitstayid WHERE diagnosis.diagnosisname = 'chronic kidney disease' AND datetime(diagnosis.diagnosistime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, medication.drugname, medication.drugstarttime, patient.patienthealthsystemstayid FROM medication JOIN patient ON medication.patientunitstayid = patient.patientunitstayid WHERE datetime(medication.drugstarttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.diagnosistime < T2.drugstarttime AND T1.patienthealthsystemstayid = T2.patienthealthsystemstayid GROUP BY T2.drugname ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT drugname FROM ( SELECT m.drugname, COUNT(*) AS cnt FROM diagnosis d JOIN medication m ON d.patientunitstayid = m.patientunitstayid WHERE d.diagnosisname = 'chronic kidney disease' AND d.diagnosistime >= datetime('2100-12-31 23:59:00', '-1 year') AND m.drugstarttime > d.diagnosistime GROUP BY m.drugname ORDER BY cnt DESC LIMIT 5 );",
            "gold_answer": "[['carvedilol'], ['furosemide'], ['glycopyrrolate'], ['hydrocodone-acetaminophen'], ['lorazepam'], ['morphine']]",
            "pred_answer": "[['carvedilol'], ['furosemide'], ['glycopyrrolate'], ['hydrocodone-acetaminophen'], ['morphine']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only joins diagnosis and medication on patientunitstayid and does not ensure that the diagnosis and subsequent medication prescriptions occurred within the same hospital visit (patienthealthsystemstayid). The ground truth query explicitly joins through patient.patienthealthsystemstayid to enforce the same hospital admission and uses DENSE_RANK to pick the top five by frequency. The predicted query\u2019s missing join on patienthealthsystemstayid changes the overall logic and data associations, leading to incorrect drug counts and the wrong fifth drug. Fixing this requires restructuring the join logic to include hospital visit linkage, not just a local tweak.",
            "error_type": "Global: join-relationship error"
        },
        "8a1c32c5bac4ca824a13e857": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What is the percentile of 8.9 in the total bilirubin lab test with the same age as patient 002-10845 on the first hospital visit?",
            "gold_sql": "SELECT DISTINCT T1.C1 FROM ( SELECT lab.labresult, PERCENT_RANK() OVER ( ORDER BY lab.labresult ) AS C1 FROM lab WHERE lab.labname = 'total bilirubin' AND lab.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.age = ( SELECT patient.age FROM patient WHERE patient.uniquepid = '002-10845' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1 ) ) ) AS T1 WHERE T1.labresult = 8.9",
            "pred_sql": "WITH first_admission_age AS ( SELECT uniquepid, age FROM patient WHERE (uniquepid, hospitaladmittime) IN ( SELECT uniquepid, MIN(hospitaladmittime) FROM patient GROUP BY uniquepid ) ), target_age AS ( SELECT age FROM patient WHERE uniquepid = '002-10845' ORDER BY hospitaladmittime ASC LIMIT 1 ) SELECT (COUNT(CASE WHEN lab.labresult <= 8.9 THEN 1 END) * 100.0 / COUNT(*)) AS percentile FROM lab JOIN patient ON lab.patientunitstayid = patient.patientunitstayid JOIN first_admission_age ON patient.uniquepid = first_admission_age.uniquepid CROSS JOIN target_age WHERE first_admission_age.age = target_age.age AND lab.labname = 'total bilirubin';",
            "gold_answer": "[['0.973']]",
            "pred_answer": "[['97.368']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the intended percentile computation in several ways: it replaces the window\u2010function PERCENT_RANK() with a custom COUNT-based calculation, multiplies the result by 100 (producing 97.368 instead of the expected 0.973), and reshapes the query logic around aggregations rather than a straightforward window function. This error spans the overall query logic (how the percentile is computed and formatted), not just a minor syntactic or reference issue.",
            "error_type": "Global: incorrect percentile calculation"
        },
        "c939da95b18a427be1e09ceb": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What methods are used to ingest haloperidol lactate?",
            "gold_sql": "SELECT DISTINCT medication.routeadmin FROM medication WHERE medication.drugname = 'haloperidol lactate'",
            "pred_sql": "SELECT DISTINCT routeadmin FROM medication WHERE drugname LIKE '%haloperidol lactate%';",
            "gold_answer": "[['inj'], ['intramuscular'], ['intravenou'], ['intravenous'], ['iv'], ['zpyxvend']]",
            "pred_answer": "[['im'], ['inj'], ['intramuscular'], ['intravenou'], ['intravenous'], ['iv'], ['iv push'], ['zpyxvend']]",
            "is_correct": false,
            "reasoning": "The only difference between the ground truth and predicted SQL is in the WHERE clause: the ground truth uses an exact match (drugname = 'haloperidol lactate'), while the predicted SQL uses a LIKE pattern match. This change in condition leads to extra, unintended routes (e.g., 'im', 'iv push'). The error is confined to the WHERE clause and does not alter the overall structure or joins of the query, so it\u2019s a localized mistake.",
            "error_type": "Local: where-clause error"
        },
        "faf27b3469012cf43bdd7181": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "When did patient 002-10915 enter the hospital the first time via icu to sdu?",
            "gold_sql": "SELECT patient.hospitaladmittime FROM patient WHERE patient.uniquepid = '002-10915' AND patient.hospitaladmitsource = 'icu to sdu' AND patient.hospitaldischargetime IS NOT NULL ORDER BY patient.hospitaladmittime ASC LIMIT 1",
            "pred_sql": "SELECT p1.hospitaladmittime FROM patient p1 JOIN patient p2 ON p1.patienthealthsystemstayid = p2.patienthealthsystemstayid WHERE p1.uniquepid = '002-10915' AND p2.uniquepid = '002-10915' AND p1.wardid = 103 AND p2.wardid = 82 AND p1.unitadmittime < p2.unitadmittime ORDER BY p1.hospitaladmittime LIMIT 1;",
            "gold_answer": "[['2100-06-17 11:06:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally restructures the logic by using a self-join on the patient table with wardid filters instead of directly filtering hospitaladmitsource = 'icu to sdu' and checking discharge time. It omits the required hospitaladmitsource condition and introduces an incorrect join on patienthealthsystemstayid and wardid values, altering the intended query meaning. This is not a fixable typo in one clause but a flawed join strategy that changes the overall logic.",
            "error_type": "Global: flawed-join error"
        },
        "4bb4cea94cf2fb2ae68eee36": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "What are the three most commonly taken specimens that patients are tested within the same month after receiving a sedative agent - propofol procedure since 1 year ago?",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'sedative agent - propofol' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.culturetakentime AND datetime(T1.treatmenttime,'start of month') = datetime(T2.culturetakentime,'start of month') GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 3",
            "pred_sql": "SELECT lab.labname FROM medication JOIN lab ON medication.patientunitstayid = lab.patientunitstayid WHERE medication.drugname LIKE '%propofol%' AND medication.drugstarttime >= datetime('2100-12-31 23:59:00', '-1 year') AND datetime(lab.labresulttime, 'start of month') = datetime(medication.drugstarttime, 'start of month') AND lab.labresulttime >= medication.drugstarttime GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 3;",
            "gold_answer": "[['blood, venipuncture']]",
            "pred_answer": "[['bedside glucose'], ['glucose'], ['sodium']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the medication and lab tables instead of the treatment and microlab tables. It matches on medication.drugname LIKE '%propofol%' and lab.labresulttime rather than treatment.treatmentname = 'sedative agent - propofol' and microlab.culturetakentime, and it selects lab.labname instead of microlab.culturesite. This is not a minor syntax or column name mistake but a fundamental change in the query\u2019s logic and table relationships, requiring restructuring of the entire query to achieve the intended result.",
            "error_type": "Global: incorrect table join/structure"
        },
        "a5f9250cdf485bbb7612f00d": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Tell me the difference in the systolic blood pressure value for patient 027-100313 last measured on the first icu visit compared to the first value measured on the first icu visit?",
            "gold_sql": "SELECT ( SELECT vitalperiodic.systemicsystolic FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100313' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND vitalperiodic.systemicsystolic IS NOT NULL ORDER BY vitalperiodic.observationtime DESC LIMIT 1 ) - ( SELECT vitalperiodic.systemicsystolic FROM vitalperiodic WHERE vitalperiodic.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '027-100313' ) AND patient.unitdischargetime IS NOT NULL ORDER BY patient.unitadmittime ASC LIMIT 1 ) AND vitalperiodic.systemicsystolic IS NOT NULL ORDER BY vitalperiodic.observationtime ASC LIMIT 1 )",
            "pred_sql": "SELECT (SELECT systemicsystolic FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '027-100313' ORDER BY unitadmittime ASC LIMIT 1 ) ORDER BY observationtime DESC LIMIT 1) - (SELECT systemicsystolic FROM vitalperiodic WHERE patientunitstayid = ( SELECT patientunitstayid FROM patient WHERE uniquepid = '027-100313' ORDER BY unitadmittime ASC LIMIT 1 ) ORDER BY observationtime ASC LIMIT 1) AS difference;",
            "gold_answer": "[['28.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to identify the same first ICU visit that the ground truth uses. It directly picks the first patientunitstayid by uniquepid without filtering for a completed ICU stay (unitdischargetime IS NOT NULL) or joining on patienthealthsystemstayid, leading to the wrong ICU visit (and thus no valid systolic values). This mis-selection is not a minor typo or missing alias but a fundamental logic flaw that spans the subquery structure and the overall meaning of the query.",
            "error_type": "Global: incorrect visit selection"
        },
        "926c6da813c51e098482d768": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Calculate the total volume of urine catheter for patient 022-1011 on the current icu visit.",
            "gold_sql": "SELECT SUM(intakeoutput.cellvaluenumeric) FROM intakeoutput WHERE intakeoutput.patientunitstayid IN ( SELECT patient.patientunitstayid FROM patient WHERE patient.patienthealthsystemstayid IN ( SELECT patient.patienthealthsystemstayid FROM patient WHERE patient.uniquepid = '022-1011' ) AND patient.unitdischargetime IS NULL ) AND intakeoutput.celllabel = 'urine catheter' AND intakeoutput.cellpath LIKE '%output%'",
            "pred_sql": "SELECT SUM(io.cellvaluenumeric) AS total_volume FROM patient p JOIN intakeoutput io ON p.patientunitstayid = io.patientunitstayid WHERE p.uniquepid = '022-1011' AND p.hospitaldischargetime IS NULL AND io.celllabel = 'urine' AND io.cellpath LIKE '%output%';",
            "gold_answer": "[['113237.0']]",
            "pred_answer": "[['100.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL mistakenly filters on p.hospitaldischargetime IS NULL instead of p.unitdischargetime IS NULL (to identify the current ICU visit) and uses io.celllabel = 'urine' instead of the correct 'urine catheter'. These are errors confined to the WHERE clause (wrong column and wrong literal value) and do not alter the overall join structure or query logic.",
            "error_type": "Local: column reference and literal value error"
        },
        "eb89b2270e848e175f5257f9": {
            "db_id": "eicu",
            "generator_name": "qwen3",
            "question": "Since 1 year ago, what are the top five most frequently tested specimens for patients within 2 months after receiving neurology consultation?",
            "gold_sql": "SELECT T3.culturesite FROM ( SELECT T2.culturesite, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT patient.uniquepid, treatment.treatmenttime FROM treatment JOIN patient ON treatment.patientunitstayid = patient.patientunitstayid WHERE treatment.treatmentname = 'neurology consultation' AND datetime(treatment.treatmenttime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T1 JOIN ( SELECT patient.uniquepid, microlab.culturesite, microlab.culturetakentime FROM microlab JOIN patient ON microlab.patientunitstayid = patient.patientunitstayid WHERE datetime(microlab.culturetakentime) >= datetime('2100-12-31 23:59:00','-1 year') ) AS T2 ON T1.uniquepid = T2.uniquepid WHERE T1.treatmenttime < T2.culturetakentime AND datetime(T2.culturetakentime) BETWEEN datetime(T1.treatmenttime) AND datetime(T1.treatmenttime,'+2 month') GROUP BY T2.culturesite ) AS T3 WHERE T3.C1 <= 5",
            "pred_sql": "SELECT lab.labname FROM diagnosis JOIN lab ON diagnosis.patientunitstayid = lab.patientunitstayid WHERE diagnosis.diagnosistime >= datetime('2100-12-31 23:59:00', '-1 year') AND diagnosis.diagnosistime <= datetime('2100-12-31 23:59:00') AND diagnosis.diagnosisname LIKE '%neurology%' AND lab.labresulttime >= diagnosis.diagnosistime AND lab.labresulttime <= datetime(diagnosis.diagnosistime, '+2 months') AND lab.labresulttime <= datetime('2100-12-31 23:59:00') GROUP BY lab.labname ORDER BY COUNT(*) DESC LIMIT 5;",
            "gold_answer": "[['blood, venipuncture'], ['nasopharynx'], ['sputum, expectorated']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely misinterprets the question by using the diagnosis and lab tables rather than the treatment and microlab tables. It treats \u201cneurology consultation\u201d as a diagnosis name and retrieves lab.labname instead of microlab.culturesite. This isn\u2019t a simple typo or local clause mistake but a fundamental change to the query\u2019s structure and intended logic, requiring rewriting multiple joins and clauses to correct it.",
            "error_type": "Global: incorrect table usage"
        }
    }
}