{
    "codes": {
        "b1bf14bf9333394d698cdcb5": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "When was the last sodium test that patient 10037928 received since 11/2100?",
            "gold_sql": "SELECT labevents.charttime FROM labevents WHERE labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'sodium' ) AND labevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10037928 ) AND strftime('%Y-%m',labevents.charttime) >= '2100-11' ORDER BY labevents.charttime DESC LIMIT 1",
            "pred_sql": "SELECT charttime FROM chartevents WHERE itemid IN (225464, 220739) AND subject_id = 10037928 AND strftime('%Y %m', charttime) = '2100 11' ORDER BY charttime DESC LIMIT 1",
            "gold_answer": "[['2100-11-12 23:49:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query pulls from chartevents instead of labevents (the sodium test is a lab event), and it misuses strftime formatting and comparison. The core mistake is using the wrong table reference, a localized error that can be fixed by correcting the table name (and minor formatting), without altering the overall query structure.",
            "error_type": "Local: table reference error"
        },
        "5e11ebb43f301cecc472e7c7": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "When did patient 10036156's last visit to the hospital occur?",
            "gold_sql": "SELECT admissions.admittime FROM admissions WHERE admissions.subject_id = 10036156 AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime DESC LIMIT 1",
            "pred_sql": "SELECT admissions.dischtime FROM admissions INNER JOIN icustays ON admissions.hadm_id = icustays.hadm_id WHERE admissions.subject_id = 10036156 ORDER BY admissions.dischtime DESC LIMIT 1",
            "gold_answer": "[['2100-07-15 04:52:00']]",
            "pred_answer": "[['2100-07-17 15:08:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL not only selects the wrong column (discharge time instead of admission time) but also introduces an unnecessary INNER JOIN to icustays, thereby changing the scope of the query to ICU stays rather than all hospital visits. This is a structural change affecting overall query logic and the relationships between tables, rather than a simple local typo or syntax issue.",
            "error_type": "Global: incorrect join and column selection"
        },
        "6ee50f63ab0ecd43a03d1c47": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What was the daily average input of nitroglycerin for patient 10019172 last month?",
            "gold_sql": "SELECT AVG(inputevents.totalamount) FROM inputevents WHERE inputevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10019172 ) ) AND inputevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'nitroglycerin' AND d_items.linksto = 'inputevents' ) AND datetime(inputevents.starttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') GROUP BY strftime('%Y-%m-%d',inputevents.starttime)",
            "pred_sql": "SELECT sum(inputevents.amount) FROM patients INNER JOIN inputevents ON patients.subject_id = inputevents.subject_id WHERE patients.subject_id = 10019172 AND inputevents.amount > 0 AND strftime('%Y-%m', inputevents.starttime) = '2015-03' AND inputevents.itemid = 62248",
            "gold_answer": "[['250.0'], ['250.0']]",
            "pred_answer": "no such column: inputevents.amount",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to a column reference error: it uses inputevents.amount, which does not exist in the schema (the correct column is totalamount). This is a localized mistake within the SELECT clause and does not impact the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "8d4345c0ed9926353a1fe59a": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "How many patients had introduction of nutritional substance into central vein, percutaneous approach done in 2100?",
            "gold_sql": "SELECT COUNT( DISTINCT admissions.subject_id ) FROM admissions WHERE admissions.hadm_id IN ( SELECT procedures_icd.hadm_id FROM procedures_icd WHERE procedures_icd.icd_code = ( SELECT d_icd_procedures.icd_code FROM d_icd_procedures WHERE d_icd_procedures.long_title = 'introduction of nutritional substance into central vein, percutaneous approach' ) AND strftime('%Y',procedures_icd.charttime) = '2100' )",
            "pred_sql": "SELECT count(DISTINCT subject_id) FROM procedures_icd WHERE icd_code LIKE '456.3%' AND charttime LIKE '2100%'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only queries the procedures_icd table with a LIKE filter on icd_code and a prefix match on charttime, rather than joining to d_icd_procedures to map the long_title to the exact code and using strftime to extract the year. These mistakes are confined to the WHERE clause (incorrect filter conditions) and do not require restructuring joins or the overall query logic.",
            "error_type": "Local: incorrect WHERE clause"
        },
        "c3eb5302bcf43b5a5d43efcf": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What was the last dose of glucagon since 05/2100, prescribed to patient 10020306?",
            "gold_sql": "SELECT prescriptions.dose_val_rx FROM prescriptions WHERE prescriptions.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10020306 ) AND prescriptions.drug = 'glucagon' AND strftime('%Y-%m',prescriptions.starttime) >= '2100-05' ORDER BY prescriptions.starttime DESC LIMIT 1",
            "pred_sql": "SELECT dose_val_rx FROM prescriptions WHERE subject_id = 10020306 AND starttime > '2100-05-21 00:00:00' ORDER BY starttime DESC LIMIT 1",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['75.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the drug filter (prescriptions.drug = 'glucagon') and misinterprets the \u201csince 05/2100\u201d condition by using a fixed date of '2100-05-21 00:00:00' instead of filtering by month. These mistakes are confined to the WHERE clause and do not require changing the overall query structure or JOIN logic.",
            "error_type": "Local: where-clause error"
        },
        "2fe27400810c706671948c64": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What was the microbiology test given to patient 10004720 for the last time since 12/2100?",
            "gold_sql": "SELECT microbiologyevents.test_name FROM microbiologyevents WHERE microbiologyevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10004720 ) AND strftime('%Y-%m',microbiologyevents.charttime) >= '2100-12' ORDER BY microbiologyevents.charttime DESC LIMIT 1",
            "pred_sql": "SELECT test_name FROM microbiologyevents WHERE strftime('%Y %m', charttime) < '2100 12' AND subject_id = 10004720 ORDER BY charttime DESC LIMIT 1",
            "gold_answer": "[['gram stain']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s mistake lies entirely in the WHERE clause\u2019s date filtering: it uses strftime('%Y %m') with a space instead of '%Y-%m', applies the wrong comparison operator (< instead of >=), and compares against an incorrectly formatted literal ('2100 12' rather than '2100-12'). The rest of the query structure (SELECT, ORDER BY, LIMIT) remains intact, so this is a localized temporal\u2010filter error that does not require restructuring the overall query logic.",
            "error_type": "Local: other-temporal error"
        },
        "c58a5ec41c71bc32e692d0b7": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What would be the monthly average weight of patient 10012552 in 2100?",
            "gold_sql": "SELECT AVG(chartevents.valuenum) FROM chartevents WHERE chartevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10012552 ) ) AND chartevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'daily weight' AND d_items.linksto = 'chartevents' ) AND strftime('%Y',chartevents.charttime) = '2100' GROUP BY strftime('%Y-%m',chartevents.charttime)",
            "pred_sql": "SELECT avg(patients.weight) FROM patients INNER JOIN admissions ON patients.subject_id = admissions.subject_id WHERE patients.subject_id = 10012552 AND admissions.admittime LIKE '2100%'",
            "gold_answer": "[['83.2']]",
            "pred_answer": "no such column: patients.weight",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column patients.weight, causing a column reference error. This is a localized mistake that does not affect the overall query structure or logic\u2014only the column name is wrong.",
            "error_type": "Local: table/column reference error"
        },
        "75072ceb723a2148aae97311": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "How much does quinidine gluconate e.r. cost?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.event_type = 'prescriptions' AND cost.event_id IN ( SELECT prescriptions.row_id FROM prescriptions WHERE prescriptions.drug = 'quinidine gluconate e.r.' )",
            "pred_sql": "SELECT cost.cost FROM prescriptions INNER JOIN cost ON prescriptions.row_id = cost.event_id WHERE prescriptions.drug = 'quinidine gluconate e.r.'",
            "gold_answer": "[['11.42']]",
            "pred_answer": "[['11.42'], ['8.95']]",
            "is_correct": false,
            "reasoning": "The predicted SQL joins prescriptions and cost correctly but omits the filter cost.event_type = 'prescriptions' and also fails to use DISTINCT, causing extra rows to appear. This is a localized mistake in the WHERE clause rather than a structural or multi-clause logical issue.",
            "error_type": "Local: missing event_type filter"
        },
        "baeb70e8d9a9783d1d063250": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "When was the first time that patient 10021312 had the minimum value of heart rate?",
            "gold_sql": "SELECT chartevents.charttime FROM chartevents WHERE chartevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10021312 ) ) AND chartevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'heart rate' AND d_items.linksto = 'chartevents' ) ORDER BY chartevents.valuenum ASC, chartevents.charttime ASC LIMIT 1",
            "pred_sql": "SELECT min(charttime) FROM chartevents WHERE subject_id = 10021312 AND itemid IN (112, 402, 111, 128)",
            "gold_answer": "[['2100-09-17 22:11:00']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic: it simply takes the earliest charttime for a loosely defined set of itemids and ignores the need to filter by ICU stays, admissions, or to identify the record with the minimum heart rate value. It also misuses MIN on charttime instead of ordering by valuenum then charttime, and it does not reference d_items to select the correct heart rate item. This is a structural/logical flaw spanning multiple clauses, not a localized syntax or reference error.",
            "error_type": "Global: incorrect logic"
        },
        "598a0007438cebbb5e0202c7": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "Do you know the minimum transitional epithelial cells value of patient 10018081 this month?",
            "gold_sql": "SELECT MIN(labevents.valuenum) FROM labevents WHERE labevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10018081 ) AND labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'transitional epithelial cells' ) AND datetime(labevents.charttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month')",
            "pred_sql": "SELECT DISTINCT CASE WHEN label = 'transitional epithelial cells' THEN valuenum ELSE NULL END FROM chartevents WHERE strftime('%Y-%m', charttime) = '2100-11' AND subject_id = 10018081",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: label",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the wrong table (chartevents instead of labevents) and references a non-existent column (label) without joining the mapping table (d_labitems). These are isolated table/column reference errors that can be fixed by correcting the FROM clause and column references without restructuring the overall query logic.",
            "error_type": "Local: table/column reference error"
        }
    },
    "dinsql": {
        "f9cf8541bcbfc43ebc43f833": {
            "db_id": "mimic_iv",
            "generator_name": "dinsql",
            "question": "How much is the average total cost of a hospital that involves a drug named 0.9% sodium chloride (mini bag plus) since 2100?",
            "gold_sql": "SELECT AVG(T1.C1) FROM ( SELECT SUM(cost.cost) AS C1 FROM cost WHERE cost.hadm_id IN ( SELECT prescriptions.hadm_id FROM prescriptions WHERE prescriptions.drug = '0.9% sodium chloride (mini bag plus)' ) AND strftime('%Y',cost.chargetime) >= '2100' GROUP BY cost.hadm_id ) AS T1",
            "pred_sql": "SELECT AVG(total_cost) FROM ( SELECT SUM(DISTINCT c.cost) AS total_cost FROM prescriptions AS p INNER JOIN cost AS c ON p.hadm_id = c.hadm_id AND c.event_id = p.row_id AND c.event_type = 'prescriptions' WHERE p.drug = '0.9% sodium chloride (mini bag plus)' AND datetime(p.starttime) >= datetime('2100-01-01 00:00:00') GROUP BY p.hadm_id ) AS subquery",
            "gold_answer": "[['4369.491']]",
            "pred_answer": "[['9.87']]",
            "is_correct": false,
            "reasoning": "The predicted SQL restricts costs to only prescription events by joining cost on event_type = 'prescriptions' and event_id = p.row_id, and it filters by p.starttime rather than cost.chargetime. This fundamentally changes the query\u2019s logic: instead of summing all costs for the relevant admissions since 2100, it only sums prescription costs and uses the wrong time filter. Fixing this would require restructuring the join, WHERE clauses, and aggregation, not just a small local correction.",
            "error_type": "Global: incorrect join and filtering logic"
        },
        "a029b2e1430d15462ca84d28": {
            "db_id": "mimic_iv",
            "generator_name": "dinsql",
            "question": "What is the minimum monthly number of patient records marked with atrioventricular block, complete?",
            "gold_sql": "SELECT MIN(T1.C1) FROM ( SELECT COUNT( DISTINCT diagnoses_icd.hadm_id ) AS C1 FROM diagnoses_icd WHERE diagnoses_icd.icd_code = ( SELECT d_icd_diagnoses.icd_code FROM d_icd_diagnoses WHERE d_icd_diagnoses.long_title = 'atrioventricular block, complete' ) GROUP BY strftime('%Y-%m',diagnoses_icd.charttime) ) AS T1",
            "pred_sql": "SELECT MIN(monthly_count) FROM ( SELECT strftime('%Y-%m', charttime) AS month, COUNT(DISTINCT subject_id) AS monthly_count FROM diagnoses_icd WHERE icd_code = '4260' -- Assuming '4260' is the code for atrioventricular block, complete GROUP BY month )",
            "gold_answer": "[['1.0']]",
            "pred_answer": "incomplete input",
            "is_correct": false,
            "reasoning": "The predicted SQL incorrectly counts distinct subject_id instead of distinct hadm_id and uses a hard\u2010coded icd_code rather than retrieving it via the d_icd_diagnoses lookup. These are errors confined to a specific clause (the SELECT/count expression and WHERE filter) and do not require restructuring the overall query. Hence, this is a local error.",
            "error_type": "Local: column reference error"
        },
        "d351c1981c8f0350905da618": {
            "db_id": "mimic_iv",
            "generator_name": "dinsql",
            "question": "When was the last time this month that patient 10004733 was prescribed with vancomycin and iso-osmotic dextrose at the same time?",
            "gold_sql": "SELECT T1.starttime FROM ( SELECT prescriptions.subject_id, prescriptions.starttime FROM prescriptions WHERE prescriptions.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10004733 ) AND prescriptions.drug = 'vancomycin' AND datetime(prescriptions.starttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ) AS T1 JOIN ( SELECT prescriptions.subject_id, prescriptions.starttime FROM prescriptions WHERE prescriptions.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10004733 ) AND prescriptions.drug = 'iso-osmotic dextrose' AND datetime(prescriptions.starttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-0 month') ) AS T2 ON T1.subject_id = T2.subject_id WHERE datetime(T1.starttime) = datetime(T2.starttime) ORDER BY T1.starttime DESC LIMIT 1",
            "pred_sql": "SELECT MAX(datetime(starttime)) FROM prescriptions WHERE subject_id = 10004733 AND drug IN ('vancomycin', 'iso-osmotic dextrose') AND datetime(starttime, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-0 month') GROUP BY datetime(starttime) HAVING COUNT(DISTINCT drug) = 2",
            "gold_answer": "[['2100-12-26 09:00:00']]",
            "pred_answer": "[['2100-12-22 15:00:00'], ['2100-12-22 20:00:00'], ['2100-12-24 11:00:00'], ['2100-12-26 08:00:00'], ['2100-12-26 09:00:00']]",
            "is_correct": false,
            "reasoning": "The predicted query groups by each prescription start time and applies MAX() within that group, which simply returns each matching timestamp rather than the single latest timestamp overall. This is an error in the aggregation and GROUP BY logic within the SELECT clause and does not involve changing table relationships or the overall query structure. It can be corrected by removing the GROUP BY or wrapping the grouped results to take a global MAX. Hence it is a localized aggregation/grouping error.",
            "error_type": "Local: grouping error"
        },
        "d0de56f72573390c2bf52877": {
            "db_id": "mimic_iv",
            "generator_name": "dinsql",
            "question": "What was the drug that was prescribed to patient 10019777 within the same day after the angioplasty of other non-coronary vessel(s) on the first hospital visit?",
            "gold_sql": "SELECT T2.drug FROM ( SELECT procedures_icd.subject_id, procedures_icd.charttime FROM procedures_icd WHERE procedures_icd.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10019777 AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime ASC LIMIT 1 ) AND procedures_icd.icd_code = ( SELECT d_icd_procedures.icd_code FROM d_icd_procedures WHERE d_icd_procedures.long_title = 'angioplasty of other non-coronary vessel(s)' ) ) AS T1 JOIN ( SELECT prescriptions.subject_id, prescriptions.drug, prescriptions.starttime FROM prescriptions WHERE prescriptions.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10019777 AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime ASC LIMIT 1 ) ) AS T2 ON T1.subject_id = T2.subject_id WHERE T1.charttime < T2.starttime AND datetime(T1.charttime,'start of day') = datetime(T2.starttime,'start of day')",
            "pred_sql": "SELECT DISTINCT P.drug FROM procedures_icd AS PI JOIN prescriptions AS P ON PI.subject_id = P.subject_id AND PI.hadm_id = P.hadm_id WHERE PI.subject_id = 10019777 AND PI.icd_code = 'icd9|3961' -- Assuming 'icd9|3961' is the code for angioplasty of other non-coronary vessel(s) AND datetime(P.starttime, 'start of day') = datetime(PI.charttime, 'start of day') AND PI.hadm_id = ( SELECT hadm_id FROM admissions WHERE subject_id = 10019777 ORDER BY admittime ASC LIMIT 1 )",
            "gold_answer": "[['0.9% sodium chloride'], ['0.9% sodium chloride (mini bag plus)'], ['0.9% sodium chloride (mini bag plus)'], ['5% dextrose'], ['alteplase (catheter clearance)'], ['iso-osmotic dextrose'], ['iso-osmotic dextrose'], ['iso-osmotic dextrose'], ['lactated ringers'], ['metronidazole (flagyl)'], ['ns'], ['octreotide acetate'], ['sodium chloride 0.9%'], ['sodium chloride 0.9%'], ['vancomycin'], ['vancomycin']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": [
                "The predicted query fails to restrict to the first completed hospital visit: it omits `admissions.dischtime IS NOT NULL` when picking the first hadm_id, altering the intended admission context.",
                "It also omits the requirement that the prescription start time follow the procedure charttime (`T1.charttime < T2.starttime`), only enforcing same-day equality.",
                "These omissions are not mere typos or minor syntax mistakes but undermine the core logic of selecting the correct visit and ensuring the drug was prescribed after the procedure.",
                "Fixing this requires adding filters in multiple clauses (the admission subquery and the WHERE clause), indicating a broader structural/logical flaw."
            ],
            "error_type": "Global: incorrect admission selection and time\u2010ordering logic"
        }
    },
    "llm2sql": {
        "7351edf011015936356fbbda": {
            "db_id": "mimic_iv",
            "generator_name": "llm2sql",
            "question": "How many days is it since patient 10039831 last stayed in the careunit surgical intensive care unit (sicu) on the current hospital visit?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J', transfers.intime) ) FROM transfers WHERE transfers.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10039831 AND admissions.dischtime IS NULL ) AND transfers.careunit = 'surgical intensive care unit (sicu)' ORDER BY transfers.intime DESC LIMIT 1",
            "pred_sql": "SELECT ROUND((JULIANDAY('2100-12-31 23:59:00') - JULIANDAY(T1.outtime))) AS days_since_last_sicu_stay FROM transfers T1 JOIN admissions T2 ON T1.hadm_id = T2.hadm_id WHERE T1.subject_id = 10039831 AND T1.careunit = 'sicu' AND T2.dischtime IS NULL ORDER BY T1.outtime DESC LIMIT 1;",
            "gold_answer": "[['0.182']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL misuses the careunit literal ('sicu' instead of 'surgical intensive care unit (sicu)') and references the wrong timestamp column (outtime instead of intime). These are errors confined to specific parts of the query (WHERE clause and SELECT expression) and do not alter the overall structure or logic of joining the current admission and transfers tables.",
            "error_type": "Local: column reference/value error"
        },
        "44c1c9cab30e5eb3386c026e": {
            "db_id": "mimic_iv",
            "generator_name": "llm2sql",
            "question": "What is the 3-month survival rate of patients who received pancrelipase 5000 treatment following a other alteration of consciousness diagnosis?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN strftime('%J',patients.dod) - strftime('%J',T3.charttime) < 365 / 4 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT T1.subject_id, T1.charttime FROM ( SELECT admissions.subject_id, diagnoses_icd.charttime FROM diagnoses_icd JOIN admissions ON diagnoses_icd.hadm_id = admissions.hadm_id WHERE diagnoses_icd.icd_code = ( SELECT d_icd_diagnoses.icd_code FROM d_icd_diagnoses WHERE d_icd_diagnoses.long_title = 'other alteration of consciousness' ) AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnoses_icd.charttime) >= 365 / 4 GROUP BY admissions.subject_id HAVING MIN(diagnoses_icd.charttime) = diagnoses_icd.charttime ) AS T1 JOIN ( SELECT admissions.subject_id, prescriptions.starttime FROM prescriptions JOIN admissions ON prescriptions.hadm_id = admissions.hadm_id WHERE prescriptions.drug = 'pancrelipase 5000' GROUP BY admissions.subject_id HAVING MAX(prescriptions.starttime) = prescriptions.starttime ) AS T2 ON T1.subject_id = T2.subject_id WHERE T1.charttime < T2.starttime ) AS T3 JOIN patients ON T3.subject_id = patients.subject_id )",
            "pred_sql": "WITH diagnosis_cte AS ( SELECT di.subject_id, di.hadm_id, MIN(di.charttime) AS diagnosis_date FROM diagnoses_icd di JOIN d_icd_diagnoses dd ON di.icd_code = dd.icd_code WHERE dd.long_title LIKE '%other alteration of consciousness%' GROUP BY di.subject_id, di.hadm_id ), pancrelipase_cte AS ( SELECT DISTINCT p.subject_id, p.hadm_id FROM prescriptions p WHERE p.drug = 'pancrelipase 5000' ), qualified_patients AS ( SELECT d.subject_id, d.hadm_id, d.diagnosis_date FROM diagnosis_cte d JOIN pancrelipase_cte p ON d.subject_id = p.subject_id AND d.hadm_id = p.hadm_id WHERE p.starttime > d.diagnosis_date ), death_check AS ( SELECT qp.subject_id, qp.diagnosis_date FROM qualified_patients qp LEFT JOIN patients pt ON qp.subject_id = pt.subject_id WHERE pt.dod IS NULL OR pt.dod > datetime(qp.diagnosis_date, '+3 months') ) SELECT CAST(COUNT(dc.subject_id) AS FLOAT) / COUNT(qp.subject_id) AS survival_rate FROM qualified_patients qp LEFT JOIN death_check dc ON qp.subject_id = dc.subject_id;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "no such column: p.starttime",
            "is_correct": false,
            "reasoning": "The error arises because the CTE \"pancrelipase_cte\" selects only subject_id and hadm_id, but later the query references p.starttime, which was not selected. This is a column reference error localized to the SELECT clause of the CTE and can be fixed by including starttime in the CTE. No overall query structure or logic needs to be changed beyond this clause.",
            "error_type": "Local: table/column reference error"
        },
        "0999752695013d993950a661": {
            "db_id": "mimic_iv",
            "generator_name": "llm2sql",
            "question": "Calculate the total volume of or urine for patient 10039831 today.",
            "gold_sql": "SELECT SUM(outputevents.value) FROM outputevents WHERE outputevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10039831 ) ) AND outputevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'or urine' AND d_items.linksto = 'outputevents' ) AND datetime(outputevents.charttime,'start of day') = datetime('2100-12-31 23:59:00','start of day','-0 day')",
            "pred_sql": "SELECT SUM(value) AS total_urine_volume FROM outputevents WHERE subject_id = 10039831 AND datetime(charttime, 'start of day') = datetime('2100-12-31 23:59:00', 'start of day')",
            "gold_answer": "[['880.0']]",
            "pred_answer": "[['2360.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to filter by the specific output type (\u201cor urine\u201d) and does not restrict to the patient\u2019s ICU stays, but instead uses only subject_id and date. This is a mistake in the WHERE clause\u2014a missing condition\u2014rather than a fundamental restructuring of joins or subqueries. Hence, it is a localized error in filtering.",
            "error_type": "Local: missing-filter error"
        }
    },
    "macsql": {
        "18168ef8762ec6a8dec80897": {
            "db_id": "mimic_iv",
            "generator_name": "macsql",
            "question": "What number of patients stayed in medical intensive care unit (micu) since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT admissions.subject_id ) FROM admissions WHERE admissions.hadm_id IN ( SELECT transfers.hadm_id FROM transfers WHERE transfers.careunit = 'medical intensive care unit (micu)' AND datetime(transfers.intime) >= datetime('2100-12-31 23:59:00','-1 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT `subject_id`) AS num_patients FROM icustays WHERE `first_careunit` = 'medical intensive care unit (micu)' AND datetime(`intime`) >= datetime('2100-12-31 23:59:00', '-1 year')",
            "gold_answer": "[['20.0']]",
            "pred_answer": "[['18.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic of the question by using the icustays table and its first_careunit field instead of the transfers table to identify all MICU stays. The ground truth correctly captures any transfer into the MICU within the past year, whereas the prediction only counts stays where the patient\u2019s first ICU unit was MICU and occurred in the last year. This is not a simple column name or syntax mistake but an overall structural error in table choice and join logic, altering the intended meaning of the query. Therefore, this is a global error.",
            "error_type": "Global: incorrect join/structure error"
        }
    },
    "qwen3": {
        "bb4987c184d509429ea2e482": {
            "db_id": "mimic_iv",
            "generator_name": "qwen3",
            "question": "How many patients received a plasma lab test since 1 year ago?",
            "gold_sql": "SELECT COUNT( DISTINCT admissions.subject_id ) FROM admissions WHERE admissions.hadm_id IN ( SELECT labevents.hadm_id FROM labevents WHERE labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'plasma' ) AND datetime(labevents.charttime) >= datetime('2100-12-31 23:59:00','-1 year') )",
            "pred_sql": "SELECT COUNT(DISTINCT le.subject_id) FROM labevents le JOIN d_labitems dli ON le.itemid = dli.itemid WHERE dli.label LIKE '%plasma%' AND le.charttime >= datetime('2100-12-31 23:59:00', '-1 year');",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['2.0']]",
            "is_correct": false,
            "reasoning": "The only difference is in the WHERE clause\u2019s label filter: the ground truth requires an exact match (d_labitems.label = 'plasma') while the prediction uses a broad LIKE '%plasma%', which pulls in extra rows and inflates the count. This is a localized mistake in the condition, not a structural or multi-clause logic error, so it\u2019s a Local error.",
            "error_type": "Local: where-clause value-matching error"
        },
        "227b5e0e2e01df82980de19b": {
            "db_id": "mimic_iv",
            "generator_name": "qwen3",
            "question": "Since patient 10039831's admission in the icu, how many days have elapsed?",
            "gold_sql": "SELECT 1 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J', icustays.intime) ) FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10039831 ) AND icustays.outtime IS NULL",
            "pred_sql": "SELECT CAST((julianday('2100-12-31 23:59:00') - julianday(intime)) AS INTEGER) AS days_elapsed FROM icustays WHERE subject_id = 10039831 ORDER BY intime DESC LIMIT 1;",
            "gold_answer": "[['0.182']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL completely changes the logic for selecting the relevant ICU stay. Instead of restricting to the current ICU stay (outtime IS NULL) for the patient\u2019s hospital admission, it simply picks the most recent ICU stay by ORDER BY and ignores the outtime filter and hadm_id relationship. This is not a minor typo or localized mistake\u2014it alters the core query structure and the intended meaning, so it is a global error.",
            "error_type": "Global: flawed join/filter logic"
        }
    }
}