{
    "macsql": {
        "6db0ca7ff25c436c79d07413": {
            "db_id": "mimic_iv",
            "generator_name": "macsql",
            "question": "What was the diagnosis received by patient 10038081 for the last time?",
            "gold_sql": "SELECT d_icd_diagnoses.long_title FROM d_icd_diagnoses WHERE d_icd_diagnoses.icd_code IN ( SELECT diagnoses_icd.icd_code FROM diagnoses_icd WHERE diagnoses_icd.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10038081 ) ORDER BY diagnoses_icd.charttime DESC LIMIT 1 )",
            "pred_sql": "SELECT T2.`long_title` FROM diagnoses_icd AS T1 INNER JOIN d_icd_diagnoses AS T2 ON T1.`icd_code` = T2.`icd_code` WHERE T1.`hadm_id` = ( SELECT `hadm_id` FROM admissions WHERE `subject_id` = 10038081 ORDER BY `dischtime` DESC LIMIT 1 )",
            "gold_answer": "[['transfusion related acute lung injury (trali)']]",
            "pred_answer": "[['acquired hypertrophic pyloric stenosis'], ['acute kidney failure, unspecified'], ['acute respiratory failure'], ['altered mental status'], ['anemia, unspecified'], ['asthma, unspecified type, unspecified'], ['cachexia'], ['chronic kidney disease, unspecified'], ['cirrhosis of liver without mention of alcohol'], ['diabetes mellitus without mention of complication, type ii or unspecified type, uncontrolled'], ['do not resuscitate status'], ['encounter for palliative care'], ['epistaxis'], ['esophageal varices without mention of bleeding'], ['glucocorticoid deficiency'], ['hyperpotassemia'], ['hypertensive chronic kidney disease, unspecified, with chronic kidney disease stage i through stage iv, or unspecified'], ['hyposmolality and/or hyponatremia'], ['hypotension, unspecified'], ['jaundice, unspecified, not of newborn'], ['natural blood and blood products causing adverse effects in therapeutic use'], ['oliguria and anuria'], ['other and unspecified coagulation defects'], ['other and unspecified hyperlipidemia'], ['other ascites'], ['other disorders of muscle, ligament, and fascia'], ['other fluid overload'], ['other specified disorders of stomach and duodenum'], ['other specified pre-operative examination'], ['paralytic ileus'], ['paroxysmal ventricular tachycardia'], ['personal history of malignant neoplasm of tongue'], ['portal hypertension'], ['pulmonary congestion and hypostasis'], ['spontaneous bacterial peritonitis'], ['tachypnea'], ['transfusion related acute lung injury (trali)'], ['unspecified vascular insufficiency of intestine']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic by selecting diagnoses based on the patient\u2019s last hospital admission (using discharge time) rather than the single most recent diagnosis record (using diagnoses_icd.charttime). It retrieves all diagnoses for that admission instead of the one latest diagnosis, thereby altering the overall intended result. This error spans multiple clauses and requires restructuring the core query logic, so it is a global issue.",
            "error_type": "Global: incorrect logic"
        },
        "a426a5f7267fbe34c05da68d": {
            "db_id": "mimic_iv",
            "generator_name": "macsql",
            "question": "What's the white blood cells change of patient 10008287 last measured on the last hospital visit compared to the first value measured on the last hospital visit?",
            "gold_sql": "SELECT ( SELECT labevents.valuenum FROM labevents WHERE labevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10008287 AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime DESC LIMIT 1 ) AND labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'white blood cells' ) ORDER BY labevents.charttime DESC LIMIT 1 ) - ( SELECT labevents.valuenum FROM labevents WHERE labevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10008287 AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime DESC LIMIT 1 ) AND labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'white blood cells' ) ORDER BY labevents.charttime ASC LIMIT 1 )",
            "pred_sql": "SELECT (last_value - first_value) AS wbc_change FROM ( SELECT (SELECT valuenum FROM labevents WHERE subject_id = 10008287 AND hadm_id = ( SELECT hadm_id FROM admissions WHERE subject_id = 10008287 AND dischtime IS NOT NULL ORDER BY admittime DESC LIMIT 1 ) AND itemid = 51006 AND charttime = ( SELECT MIN(charttime) FROM labevents WHERE subject_id = 10008287 AND hadm_id = ( SELECT hadm_id FROM admissions WHERE subject_id = 10008287 AND dischtime IS NOT NULL ORDER BY admittime DESC LIMIT 1 ) AND itemid = 51006 ) ) AS first_value, (SELECT valuenum FROM labevents WHERE subject_id = 10008287 AND hadm_id = ( SELECT hadm_id FROM admissions WHERE subject_id = 10008287 AND dischtime IS NOT NULL ORDER BY admittime DESC LIMIT 1 ) AND itemid = 51006 AND charttime = ( SELECT MAX(charttime) FROM labevents WHERE subject_id = 10008287 AND hadm_id = ( SELECT hadm_id FROM admissions WHERE subject_id = 10008287 AND dischtime IS NOT NULL ORDER BY admittime DESC LIMIT 1 ) AND itemid = 51006 ) ) AS last_value ) AS wbc_values",
            "gold_answer": "[['-1.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL differs from the ground truth only in how it identifies the \u201cwhite blood cells\u201d lab test\u2014it hard-codes itemid = 51006 instead of looking up d_labitems.label = 'white blood cells'. This causes the wrong measurements to be pulled and hence the wrong change value. All other structure (subqueries, date ordering, hadm_id filtering) matches the intended logic. The error is confined to the WHERE clause\u2019s itemid filter (a simple misreference), without impacting joins or overall query flow. Therefore it is a localized column/value reference error.",
            "error_type": "Local: incorrect itemid reference error"
        },
        "bd635bf7a1d3589befdf1632": {
            "db_id": "mimic_iv",
            "generator_name": "macsql",
            "question": "Tell me the top five diagnoses with the highest 6-month mortality rate.",
            "gold_sql": "SELECT d_icd_diagnoses.long_title FROM d_icd_diagnoses WHERE d_icd_diagnoses.icd_code IN ( SELECT T4.icd_code FROM ( SELECT T3.icd_code, DENSE_RANK() OVER ( ORDER BY T3.C2 ASC ) AS C3 FROM ( SELECT T2.icd_code, AVG(C1) AS C2 FROM ( SELECT T1.icd_code, ( CASE WHEN strftime('%J',patients.dod) - strftime('%J',T1.charttime) < 365 / 2 THEN 0 ELSE 1 END ) as C1 FROM ( SELECT admissions.subject_id, diagnoses_icd.icd_code, diagnoses_icd.charttime FROM diagnoses_icd JOIN admissions ON diagnoses_icd.hadm_id = admissions.hadm_id WHERE strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnoses_icd.charttime) >= 365 / 2 GROUP BY admissions.subject_id, diagnoses_icd.icd_code HAVING MIN(diagnoses_icd.charttime) = diagnoses_icd.charttime ) AS T1 JOIN patients ON T1.subject_id = patients.subject_id ) AS T2 GROUP BY T2.icd_code ) AS T3 ) AS T4 WHERE T4.C3 <= 5 )",
            "pred_sql": "WITH DiagnosisMortality AS ( SELECT D.icd_code, COUNT(DISTINCT P.subject_id) AS total_patients, SUM(CASE WHEN P.dod IS NOT NULL AND P.dod <= datetime(F.first_diagnosis_time, '+6 months') THEN 1 ELSE 0 END) AS deaths_within_6_months FROM diagnoses_icd D JOIN (SELECT subject_id, MIN(charttime) AS first_diagnosis_time FROM diagnoses_icd GROUP BY subject_id) F ON D.subject_id = F.subject_id JOIN patients P ON D.subject_id = P.subject_id GROUP BY D.icd_code ) SELECT icd_code FROM DiagnosisMortality ORDER BY CAST(deaths_within_6_months AS REAL) / total_patients DESC LIMIT 5",
            "gold_answer": "[['abnormal involuntary movements'], ['acidosis'], ['acute and subacute hepatic failure with coma'], ['acute and subacute hepatic failure without coma'], ['acute kidney failure with lesion of tubular necrosis'], ['acute kidney failure, unspecified'], ['acute posthemorrhagic anemia'], ['acute respiratory failure'], ['acute respiratory failure, unspecified whether with hypoxia or hypercapnia'], ['alcohol abuse, continuous'], ['alcohol abuse, in remission'], ['alcoholic cirrhosis of liver'], ['alcoholic polyneuropathy'], ['amyotrophic lateral sclerosis'], ['anemia in other chronic diseases classified elsewhere'], ['arthrodesis status'], ['atelectasis'], ['atherosclerotic heart disease of native coronary artery with other forms of angina pectoris'], ['automatic implantable cardiac defibrillator in situ'], ['benign neoplasm of cerebral meninges'], ['bipolar disorder, unspecified'], ['chronic airway obstruction, not elsewhere classified'], ['chronic kidney disease, stage 3 (moderate)'], ['chronic kidney disease, stage iii (moderate)'], ['chronic kidney disease, unspecified'], ['chronic osteomyelitis, site unspecified'], ['chronic systolic heart failure'], ['cirrhosis of liver without mention of alcohol'], ['constipation, unspecified'], ['delirium due to conditions classified elsewhere'], ['dementia, unspecified, without behavioral disturbance'], ['dependence on respirator, status'], ['diarrhea'], ['diplopia'], ['do not resuscitate status'], ['early satiety'], ['edema'], ['embolism and thrombosis of other specified artery'], ['encounter for palliative care'], ['hemoperitoneum'], ['hemorrhage of gastrointestinal tract, unspecified'], ['hip joint replacement'], ['hyperosmolality and/or hypernatremia'], ['hyperpotassemia'], ['hypertensive chronic kidney disease with stage 1 through stage 4 chronic kidney disease, or unspecified chronic kidney disease'], ['hypertensive chronic kidney disease, unspecified, with chronic kidney disease stage i through stage iv, or unspecified'], ['hypertrophy (benign) of prostate without urinary obstruction and other lower urinary tract symptom (luts)'], ['hypo-osmolality and hyponatremia'], ['hypospadias'], ['hypotension, unspecified'], ['hypovolemic shock'], ['ileus, unspecified'], ['infection with microorganisms resistant to penicillins'], ['jaundice, unspecified, not of newborn'], ['leukocytosis, unspecified'], ['long term (current) use of insulin'], ['malignant neoplasm of body of pancreas'], ['malignant neoplasm of liver, secondary'], ['malignant neoplasm of rectosigmoid junction'], ['metabolic encephalopathy'], ['methicillin susceptible staphylococcus aureus infection as the cause of diseases classified elsewhere'], ['migraine, unspecified, without mention of intractable migraine without mention of status migrainosus'], ['mycosis fungoides, unspecified site, extranodal and solid organ sites'], ['neoplasm related pain (acute) (chronic)'], ['nephritis and nephropathy, not specified as acute or chronic, with other specified pathological lesion in kidney'], ['nonalcoholic steatohepatitis (nash)'], ['nonspecific elevation of levels of transaminase or lactic acid dehydrogenase [ldh]'], ['old myocardial infarction'], ['other ascites'], ['other chronic pulmonary heart diseases'], ['other cirrhosis of liver'], ['other closed fractures of distal end of radius (alone)'], ['other complications due to other vascular device, implant, and graft'], ['other constipation'], ['other convulsions'], ['other diseases of lung, not elsewhere classified'], ['other disorders of neurohypophysis'], ['other dysphagia'], ['other postprocedural shock, initial encounter'], ['other respiratory abnormalities'], ['other secondary thrombocytopenia'], ['other septicemia due to gram-negative organisms'], ['other specified analgesics and antipyretics causing adverse effects in therapeutic use'], ['other specified bacterial agents as the cause of diseases classified elsewhere'], ['other specified disorders of peritoneum'], ['other specified forms of hearing loss'], ['palpitations'], ['peritonitis, unspecified'], ['personal history of alcoholism'], ['personal history of colonic polyps'], ['personal history of other malignant neoplasm of skin'], ['personal history of peptic ulcer disease'], ['personal history of poliomyelitis'], ['personal history of pulmonary embolism'], ['personal history of tobacco use'], ['personal history of transient ischemic attack (tia), and cerebral infarction without residual deficits'], ['pneumonia due to klebsiella pneumoniae'], ['postprocedural hemorrhage of a circulatory system organ or structure following a cardiac catheterization'], ['posttraumatic stress disorder'], ['presence of coronary angioplasty implant and graft']]",
            "pred_answer": "[['icd9|29680'], ['icd9|496'], ['icd9|5715'], ['icd9|v08'], ['icd9|v462']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally miscalculates the 6-month mortality rate by using each patient\u2019s overall first diagnosis time (across all codes) rather than the first occurrence of each specific diagnosis. It also fails to filter out diagnoses that occurred less than 6 months before the fixed \u2018today\u2019 and misuses the '+6 months' offset instead of the prescribed 365/2-day window, thereby altering the intended grouping, timing logic, and mortality calculation. This is not a simple column or syntax mistake but a flaw that spans multiple clauses (CTE definition, joins, date arithmetic, grouping), requiring a major rewrite of the query\u2019s logic rather than a localized fix.",
            "error_type": "Global: flawed mortality calculation logic"
        }
    },
    "qwen3": {
        "fb35e5711bd598ff9c938892": {
            "db_id": "mimic_iv",
            "generator_name": "qwen3",
            "question": "What was the name of the specimen test that patient 10038992 had for the last time last month?",
            "gold_sql": "SELECT microbiologyevents.spec_type_desc FROM microbiologyevents WHERE microbiologyevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10038992 ) AND datetime(microbiologyevents.charttime,'start of month') = datetime('2100-12-31 23:59:00','start of month','-1 month') ORDER BY microbiologyevents.charttime DESC LIMIT 1",
            "pred_sql": "SELECT test_name FROM microbiologyevents WHERE subject_id = 10038992 AND datetime(charttime, 'start of month') = datetime('2100-12-31 23:59:00', 'start of month', '-1 month') ORDER BY charttime DESC LIMIT 1;",
            "gold_answer": "[['blood culture']]",
            "pred_answer": "[['blood culture, routine']]",
            "is_correct": false,
            "reasoning": "The predicted query errs only in the SELECT clause by choosing microbiologyevents.test_name instead of spec_type_desc. Everything else (filtering by month, ordering, LIMIT) maintains the same structure and logical flow. This is a localized column\u2010reference mistake, not a structural or multi\u2010clause logic error.",
            "error_type": "Local: column reference error"
        }
    },
    "codes": {
        "8346d40a91793343d5e5393e": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What are the charges for a procedure called excision of right internal mammary artery, percutaneous endoscopic approach?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.event_type = 'procedures_icd' AND cost.event_id IN ( SELECT procedures_icd.row_id FROM procedures_icd WHERE procedures_icd.icd_code = ( SELECT d_icd_procedures.icd_code FROM d_icd_procedures WHERE d_icd_procedures.long_title = 'excision of right internal mammary artery, percutaneous endoscopic approach' ) )",
            "pred_sql": "SELECT cost.cost FROM procedures_icd INNER JOIN d_icd_procedures ON procedures_icd.icd_code = d_icd_procedures.icd_code INNER JOIN cost ON cost.event_id = procedures_icd.row_id WHERE d_icd_procedures.long_title LIKE '%excision of right internal mammary artery, percutaneous endoscopic approach%'",
            "gold_answer": "[['6.96']]",
            "pred_answer": "[['13.43'], ['5.13'], ['6.96'], ['9.34']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fails to include the required filter cost.event_type = 'procedures_icd' and also omits DISTINCT, leading to extra cost rows that are unrelated to the intended procedure. This is a mistake confined to the WHERE clause and does not alter the overall join structure or logic beyond this missing condition.",
            "error_type": "Local: missing event_type filter"
        },
        "d395b7b77c91a485233becad": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What was the last prescribed dose of aspirin (buffered) that patient 10024043 got in 04/2100?",
            "gold_sql": "SELECT prescriptions.dose_val_rx FROM prescriptions WHERE prescriptions.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10024043 ) AND prescriptions.drug = 'aspirin (buffered)' AND strftime('%Y-%m',prescriptions.starttime) = '2100-04' ORDER BY prescriptions.starttime DESC LIMIT 1",
            "pred_sql": "SELECT prescriptions.drug FROM prescriptions WHERE prescriptions.subject_id = 10024043 AND prescriptions.starttime LIKE '2100-04-21%' AND prescriptions.drug = 'aspirin (buffered)' ORDER BY prescriptions.stoptime DESC LIMIT 1",
            "gold_answer": "[['325.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query makes several localized mistakes without altering the overall structure:\n1. SELECT clause is wrong: it returns prescriptions.drug instead of prescriptions.dose_val_rx.\n2. The WHERE clause filters starttime to a single day ('2100-04-21%') instead of the whole month ('2100-04').\n3. It orders by stoptime rather than starttime.  \nNone of these errors require changing the join logic or overall query structure\u2014they are confined to column selection, filtering literals, and ordering. Therefore it\u2019s a Local error.",
            "error_type": "Local: where-clause and select-column error"
        },
        "859c5d5288e0f9d7cdce7d9c": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What is the 6-month survival rate for patients diagnosed with nonrheumatic mitral (valve) insufficiency?",
            "gold_sql": "SELECT AVG(C1) FROM ( SELECT ( CASE WHEN (strftime('%J',patients.dod) - strftime('%J',T1.charttime)) < 365 / 2 THEN 0 ELSE 1 END ) AS C1 FROM ( SELECT admissions.subject_id, diagnoses_icd.charttime FROM diagnoses_icd JOIN admissions ON diagnoses_icd.hadm_id = admissions.hadm_id WHERE diagnoses_icd.icd_code = ( SELECT d_icd_diagnoses.icd_code FROM d_icd_diagnoses WHERE d_icd_diagnoses.long_title = 'nonrheumatic mitral (valve) insufficiency' ) AND strftime('%J','2100-12-31 23:59:00') - strftime('%J',diagnoses_icd.charttime) >= 365 / 2 GROUP BY admissions.subject_id HAVING MIN(diagnoses_icd.charttime) = diagnoses_icd.charttime ) AS T1 JOIN patients ON T1.subject_id = patients.subject_id )",
            "pred_sql": "SELECT cast(sum(CASE WHEN patients.dod IS NULL THEN 1 ELSE 0 END) AS REAL) * 100 / count(patients.subject_id) FROM patients INNER JOIN diagnoses_icd ON patients.subject_id = diagnoses_icd.subject_id WHERE diagnoses_icd.icd_code = '493.81' GROUP BY patients.subject_id HAVING count(patients.subject_id) > 0",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted query completely ignores the 6-month time window, uses a hard-coded (and incorrect) ICD code rather than looking up the diagnosis by its long_title, and aggregates survival incorrectly by grouping per patient and computing a percentage at that level. These issues span the overall logic\u2014date filtering, code lookup, and aggregation strategy\u2014so this is not a small localized typo or syntax fix but a fundamentally flawed approach requiring a restructuring of the query.",
            "error_type": "Global: logical inconsistency error"
        },
        "4fd9504906ec9a8655390830": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "How many hours have passed from the time when patient 10018081 was admitted to the icu?",
            "gold_sql": "SELECT 24 * ( strftime('%J','2100-12-31 23:59:00') - strftime('%J', icustays.intime) ) FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10018081 ) AND icustays.outtime IS NULL",
            "pred_sql": "SELECT cast(strftime('%J', icustays.intime) - strftime('%J', admissions.admittime) AS REAL) * 24 FROM admissions INNER JOIN icustays ON admissions.hadm_id = icustays.hadm_id WHERE admissions.subject_id = 10018081",
            "gold_answer": "[['126.817']]",
            "pred_answer": "[['0.2']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally misinterprets the question\u2019s intent by computing the time between hospital admission and ICU admission rather than the hours since ICU admission until now. It also omits the filter for a current ICU stay (outtime IS NULL) and uses the wrong timestamp for \u201cnow.\u201d These flaws span multiple clauses (JOIN logic, WHERE conditions, time calculations) and change the core purpose of the query, indicating a global logical error.",
            "error_type": "Global: logical inconsistency"
        },
        "0f238fbe279f08c43dc8c8dc": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "In patients who had the continuous invasive mechanical ventilation for less than 96 consecutive hours this year, what are the three most common diagnoses that followed within 2 months?",
            "gold_sql": "SELECT d_icd_diagnoses.long_title FROM d_icd_diagnoses WHERE d_icd_diagnoses.icd_code IN ( SELECT T3.icd_code FROM ( SELECT T2.icd_code, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM ( SELECT admissions.subject_id, procedures_icd.charttime FROM procedures_icd JOIN admissions ON procedures_icd.hadm_id = admissions.hadm_id WHERE procedures_icd.icd_code = ( SELECT d_icd_procedures.icd_code FROM d_icd_procedures WHERE d_icd_procedures.long_title = 'continuous invasive mechanical ventilation for less than 96 consecutive hours' ) AND datetime(procedures_icd.charttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT admissions.subject_id, diagnoses_icd.icd_code, diagnoses_icd.charttime FROM diagnoses_icd JOIN admissions ON diagnoses_icd.hadm_id = admissions.hadm_id WHERE datetime(diagnoses_icd.charttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.subject_id = T2.subject_id WHERE T1.charttime < T2.charttime AND datetime(T2.charttime) BETWEEN datetime(T1.charttime) AND datetime(T1.charttime,'+2 month') GROUP BY T2.icd_code ) AS T3 WHERE T3.C1 <= 3 )",
            "pred_sql": "SELECT diagnoses_icd.icd_code, count(diagnoses_icd.icd_code) FROM diagnoses_icd INNER JOIN ( SELECT subject_id, hadm_id FROM admissions WHERE dischtime IS NOT NULL AND dischtime - admittime < 1095 AND admission_type = 'ELECTIVE' GROUP BY subject_id, hadm_id ) AS t3 ON diagnoses_icd.hadm_id = t3.hadm_id WHERE t3.admission_type = 'ELECTIVE' AND t3.dischtime - t3.admittime < 1095 GROUP BY diagnoses_icd.icd_code ORDER BY count(diagnoses_icd.icd_code) DESC LIMIT 3",
            "gold_answer": "[['accidental cut, puncture, perforation or hemorrhage during heart catheterization'], ['accidental puncture or laceration during a procedure, not elsewhere classified'], ['acute on chronic diastolic heart failure'], ['acute pancreatitis'], ['alkalosis'], ['anemia, unspecified'], ['asthma, unspecified type, unspecified'], ['calculus of bile duct without mention of cholecystitis, without mention of obstruction'], ['congestive heart failure, unspecified'], ['cystic kidney disease, unspecified'], ['depressive disorder, not elsewhere classified'], ['diabetes mellitus without mention of complication, type ii or unspecified type, not stated as uncontrolled'], ['hypovolemia'], ['long-term (current) use of insulin'], ['mitral valve disorders'], ['obstructive sleep apnea (adult)(pediatric)'], ['other and unspecified hyperlipidemia'], ['other chronic pulmonary heart diseases'], ['other iatrogenic hypotension'], ['other postprocedural status'], ['peritoneal adhesions (postoperative) (postinfection)'], ['personal history of methicillin resistant staphylococcus aureus'], ['physical restraints status'], ['portal hypertension'], ['postinflammatory pulmonary fibrosis'], ['schizoaffective disorder, unspecified'], ['thrombocytopenia, unspecified'], ['umbilical hernia without mention of obstruction or gangrene']]",
            "pred_answer": "no such column: t3.admission_type",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s subquery aliased as t3 only selects subject_id and hadm_id, yet the outer query refers to t3.admission_type (and also t3.dischtime and t3.admittime) which do not exist in t3\u2019s projection. This is a column reference error in a specific part of the query and does not require restructuring the overall logic.",
            "error_type": "Local: table/column reference error"
        },
        "620dde6d062ca27f785e6250": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "How old is patient 10038992 on the last hospital visit?",
            "gold_sql": "SELECT admissions.age FROM admissions WHERE admissions.subject_id = 10038992 AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime DESC LIMIT 1",
            "pred_sql": "SELECT admissions.admittime, admissions.dischtime FROM admissions WHERE admissions.subject_id = 10038992 ORDER BY admissions.admittime DESC LIMIT 1",
            "gold_answer": "[['70.0']]",
            "pred_answer": "[['2100-11-23 18:26:00', '2100-11-29 16:22:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL selects the admission and discharge times instead of the patient's age and fails to filter for only completed (discharged) visits. It fundamentally alters the query\u2019s intent by returning different columns and missing the dischtime IS NOT NULL condition, thus changing the overall logic rather than fixing a localized issue.",
            "error_type": "Global: incorrect selection and filter"
        },
        "33423e8e52128ee0f0498b33": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What was the name of the last input that patient 10004422 had?",
            "gold_sql": "SELECT d_items.label FROM d_items WHERE d_items.itemid IN ( SELECT inputevents.itemid FROM inputevents WHERE inputevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10004422 ) ) ORDER BY inputevents.starttime DESC LIMIT 1 )",
            "pred_sql": "SELECT inputevents.itemid FROM patients INNER JOIN inputevents ON patients.subject_id = inputevents.subject_id WHERE patients.subject_id = 10004422 ORDER BY inputevents.charttime DESC LIMIT 1",
            "gold_answer": "[['po intake']]",
            "pred_answer": "no such column: inputevents.charttime",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column inputevents.charttime instead of inputevents.starttime. This is a simple column reference mistake and can be fixed by correcting the column name without altering the overall query structure or logic.",
            "error_type": "Local: table/column reference error"
        },
        "b46069965a45836dc176614f": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What was the first 5% dextrose (excel bag) dose that patient 10018081 was prescribed on the current hospital visit?",
            "gold_sql": "SELECT prescriptions.dose_val_rx FROM prescriptions WHERE prescriptions.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10018081 AND admissions.dischtime IS NULL ) AND prescriptions.drug = '5% dextrose (excel bag)' ORDER BY prescriptions.starttime ASC LIMIT 1",
            "pred_sql": "SELECT dose_val_rx FROM prescriptions WHERE subject_id = 10018081 AND drug = 'dextrose 5%' ORDER BY dose_val_rx DESC LIMIT 0, 0.05",
            "gold_answer": "[['500.0']]",
            "pred_answer": "datatype mismatch",
            "is_correct": false,
            "reasoning": "The predicted SQL fails immediately with a datatype mismatch due to the LIMIT clause using a non\u2010integer (0.05). This is a localized issue in value parsing/syntax. The overall query structure (selecting from prescriptions) remains intact, so no global restructuring is required.",
            "error_type": "Local: value parsing error"
        },
        "50727c16951cf4ee1f147513": {
            "db_id": "mimic_iv",
            "generator_name": "codes",
            "question": "What's the mean blood pressure change of patient 10018328 second measured on the first icu visit compared to the first value measured on the first icu visit?",
            "gold_sql": "SELECT ( SELECT chartevents.valuenum FROM chartevents WHERE chartevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10018328 ) AND icustays.outtime IS NOT NULL ORDER BY icustays.intime ASC LIMIT 1 ) AND chartevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'arterial blood pressure mean' AND d_items.linksto = 'chartevents' ) ORDER BY chartevents.charttime ASC LIMIT 1 OFFSET 1 ) - ( SELECT chartevents.valuenum FROM chartevents WHERE chartevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10018328 ) AND icustays.outtime IS NOT NULL ORDER BY icustays.intime ASC LIMIT 1 ) AND chartevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'arterial blood pressure mean' AND d_items.linksto = 'chartevents' ) ORDER BY chartevents.charttime ASC LIMIT 1 )",
            "pred_sql": "SELECT avg(chartevents.valuenum) FROM chartevents INNER JOIN icustays ON chartevents.stay_id = icustays.stay_id WHERE icustays.subject_id = 10018328 AND chartevents.itemid IN (211,220045)",
            "gold_answer": "[['4.0']]",
            "pred_answer": "[['68.278']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally changes the logic: instead of calculating the difference between the second and first measurements on the first ICU visit, it averages all values for two itemids across all ICU stays for the patient. It ignores the first ICU visit restriction, the ordering of measurements, and the subtraction operation. This is not a localized typo or missing alias, but a completely different aggregation and filtering strategy, thus a global error.",
            "error_type": "Global: incorrect aggregation logic"
        }
    },
    "llm2sql": {
        "7a6abe3bd11c83f13ac6651a": {
            "db_id": "mimic_iv",
            "generator_name": "llm2sql",
            "question": "When did patient 10038933 come to the hospital via emergency room for the last time?",
            "gold_sql": "SELECT admissions.admittime FROM admissions WHERE admissions.subject_id = 10038933 AND admissions.admission_location = 'emergency room' AND admissions.dischtime IS NOT NULL ORDER BY admissions.admittime DESC LIMIT 1",
            "pred_sql": "SELECT admittime FROM admissions WHERE subject_id = 10038933 AND admission_type = 'emergency' AND dischtime IS NOT NULL ORDER BY admittime DESC LIMIT 1",
            "gold_answer": "[['2100-09-22 12:09:00']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses admission_type = 'emergency' instead of the correct column admission_location = 'emergency room'. This is a column reference error that does not alter the overall query structure or logic and can be fixed by using the correct column name and value.",
            "error_type": "Local: table/column reference error"
        },
        "355dc4cb5c3c6b88cd291cd3": {
            "db_id": "mimic_iv",
            "generator_name": "llm2sql",
            "question": "Get me patient 10020740's total tpn without lipids input amount on the first icu visit.",
            "gold_sql": "SELECT SUM(inputevents.totalamount) FROM inputevents WHERE inputevents.stay_id IN ( SELECT icustays.stay_id FROM icustays WHERE icustays.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10020740 ) AND icustays.outtime IS NOT NULL ORDER BY icustays.intime ASC LIMIT 1 ) AND inputevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'tpn without lipids' AND d_items.linksto = 'inputevents' )",
            "pred_sql": "SELECT SUM(I.amount) AS total_tpn_without_lipids nFROM inputevents I nJOIN icustays S ON I.stay_id = S.stay_id nWHERE I.subject_id = 10020740 nAND S.subject_id = 10020740 nAND I.itemid IN (/* list of itemIDs for TPN without lipids */) nAND S.intime = ( n SELECT MIN(intime)  n FROM icustays  n WHERE subject_id = 10020740 n) *Note:* Replace `/* list of itemIDs for TPN without lipids */` with actual item IDs corresponding to TPN without lipids if they are known. If the item IDs are unknown, further look-up in `d_items` might be necessary based on dataset documentation or manual inspection.",
            "gold_answer": "[['9000.0']]",
            "pred_answer": "near \"nFROM\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL contains a localized syntax mistake\u2014specifically the stray \u201cn\u201d prefix before FROM (\"AS total_tpn_without_lipids nFROM\") leading to a syntax error. This is a confined, clause-level issue and does not reflect a fundamental logic or structural flaw in the overall query intent. Therefore, it is a local error.",
            "error_type": "Local: syntax error"
        },
        "17d0633bd144df773e227973": {
            "db_id": "mimic_iv",
            "generator_name": "llm2sql",
            "question": "How much is a urea nitrogen lab test?",
            "gold_sql": "SELECT DISTINCT cost.cost FROM cost WHERE cost.event_type = 'labevents' AND cost.event_id IN ( SELECT labevents.row_id FROM labevents WHERE labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'urea nitrogen' ) )",
            "pred_sql": "SELECT itemid FROM d_labitems WHERE label = 'urea nitrogen';",
            "gold_answer": "[['9.91']]",
            "pred_answer": "[['51006.0'], ['52647.0']]",
            "is_correct": false,
            "reasoning": "The predicted query completely ignores the cost table and returns only the itemid from d_labitems, rather than retrieving the cost of the specified lab test. This is not a minor typo or missing column; it fundamentally alters the intended logic (finding the cost) by querying the wrong table and omitting necessary joins. Thus it is a global error.",
            "error_type": "Global: incorrect table reference"
        }
    },
    "deepseek": {
        "e9ed36089be4408a078a0d60": {
            "db_id": "mimic_iv",
            "generator_name": "deepseek",
            "question": "How many times in 2100 did patient 10022281 receive a rdw test?",
            "gold_sql": "SELECT COUNT(*) FROM labevents WHERE labevents.itemid IN ( SELECT d_labitems.itemid FROM d_labitems WHERE d_labitems.label = 'rdw' ) AND labevents.hadm_id IN ( SELECT admissions.hadm_id FROM admissions WHERE admissions.subject_id = 10022281 ) AND strftime('%Y',labevents.charttime) = '2100'",
            "pred_sql": "SELECT COUNT(*) FROM labevents JOIN d_labitems ON labevents.itemid = d_labitems.itemid WHERE labevents.subject_id = 10022281 AND d_labitems.label = 'red cell distribution width (rdw)' AND strftime('%Y', labevents.charttime) = '2100';",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query fails only in the WHERE clause literal for the lab test label: it uses 'red cell distribution width (rdw)' instead of the correct 'rdw'. All other joins and filters (including filtering by patient and year) follow the intended structure. This mistake is localized to a single condition and does not require changing the overall query logic or structure.",
            "error_type": "Local: value parsing error"
        },
        "e7780f295aaf7bacd3b27961": {
            "db_id": "mimic_iv",
            "generator_name": "deepseek",
            "question": "Please tell me the total number of patients who had a famotidine (pepcid) input since 2100.",
            "gold_sql": "SELECT COUNT( DISTINCT admissions.subject_id ) FROM admissions WHERE admissions.hadm_id IN ( SELECT icustays.hadm_id FROM icustays WHERE icustays.stay_id IN ( SELECT inputevents.stay_id FROM inputevents WHERE inputevents.itemid IN ( SELECT d_items.itemid FROM d_items WHERE d_items.label = 'famotidine (pepcid)' AND d_items.linksto = 'inputevents' ) AND strftime('%Y',inputevents.starttime) >= '2100' ) )",
            "pred_sql": "SELECT COUNT(DISTINCT ie.subject_id) AS total_patients FROM inputevents ie JOIN d_items di ON ie.itemid = di.itemid WHERE di.label IN ('famotidine', 'pepcid') AND ie.starttime >= '2100-01-01 00:00:00';",
            "gold_answer": "[['17.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted query\u2019s error lies in the WHERE clause: it filters on di.label IN ('famotidine', 'pepcid') rather than matching the full label 'famotidine (pepcid)' and does not include the linksto filter. This is a localized mistake in the value condition and does not require restructuring the joins or overall logic of the query.",
            "error_type": "Local: incorrect filter value"
        },
        "f21ac0d3fff988fd6278434b": {
            "db_id": "mimic_iv",
            "generator_name": "deepseek",
            "question": "How many patients received excision of right saphenous vein, percutaneous endoscopic approach treatment within the same hospital visit after being diagnosed with essential (primary) hypertension this year?",
            "gold_sql": "SELECT COUNT( DISTINCT T1.subject_id ) FROM ( SELECT admissions.subject_id, diagnoses_icd.charttime, admissions.hadm_id FROM diagnoses_icd JOIN admissions ON diagnoses_icd.hadm_id = admissions.hadm_id WHERE diagnoses_icd.icd_code = ( SELECT d_icd_diagnoses.icd_code FROM d_icd_diagnoses WHERE d_icd_diagnoses.long_title = 'essential (primary) hypertension' ) AND datetime(diagnoses_icd.charttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T1 JOIN ( SELECT admissions.subject_id, procedures_icd.charttime, admissions.hadm_id FROM procedures_icd JOIN admissions ON procedures_icd.hadm_id = admissions.hadm_id WHERE procedures_icd.icd_code = ( SELECT d_icd_procedures.icd_code FROM d_icd_procedures WHERE d_icd_procedures.long_title = 'excision of right saphenous vein, percutaneous endoscopic approach' ) AND datetime(procedures_icd.charttime,'start of year') = datetime('2100-12-31 23:59:00','start of year','-0 year') ) AS T2 ON T1.subject_id = T2.subject_id WHERE T1.charttime < T2.charttime AND T1.hadm_id = T2.hadm_id",
            "pred_sql": "SELECT COUNT(DISTINCT p.subject_id) AS num_patients FROM patients p JOIN admissions a ON p.subject_id = a.subject_id JOIN diagnoses_icd d ON a.hadm_id = d.hadm_id JOIN d_icd_diagnoses dd ON d.icd_code = dd.icd_code JOIN procedures_icd proc ON a.hadm_id = proc.hadm_id JOIN d_icd_procedures dproc ON proc.icd_code = dproc.icd_code WHERE dd.long_title = 'Essential (primary) hypertension' AND dproc.long_title = 'Excision of right saphenous vein, percutaneous endoscopic approach' AND STRFTIME('%Y', a.admitt;",
            "gold_answer": "[['2.0']]",
            "pred_answer": "near \";\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL is syntactically incomplete, ending abruptly with \"AND STRFTIME('%Y', a.admitt;\" and causing a parse error. This is a localized syntax mistake that can be fixed without changing the overall query logic or joins.",
            "error_type": "Local: syntax error"
        }
    },
    "dinsql": {
        "853d6c6aace2c37387e3042e": {
            "db_id": "mimic_iv",
            "generator_name": "dinsql",
            "question": "Tell me about the most common five output events in 2100.",
            "gold_sql": "SELECT d_items.label FROM d_items WHERE d_items.itemid IN ( SELECT T1.itemid FROM ( SELECT outputevents.itemid, DENSE_RANK() OVER ( ORDER BY COUNT(*) DESC ) AS C1 FROM outputevents WHERE strftime('%Y',outputevents.charttime) = '2100' GROUP BY outputevents.itemid ) AS T1 WHERE T1.C1 <= 5 )",
            "pred_sql": "SELECT itemid FROM outputevents WHERE strftime('%Y', charttime) = '2100' GROUP BY itemid ORDER BY COUNT(*) DESC LIMIT 5",
            "gold_answer": "[['cerebral ventricular #1'], ['chest tube #1'], ['foley'], ['tf residual'], ['void']]",
            "pred_answer": "[['226559.0'], ['226560.0'], ['226588.0'], ['226606.0'], ['227510.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only selects the raw itemid from outputevents, failing to join to the d_items table to retrieve the event labels as required. This is a localized mistake in the SELECT clause/table reference, not a structural issue with the overall query logic or flow.",
            "error_type": "Local: table reference error"
        }
    }
}