{
    "dinsql": {
        "9268ab37a2d7fdb001795bef1e30dbe2": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "tell me the number of patients with coronary artery primary disease. (Values: CORONARY ARTERY DISEASE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"CORONARY ARTERY DISEASE\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DEMOGRAPHIC WHERE DIAGNOSIS LIKE '%CORONARY ARTERY DISEASE%'",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['7.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL\u2019s error lies solely in the WHERE clause: it uses a LIKE '%CORONARY ARTERY DISEASE%' pattern match instead of the exact equality comparison required. This mistake broadens the match and inflates the count but does not alter the query\u2019s overall structure, joins, or logic. It can be corrected by replacing LIKE with =, making it a localized fix.",
            "error_type": "Local: incorrect operator in WHERE clause"
        }
    },
    "llm2sql": {
        "9aed3ef959f024e0ffaf5f92500bda5a": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "mention the primary disease and diagnosis short title of the subject name betty campbell. (Values: Betty Campbell)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\",DIAGNOSES.\"SHORT_TITLE\" FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Betty Campbell\"",
            "pred_sql": "SELECT DIAGNOSES.LONG_TITLE, DIAGNOSES.SHORT_TITLE FROM DEMOGRAPHIC INNER JOIN DIAGNOSES ON DEMOGRAPHIC.SUBJECT_ID = DIAGNOSES.SUBJECT_ID AND DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.NAME = 'Betty Campbell';",
            "gold_answer": "[['ANGIOEDEMA', 'Acute respiratry failure'], ['ANGIOEDEMA', 'Acute uri NOS'], ['ANGIOEDEMA', 'Adv eff cardiovasc NEC'], ['ANGIOEDEMA', 'Angioneurotic edema'], ['ANGIOEDEMA', 'Backache NOS'], ['ANGIOEDEMA', 'DMII ophth nt st uncntrl'], ['ANGIOEDEMA', 'Hyperlipidemia NEC/NOS'], ['ANGIOEDEMA', 'Hypertension NOS'], ['ANGIOEDEMA', 'Myopia'], ['ANGIOEDEMA', 'Prolif diab retinopathy']]",
            "pred_answer": "[['Acute respiratory failure', 'Acute respiratry failure'], ['Acute upper respiratory infections of unspecified site', 'Acute uri NOS'], ['Angioneurotic edema, not elsewhere classified', 'Angioneurotic edema'], ['Backache, unspecified', 'Backache NOS'], ['Diabetes with ophthalmic manifestations, type II or unspecified type, not stated as uncontrolled', 'DMII ophth nt st uncntrl'], ['Myopia', 'Myopia'], ['Other and unspecified agents primarily affecting the cardiovascular system causing adverse effects in therapeutic use', 'Adv eff cardiovasc NEC'], ['Other and unspecified hyperlipidemia', 'Hyperlipidemia NEC/NOS'], ['Proliferative diabetic retinopathy', 'Prolif diab retinopathy'], ['Unspecified essential hypertension', 'Hypertension NOS']]",
            "is_correct": false,
            "reasoning": "The predicted query is joining tables correctly (even though it redundantly uses both SUBJECT_ID and HADM_ID), and the WHERE clause is correct. The only mistake is in the SELECT clause: it returns DIAGNOSES.LONG_TITLE instead of the DEMOGRAPHIC.DIAGNOSIS column (the primary disease). This is a localized error in the column selection and doesn\u2019t require changing the overall query structure or join logic.",
            "error_type": "Local: column reference error"
        },
        "04e257060d814171a01a4a75a258d385": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "how many patients are primarily suffering from t5 fracture? (Values: T5 FRACTURE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"T5 FRACTURE\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE SHORT_TITLE LIKE '%T5 FRACTURE%' OR LONG_TITLE LIKE '%T5 FRACTURE%';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the DIAGNOSES table with LIKE filters on SHORT_TITLE and LONG_TITLE, whereas the question asks for the primary diagnosis recorded in the DEMOGRAPHIC table\u2019s DIAGNOSIS column. This is not a minor typo or clause mistake but a fundamental change in table choice and logic, altering the intended query structure and meaning.",
            "error_type": "Global: wrong table used"
        },
        "0889b8c37decb7cd8458fd44dc8b8bb5": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "how many patients with polycythemia were treated with main drug? (Values: Polycythemia vera, MAIN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DIAGNOSES.\"SHORT_TITLE\" = \"Polycythemia vera\" AND PRESCRIPTIONS.\"DRUG_TYPE\" = \"MAIN\"",
            "pred_sql": "SELECT COUNT(DISTINCT diagnoses.SUBJECT_ID) nFROM DIAGNOSES nJOIN PRESCRIPTIONS ON DIAGNOSES.SUBJECT_ID = PRESCRIPTIONS.SUBJECT_ID nAND DIAGNOSES.HADM_ID = PRESCRIPTIONS.HADM_ID nWHERE (diagnoses.SHORT_TITLE LIKE '%Polycythemia vera%' OR diagnoses.LONG_TITLE LIKE '%Polycythemia vera%') nAND PRESCRIPTIONS.DRUG_TYPE = 'MAIN';",
            "gold_answer": "[['1.0']]",
            "pred_answer": "near \"DIAGNOSES\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL contains a syntax error near \"DIAGNOSES\" due to the stray \"nFROM\" and \"nJOIN\" tokens and missing whitespace. This is a localized syntax mistake in the SELECT/FROM clause and does not affect the overall query logic or table relationships. It can be fixed by correcting the formatting and keywords without restructuring the query.",
            "error_type": "Local: syntax error"
        },
        "0f8c99adf2a5dc590120e3fc5f613dbc": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "what is the insurance and primary disease of the patient id 2560?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"INSURANCE\",DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"2560\"",
            "pred_sql": "SELECT DEMOGRAPHIC.INSURANCE, DIAGNOSES.LONG_TITLE FROM DEMOGRAPHIC INNER JOIN DIAGNOSES ON DEMOGRAPHIC.SUBJECT_ID = DIAGNOSES.SUBJECT_ID WHERE DEMOGRAPHIC.SUBJECT_ID = 2560;",
            "gold_answer": "[['Private', 'NEWBORN']]",
            "pred_answer": "[['Private', 'Congenital pigmentary anomalies of skin'], ['Private', 'Need for prophylactic vaccination and inoculation against viral hepatitis'], ['Private', 'Observation for suspected infectious condition'], ['Private', 'Routine or ritual circumcision'], ['Private', 'Single liveborn, born in hospital, delivered by cesarean section']]",
            "is_correct": false,
            "reasoning": "The predicted SQL incorrectly joins the DIAGNOSES table and selects DIAGNOSES.LONG_TITLE instead of using the DEMOGRAPHIC.DIAGNOSIS column. The extra JOIN and wrong column selection are localized to the SELECT and JOIN parts and do not require restructuring the overall query logic. This is a simple column reference error.",
            "error_type": "Local: table/column reference error"
        },
        "89a0044a0f95cc0d7cc6757f5a6c4d6f": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "among patients treated with base drug, how many of them had ventricular tachycardia as primary disease? (Values: VENTRICULAR TACHYCARDIA, BASE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"VENTRICULAR TACHYCARDIA\" AND PRESCRIPTIONS.\"DRUG_TYPE\" = \"BASE\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) FROM LAB l JOIN DIAGNOSES d ON l.SUBJECT_ID = d.SUBJECT_ID AND l.HADM_ID = d.HADM_ID WHERE l.LABEL = 'Base' AND d.LONG_TITLE = 'Ventricular tachycardia'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the LAB table and DIAGNOSES table instead of PRESCRIPTIONS and DEMOGRAPHIC, respectively. It filters on l.LABEL = 'Base' rather than PRESCRIPTIONS.DRUG_TYPE = 'BASE', and uses d.LONG_TITLE for ventricular tachycardia rather than DEMOGRAPHIC.DIAGNOSIS. This is not a simple column name or syntax mistake but a fundamental misuse of tables and joins, altering the entire query structure and intended logic.",
            "error_type": "Global: incorrect join strategy"
        }
    },
    "codes": {
        "91e4268fef7e4c6940983b195523dd3d": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Calculate the average age of unmarried patients born after the year 2097 (Values: SINGLE)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"MARITAL_STATUS\" = \"SINGLE\" AND DEMOGRAPHIC.\"DOB_YEAR\" > \"2097\"",
            "pred_sql": "SELECT avg(age) FROM demographic WHERE dob > '2097-01-01' AND marital_status = 'SINGLE'",
            "gold_answer": "[['47.6']]",
            "pred_answer": "[['46.0']]",
            "is_correct": false,
            "reasoning": "The predicted query incorrectly filters on the full DOB column with a date literal ('2097-01-01') instead of using the DOB_YEAR column with a year comparison (> 2097). This mistake is confined to a specific condition and does not require restructuring joins or the overall query logic, so it is a local error.",
            "error_type": "Local: column reference/value parsing error"
        },
        "9ce7d4ba8e33f5a9bb87ec0199c5fcd2": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients had procedure creation of conduit between left ventricle and aorta? (Values: Creation of conduit between left ventricle and aorta)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE PROCEDURES.\"LONG_TITLE\" = \"Creation of conduit between left ventricle and aorta\"",
            "pred_sql": "SELECT count(DISTINCT procedures.subject_id) FROM procedures INNER JOIN diagnoses ON procedures.subject_id = diagnoses.subject_id WHERE diagnoses.short_title = 'Creation of conduit between left ventricle and aorta'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally alters the query\u2019s logic by joining PROCEDURES to DIAGNOSES and filtering on DIAGNOSES.SHORT_TITLE rather than filtering PROCEDURES.LONG_TITLE. This is not a minor typo or localized mistake; it changes the tables and relationships used and thus the overall meaning of the query. Therefore it is a global error.",
            "error_type": "Global: incorrect table join/condition"
        },
        "0d8668ce9bb2d5b309822a5b89240277": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find out the birth date and time of admission for patient john gartman. (Values: John Gartman)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DOB\",DEMOGRAPHIC.\"ADMITTIME\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"John Gartman\"",
            "pred_sql": "SELECT demographic.dob, demographic.admittime FROM demographic INNER JOIN demographic ON demographic.subject_id = demographic.subject_id WHERE demographic.name = 'John Gartman'",
            "gold_answer": "[['2083-08-25 00:00:00', '2145-05-05 18:57:00']]",
            "pred_answer": "ambiguous column name: demographic.dob",
            "is_correct": false,
            "reasoning": "The predicted SQL introduces an unnecessary self\u2010JOIN on the same table without aliases, causing ambiguous column references (demographic.dob, demographic.admittime). This is a join/local reference issue that does not change the overall query logic\u2014it\u2019s confined to the JOIN clause and column references. Hence it\u2019s a localized error, not a structural rework of the query.",
            "error_type": "Local: ambiguous column reference"
        },
        "93f1c2203790abf5e19f70304d9fa6cb": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "among patients treated with amitriptyline, calculate the number of female patients. (Values: F, Amitriptyline)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"F\" AND PRESCRIPTIONS.\"DRUG\" = \"Amitriptyline\"",
            "pred_sql": "SELECT count(demographic.gender) FROM demographic INNER JOIN prescriptions ON demographic.subject_id = prescriptions.subject_id WHERE prescriptions.drug = 'Amitriptyline' AND demographic.gender = 'F'",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['3.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses COUNT(demographic.gender) without DISTINCT and joins PRESCRIPTIONS to DEMOGRAPHIC only on SUBJECT_ID rather than both SUBJECT_ID and HADM_ID. This incorrect join key and lack of de-duplication fundamentally changes the logic (it counts prescription rows, not unique patients), leading to an inflated count. Fixing it requires more than a minor syntax tweak\u2014it requires correcting the join relationship and adding DISTINCT, altering the core query structure.",
            "error_type": "Global: incorrect join strategy"
        },
        "00904139a2ed10eebae557a135321017": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients were transferred within this facilty? (Values: TRSF WITHIN THIS FACILITY)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ADMISSION_LOCATION\" = \"TRSF WITHIN THIS FACILITY\"",
            "pred_sql": "SELECT count(subject_id) FROM demographic WHERE admission_location = 'TRANSFER FROM HOSP/EXTRAM'",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['10.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the wrong literal in the WHERE clause (\u2018TRANSFER FROM HOSP/EXTRAM\u2019 instead of the required \u2018TRSF WITHIN THIS FACILITY\u2019). This is a localized mistake in the filter value and does not affect the query\u2019s overall structure or logic.",
            "error_type": "Local: value parsing error"
        },
        "8385c7828a91dfb287c01c8c00c801d6": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients were admitted before the year 2103 and underwent procedure under icd9 code 93?",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"ADMITYEAR\" < \"2103\" AND PROCEDURES.\"ICD9_CODE\" = \"93\"",
            "pred_sql": "SELECT count(DISTINCT subject_id) FROM procedures WHERE icd9_code = 93 AND strftime('%Y', admittedtime) < '2103'",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: admittedtime",
            "is_correct": false,
            "reasoning": "The predicted SQL fails because it references a non-existent column 'admittedtime'. This is a simple column reference error (misspelling or wrong column name) and can be fixed by using the correct column name (e.g., ADMITTIME or ADMITYEAR) without altering the overall query structure or joins.",
            "error_type": "Local: table/column reference error"
        }
    },
    "deepseek": {
        "0b8b878c3c9bf9cfc59e3c2528341dfa": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "for patient id 1875, specify the icd9 code and discharge time",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DISCHTIME\",DIAGNOSES.\"SHORT_TITLE\" FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"1875\"",
            "pred_sql": "SELECT D.ICD9_CODE, DE.DISCHTIME FROM DEMOGRAPHIC DE INNER JOIN DIAGNOSES D ON DE.SUBJECT_ID = D.SUBJECT_ID AND DE.HADM_ID = D.HADM_ID WHERE DE.SUBJECT_ID = 1875;",
            "gold_answer": "[['2120-04-22 12:27:00', 'Abn react-surg proc NEC'], ['2120-04-22 12:27:00', 'Hypertension NOS'], ['2120-04-22 12:27:00', 'Injury femoral nerve'], ['2120-04-22 12:27:00', 'Malig neo bladder NEC'], ['2120-04-22 12:27:00', 'Mitral valve disorder'], ['2120-04-22 12:27:00', 'Other postop infection']]",
            "pred_answer": "[['1888.0', '2120-04-22 12:27:00'], ['4019.0', '2120-04-22 12:27:00'], ['4240.0', '2120-04-22 12:27:00'], ['9561.0', '2120-04-22 12:27:00'], ['99859.0', '2120-04-22 12:27:00'], ['E8788', '2120-04-22 12:27:00']]",
            "is_correct": false,
            "reasoning": "The predicted query differs from the ground truth only in the SELECT clause: it returns ICD9_CODE and DISCHTIME, whereas the ground truth returns DISCHTIME and SHORT_TITLE. The discrepancy is purely a column reference/selection error in the SELECT list and does not affect joins, filters, or overall query structure.",
            "error_type": "Local: column-reference error"
        },
        "9b581dcd0f727ee14875356de70bafdd": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "How many female patients use a drug named theophylline sr? (Values: F, Theophylline SR)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"F\" AND PRESCRIPTIONS.\"DRUG\" = \"Theophylline SR\"",
            "pred_sql": "SELECT COUNT(DISTINCT D.SUBJECT_ID) AS FEMALE_PATIENTS USING_THEOPHYLLINE_SR FROM DEMOGRAPHIC D INNER JOIN PRESCRIPTIONS P ON D.SUBJECT_ID = P.SUBJECT_ID AND D.HADM_ID = P.HADM_ID WHERE D.GENDER = 'F' AND P.DRUG = 'Theophylline SR';",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"USING_THEOPHYLLINE_SR\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL fails due to a syntax error in the SELECT clause: it attempts to assign two aliases without proper comma or AS usage (\"AS FEMALE_PATIENTS USING_THEOPHYLLINE_SR\"), which is a localized mistake in aliasing and does not affect the overall query logic or joins.",
            "error_type": "Local: syntax error"
        },
        "8404915c4b01e35617f74cf4e165a482": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Let me know the short title of diagnoses and procedures for the patient with patient id 74463.",
            "gold_sql": "SELECT DIAGNOSES.\"SHORT_TITLE\",PROCEDURES.\"SHORT_TITLE\" FROM DIAGNOSES INNER JOIN PROCEDURES on DIAGNOSES.HADM_ID = PROCEDURES.HADM_ID WHERE DIAGNOSES.\"SUBJECT_ID\" = \"74463\"",
            "pred_sql": "SELECT SHORT_TITLE FROM DIAGNOSES WHERE SUBJECT_ID = 74463 UNION SELECT SHORT_TITLE FROM PROCEDURES WHERE SUBJECT_ID = 74463;",
            "gold_answer": "[['Abn react-artif implant', 'Dx ultrasound-heart'], ['Abn react-artif implant', 'Extracorporeal circulat'], ['Abn react-artif implant', 'Opn/oth rep aort vlv-tis'], ['Aortic valve disorder', 'Dx ultrasound-heart'], ['Aortic valve disorder', 'Extracorporeal circulat'], ['Aortic valve disorder', 'Opn/oth rep aort vlv-tis'], ['Aortocoronary bypass', 'Dx ultrasound-heart'], ['Aortocoronary bypass', 'Extracorporeal circulat'], ['Aortocoronary bypass', 'Opn/oth rep aort vlv-tis'], ['Atrial fibrillation', 'Dx ultrasound-heart'], ['Atrial fibrillation', 'Extracorporeal circulat'], ['Atrial fibrillation', 'Opn/oth rep aort vlv-tis'], ['Crnry athrscl natve vssl', 'Dx ultrasound-heart'], ['Crnry athrscl natve vssl', 'Extracorporeal circulat'], ['Crnry athrscl natve vssl', 'Opn/oth rep aort vlv-tis'], ['DMII wo cmp nt st uncntr', 'Dx ultrasound-heart'], ['DMII wo cmp nt st uncntr', 'Extracorporeal circulat'], ['DMII wo cmp nt st uncntr', 'Opn/oth rep aort vlv-tis'], ['Hyperlipidemia NEC/NOS', 'Dx ultrasound-heart'], ['Hyperlipidemia NEC/NOS', 'Extracorporeal circulat'], ['Hyperlipidemia NEC/NOS', 'Opn/oth rep aort vlv-tis'], ['Hypertension NOS', 'Dx ultrasound-heart'], ['Hypertension NOS', 'Extracorporeal circulat'], ['Hypertension NOS', 'Opn/oth rep aort vlv-tis'], ['Hypoxemia', 'Dx ultrasound-heart'], ['Hypoxemia', 'Extracorporeal circulat'], ['Hypoxemia', 'Opn/oth rep aort vlv-tis'], ['Long-term use anticoagul', 'Dx ultrasound-heart'], ['Long-term use anticoagul', 'Extracorporeal circulat'], ['Long-term use anticoagul', 'Opn/oth rep aort vlv-tis'], ['Old myocardial infarct', 'Dx ultrasound-heart'], ['Old myocardial infarct', 'Extracorporeal circulat'], ['Old myocardial infarct', 'Opn/oth rep aort vlv-tis'], ['Secundum atrial sept def', 'Dx ultrasound-heart'], ['Secundum atrial sept def', 'Extracorporeal circulat'], ['Secundum atrial sept def', 'Opn/oth rep aort vlv-tis'], ['Seroma complicting proc', 'Dx ultrasound-heart'], ['Seroma complicting proc', 'Extracorporeal circulat'], ['Seroma complicting proc', 'Opn/oth rep aort vlv-tis'], ['Status-post ptca', 'Dx ultrasound-heart'], ['Status-post ptca', 'Extracorporeal circulat'], ['Status-post ptca', 'Opn/oth rep aort vlv-tis']]",
            "pred_answer": "[['Abn react-artif implant'], ['Aortic valve disorder'], ['Aortocoronary bypass'], ['Atrial fibrillation'], ['Crnry athrscl natve vssl'], ['DMII wo cmp nt st uncntr'], ['Dx ultrasound-heart'], ['Extracorporeal circulat'], ['Hyperlipidemia NEC/NOS'], ['Hypertension NOS'], ['Hypoxemia'], ['Long-term use anticoagul'], ['Old myocardial infarct'], ['Opn/oth rep aort vlv-tis'], ['Secundum atrial sept def'], ['Seroma complicting proc'], ['Status-post ptca']]",
            "is_correct": false,
            "reasoning": "The predicted SQL replaces the intended INNER JOIN between DIAGNOSES and PROCEDURES with a UNION, fundamentally changing the query\u2019s structure and semantics. Instead of returning paired short titles for diagnoses and procedures per patient stay, it returns a single deduplicated list of titles across both tables. Fixing this requires restructuring the entire query (replacing the UNION with a proper JOIN), so it is not a localized mistake.",
            "error_type": "Global: join error"
        }
    },
    "macsql": {
        "925b64a7b970e5a56de55e7db18fbd8f": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "what is the average age of patients whose language is cape and primary disease is hyperglycemia? (Values: CAPE, HYPERGLYCEMIA)",
            "gold_sql": "SELECT AVG ( DEMOGRAPHIC.\"AGE\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"LANGUAGE\" = \"CAPE\" AND DEMOGRAPHIC.\"DIAGNOSIS\" = \"HYPERGLYCEMIA\"",
            "pred_sql": "SELECT AVG(T1.AGE) AS average_age FROM DEMOGRAPHIC AS T1 INNER JOIN DIAGNOSES AS T2 ON T1.SUBJECT_ID = T2.SUBJECT_ID AND T1.HADM_ID = T2.HADM_ID WHERE T1.LANGUAGE = 'CAPE' AND T2.LONG_TITLE LIKE '%HYPERGLYCEMIA%' AND T1.AGE IS NOT NULL AND T2.LONG_TITLE IS NOT NULL AND T1.LANGUAGE IS NOT NULL",
            "gold_answer": "[['49.0']]",
            "pred_answer": "[['None']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the query\u2019s overall logic by joining the DEMOGRAPHIC table to DIAGNOSES and filtering on DIAGNOSES.LONG_TITLE, whereas the ground truth filters DEMOGRAPHIC.DIAGNOSIS directly. This is not a small syntax mistake but a fundamental change to the query structure and intended semantics\u2014using the wrong table and join instead of filtering the primary diagnosis column. This requires restructuring the query to match the intended meaning, so it is a global error.",
            "error_type": "Global: incorrect join/table usage"
        },
        "a54b66567c23a6ca8e774a4507f148c5": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "give me the lab test item id and lab test abnormal status of patient with patient id 22377.",
            "gold_sql": "SELECT LAB.\"ITEMID\",LAB.\"FLAG\" FROM LAB WHERE LAB.\"SUBJECT_ID\" = \"22377\"",
            "pred_sql": "SELECT ITEMID, FLAG FROM LAB WHERE SUBJECT_ID = 22377 AND FLAG IS NOT NULL",
            "gold_answer": "[['50883.0', 'None'], ['50883.0', 'None'], ['50884.0', 'None'], ['50884.0', 'None'], ['50885.0', 'abnormal'], ['50885.0', 'abnormal']]",
            "pred_answer": "[['50885.0', 'abnormal'], ['50885.0', 'abnormal']]",
            "is_correct": false,
            "reasoning": "The predicted SQL adds an extra filter `AND FLAG IS NOT NULL` in the WHERE clause, which removes rows where FLAG is NULL. The ground truth query returns all lab test statuses (including NULL flags) for SUBJECT_ID = 22377. The mistake is confined to the WHERE clause and does not change the overall query structure or table relationships\u2014just an overly restrictive filter.",
            "error_type": "Local: incorrect WHERE filter"
        },
        "9d5d968951e3f72781e48eabfa97ce79": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "tell me the icu stay id for patient stephanie suchan. (Values: Stephanie Suchan)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"ICUSTAY_ID\" FROM DEMOGRAPHIC INNER JOIN PRESCRIPTIONS on DEMOGRAPHIC.HADM_ID = PRESCRIPTIONS.HADM_ID WHERE DEMOGRAPHIC.\"NAME\" = \"Stephanie Suchan\"",
            "pred_sql": "SELECT ICUSTAY_ID FROM PRESCRIPTIONS WHERE SUBJECT_ID = ( SELECT SUBJECT_ID FROM DEMOGRAPHIC WHERE NAME = 'Stephanie Suchan' ) AND HADM_ID = ( SELECT HADM_ID FROM DEMOGRAPHIC WHERE NAME = 'Stephanie Suchan' ) AND ICUSTAY_ID IS NOT NULL;",
            "gold_answer": "[['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None']]",
            "pred_answer": "[['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0'], ['242681.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL deviates from the ground truth only by adding an extra condition in the WHERE clause (AND ICUSTAY_ID IS NOT NULL), which filters out rows with NULL ICUSTAY_ID. The table joins and overall query structure remain the same; the error is confined to the WHERE clause logic and does not affect relationships between tables.",
            "error_type": "Local: where-clause error"
        },
        "061d620cdd89282af1d48f9a0f2d3931": {
            "db_id": "mimicsql",
            "generator_name": "macsql",
            "question": "get the number of alive patients who underwent open biopsy of soft tissue. (Values: 0, Open biopsy of soft tissue)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN PROCEDURES on DEMOGRAPHIC.HADM_ID = PROCEDURES.HADM_ID WHERE DEMOGRAPHIC.\"EXPIRE_FLAG\" = \"0\" AND PROCEDURES.\"LONG_TITLE\" = \"Open biopsy of soft tissue\"",
            "pred_sql": "SELECT COUNT(*) FROM ( SELECT DISTINCT P.`SUBJECT_ID` FROM PROCEDURES AS P JOIN DEMOGRAPHIC AS D ON P.`SUBJECT_ID` = D.`SUBJECT_ID` AND P.`HADM_ID` = D.`HADM_ID` WHERE P.`ICD9_CODE` = '0' -- Assuming '0' is the ICD-9 code for \"Open biopsy of soft tissue\" AND D.`EXPIRE_FLAG` = 0 ) AS AlivePatients",
            "gold_answer": "[['0.0']]",
            "pred_answer": "incomplete input",
            "is_correct": false,
            "reasoning": "The predicted query fails by filtering on PROCEDURES.ICD9_CODE = '0' instead of PROCEDURES.LONG_TITLE = 'Open biopsy of soft tissue'. This is a misuse of a column/value in the WHERE clause and does not alter the overall join structure or query logic. It is a localized error in the filter condition.",
            "error_type": "Local: table/column reference error"
        }
    },
    "qwen3": {
        "0d8e3bc0c9b32c93056a71cbc2e7882e": {
            "db_id": "mimicsql",
            "generator_name": "qwen3",
            "question": "give the number of patients who were diagnosed with personal history of colonic polyps and lab test result is abnormal. (Values: Personal history of colonic polyps)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN DIAGNOSES on DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DIAGNOSES.\"LONG_TITLE\" = \"Personal history of colonic polyps\" AND LAB.\"FLAG\" = \"abnormal\"",
            "pred_sql": "SELECT COUNT(DISTINCT d.SUBJECT_ID) FROM DIAGNOSES d JOIN LAB l ON d.SUBJECT_ID = l.SUBJECT_ID WHERE d.SHORT_TITLE = 'Personal history of colonic polyps' AND l.FLAG = 'abnormal';",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses SHORT_TITLE instead of the required LONG_TITLE (a wrong column reference) and omits the HADM_ID join condition, joining only on SUBJECT_ID. Both are localized mistakes in column reference and JOIN clause, fixable without restructuring the overall query logic.",
            "error_type": "Local: table/column reference and join-condition error"
        }
    }
}