{
    "llm2sql": {
        "0d2d4b9ce812c7d9805538e58b0de30e": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "what is the number of patients with primary disease abdominal pain who were aged less than 68 years? (Values: ABDOMINAL PAIN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"ABDOMINAL PAIN\" AND DEMOGRAPHIC.\"AGE\" < \"68\"",
            "pred_sql": "SELECT COUNT(DISTINCT DEMOGRAPHIC.SUBJECT_ID) FROM DEMOGRAPHIC JOIN DIAGNOSES ON DEMOGRAPHIC.SUBJECT_ID = DIAGNOSES.SUBJECT_ID WHERE (DIAGNOSES.SHORT_TITLE LIKE '%ABDOMINAL PAIN%' OR DIAGNOSES.LONG_TITLE LIKE '%ABDOMINAL PAIN%') AND DEMOGRAPHIC.AGE < 68;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL changes the fundamental logic by joining with the DIAGNOSES table and filtering on SHORT_TITLE/LONG_TITLE rather than using the DEMOGRAPHIC.DIAGNOSIS column for primary disease. This join and filter shift alters the intended meaning (primary disease field vs. any diagnosis) and leads to different results. Fixing this requires restructuring the query, not just a local tweak.",
            "error_type": "Global: incorrect join error"
        },
        "0d78e61ca912d643a9233b60b95f4b40": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "What is the primary disease of Kelly Gallardo?",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Kelly Gallardo\"",
            "pred_sql": "SELECT D.LONG_TITLE FROM DIAGNOSES D INNER JOIN DEMOGRAPHIC DH ON D.SUBJECT_ID = DH.SUBJECT_ID WHERE DH.NAME = 'Kelly Gallardo';",
            "gold_answer": "[['NEWBORN']]",
            "pred_answer": "[['35-36 completed weeks of gestation'], ['Need for prophylactic vaccination and inoculation against viral hepatitis'], ['Observation for suspected infectious condition'], ['Other preterm infants, 2,000-2,499 grams'], ['Primary apnea of newborn'], ['Single liveborn, born in hospital, delivered by cesarean section']]",
            "is_correct": false,
            "reasoning": "The predicted query fundamentally misinterprets the source of the \u201cprimary disease\u201d field. Instead of selecting the DIAGNOSIS column from the DEMOGRAPHIC table (which holds the primary disease), it joins to the DIAGNOSES table and retrieves all matching LONG_TITLE entries. This is not a minor syntax or alias mistake but a structural error: the wrong table is used and the join logic is flawed, leading to unintended many-row results rather than the single primary disease value.",
            "error_type": "Global: incorrect-table-join"
        },
        "8762eb0a5667497e60e00c3d154d04a5": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "how many patients with infected right thigh graft were of american indian/alaska native ethnicty? (Values: AMERICAN INDIAN/ALASKA NATIVE, INFECTED RIGHT THIGH GRAFT)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ETHNICITY\" = \"AMERICAN INDIAN/ALASKA NATIVE\" AND DEMOGRAPHIC.\"DIAGNOSIS\" = \"INFECTED RIGHT THIGH GRAFT\"",
            "pred_sql": "SELECT COUNT(DISTINCT DEMOGRAPHIC.SUBJECT_ID) nFROM DEMOGRAPHIC nINNER JOIN DIAGNOSES ON DEMOGRAPHIC.HADM_ID = DIAGNOSES.HADM_ID nWHERE DEMOGRAPHIC.ETHNICITY = 'AMERICAN INDIAN/ALASKA NATIVE' nAND (DIAGNOSES.LONG_TITLE = 'INFECTED RIGHT THIGH GRAFT' nOR DIAGNOSES.SHORT_TITLE = 'INFECTED RIGHT THIGH GRAFT')",
            "gold_answer": "[['0.0']]",
            "pred_answer": "near \"DEMOGRAPHIC\": syntax error",
            "is_correct": false,
            "reasoning": "The predicted SQL has a syntax error due to the stray 'n' before FROM and INNER JOIN (i.e., 'nFROM', 'nINNER JOIN'), causing SQLite to throw a syntax error. This is a localized mistake in the SELECT/JOIN clause formatting and does not reflect a deeper logical or structural misunderstanding.",
            "error_type": "Local: syntax error"
        },
        "8e5b3b23c0faa725dddd16452c1d83cd": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "Find out the number of patients with a newborn primary disease. (Values: NEWBORN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"NEWBORN\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE SHORT_TITLE LIKE '%NEWBORN%' OR LONG_TITLE LIKE '%NEWBORN%';",
            "gold_answer": "[['22.0']]",
            "pred_answer": "[['7.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL pulls from the DIAGNOSES table and uses LIKE on SHORT_TITLE and LONG_TITLE, whereas the question and ground truth use the DEMOGRAPHIC table\u2019s DIAGNOSIS column for an exact match. This changes the overall logic and data source, not just a minor clause, resulting in different patient counts. The error spans the core query structure and intended meaning.",
            "error_type": "Global: incorrect table and logic"
        },
        "02c34ef8864566dbd0a9c9ad006c1b21": {
            "db_id": "mimicsql",
            "generator_name": "llm2sql",
            "question": "find the primary disease and admission time of subject id 813.",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\",DEMOGRAPHIC.\"ADMITTIME\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"SUBJECT_ID\" = \"813\"",
            "pred_sql": "SELECT DIAGNOSES.LONG_TITLE AS primary_disease, DEMOGRAPHIC.ADMITTIME AS admission_time FROM DIAGNOSES INNER JOIN DEMOGRAPHIC ON DIAGNOSES.SUBJECT_ID = DEMOGRAPHIC.SUBJECT_ID WHERE DIAGNOSES.SUBJECT_ID = 813;",
            "gold_answer": "[['GASTROINTESTINAL BLEED', '2179-12-15 18:01:00']]",
            "pred_answer": "[['Acute myocardial infarction of other inferior wall, initial episode of care', '2179-12-15 18:01:00'], ['Atrial fibrillation', '2179-12-15 18:01:00'], ['Cardiac complications, not elsewhere classified', '2179-12-15 18:01:00'], ['Congestive heart failure, unspecified', '2179-12-15 18:01:00'], ['Coronary atherosclerosis of native coronary artery', '2179-12-15 18:01:00'], ['Diverticulosis of colon (without mention of hemorrhage)', '2179-12-15 18:01:00'], ['Hemorrhage of gastrointestinal tract, unspecified', '2179-12-15 18:01:00'], ['Malignant neoplasm of ascending colon', '2179-12-15 18:01:00'], ['Pneumonia, organism unspecified', '2179-12-15 18:01:00']]",
            "is_correct": false,
            "reasoning": "The predicted SQL fundamentally changes the query\u2019s logic by pulling from the DIAGNOSES table instead of using the DEMOGRAPHIC.DIAGNOSIS column for the primary disease, and by joining only on SUBJECT_ID (omitting HADM_ID), it returns multiple diagnosis rows rather than a single primary disease. This is not a minor syntax or reference mistake but a flawed join strategy and table choice that alters the intended meaning of the query.",
            "error_type": "Global: incorrect join"
        }
    },
    "codes": {
        "8e4f2450d232947ef620cb4b261579f2": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "give the lab test results of patient id 2560.",
            "gold_sql": "SELECT LAB.\"FLAG\" FROM LAB WHERE LAB.\"SUBJECT_ID\" = \"2560\"",
            "pred_sql": "SELECT label, value_unit FROM lab WHERE subject_id = 2560",
            "gold_answer": "[['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['None'], ['abnormal'], ['abnormal'], ['abnormal'], ['abnormal'], ['abnormal'], ['abnormal']]",
            "pred_answer": "[['Atypical Lymphocytes', '0%'], ['Bands', '3%'], ['Basophils', '0%'], ['Bilirubin, Direct', '0.3mg/dL'], ['Bilirubin, Indirect', '2.3mg/dL'], ['Bilirubin, Total', '2.6mg/dL'], ['Eosinophils', '0%'], ['Hematocrit', '48.7%'], ['Hemoglobin', '15.6g/dL'], ['Lymphocytes', '19%'], ['MCH', '36.7pg'], ['MCHC', '32.0%'], ['MCV', '115fL'], ['Metamyelocytes', '0%'], ['Monocytes', '9%'], ['Myelocytes', '0%'], ['Neutrophils', '69%'], ['Nucleated Red Cells', '3%'], ['Platelet Count', '334K/uL'], ['RDW', '17.0%'], ['Red Blood Cells', '4.24m/uL'], ['White Blood Cells', '13.0K/uL']]",
            "is_correct": false,
            "reasoning": "The predicted SQL selects the LABEL and VALUE_UNIT columns instead of the FLAG column, which the question and ground truth specify. This is a column reference error in the SELECT clause that does not change the overall query structure or table relationships.",
            "error_type": "Local: table/column reference error"
        },
        "95467eb799726ac08b222ad6b2fa9fc8": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Specify the total number of male patients with item id 51148 (Values: M)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"GENDER\" = \"M\" AND LAB.\"ITEMID\" = \"51148\"",
            "pred_sql": "SELECT count(subject_id) FROM lab WHERE itemid = 51148 AND value LIKE 'M%'",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such column: value",
            "is_correct": false,
            "reasoning": "The predicted SQL references a non-existent column 'value' in the LAB table (the actual column is VALUE_UNIT). This is a simple column reference error and does not affect overall query logic or structure.",
            "error_type": "Local: table/column reference error"
        },
        "96a65966374941a10a74e3436a43aadd": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "Count the number of newborn patients whose lab test fluid is blood (Values: NEWBORN, Blood)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"NEWBORN\" AND LAB.\"FLUID\" = \"Blood\"",
            "pred_sql": "SELECT count(lab.hadm_id) FROM lab INNER JOIN demographic ON lab.hadm_id = demographic.hadm_id WHERE demographic.name = 'NEWBORN' AND lab.fluid = 'Blood'",
            "gold_answer": "[['22.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses demographic.name = 'NEWBORN' instead of the correct demographic.DIAGNOSIS = 'NEWBORN', and it counts lab.hadm_id rather than counting distinct subject IDs. These are local mistakes in column references and aggregation that do not alter the overall query structure or required joins.",
            "error_type": "Local: table/column reference error"
        },
        "bb33d9ea342c4d53171831ac967d5204": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "find out the type of admission patient jerry deberry had. (Values: Jerry Deberry)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"ADMISSION_TYPE\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Jerry Deberry\"",
            "pred_sql": "SELECT admission_type FROM demographic WHERE name = 'J<NAME>'",
            "gold_answer": "[['EMERGENCY']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL simply uses an incorrect literal in the WHERE clause (\u2018J<NAME>\u2019 instead of \u2018Jerry Deberry\u2019), causing no rows to match. This is a localized mistake in the value parsing of the condition and does not affect the overall query structure or logic.",
            "error_type": "Local: value parsing error"
        },
        "9ff64e587978e15c158f7b6b80563161": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients are diagnosed with primary disease upper gi bleed and are born before 2112? (Values: UPPER GI BLEED)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"UPPER GI BLEED\" AND DEMOGRAPHIC.\"DOB_YEAR\" < \"2112\"",
            "pred_sql": "SELECT count(DISTINCT demographic.subject_id) FROM demographic INNER JOIN diagnoses ON demographic.subject_id = diagnoses.subject_id WHERE diagnoses.short_title = 'UPPER GI BLEED' AND demographic.dob_year < 2112",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The ground truth query filters patients based on the primary disease stored in the DEMOGRAPHIC.DIAGNOSIS column. The predicted query instead joins to the DIAGNOSES table on diagnoses.short_title, thus using secondary diagnoses rather than the primary diagnosis field. This is not a simple column typo or missing alias but a fundamentally different join strategy that changes the logic of which patients are counted.",
            "error_type": "Global: incorrect join/table usage"
        },
        "a8ed9d698cc466a86e52507edcf4e5df": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "What is the number of patients born before 2120 who had urine lab tests? (Values: Urine)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE DEMOGRAPHIC.\"DOB_YEAR\" < \"2120\" AND LAB.\"FLUID\" = \"Urine\"",
            "pred_sql": "SELECT count(DISTINCT lab.subject_id) FROM lab INNER JOIN demographic ON lab.subject_id = demographic.subject_id WHERE demographic.dob_year < 2120",
            "gold_answer": "[['48.0']]",
            "pred_answer": "[['67.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL omits the condition LAB.FLUID = 'Urine' from the WHERE clause, which is a missing filter on the lab test fluid type. This is a localized issue within the WHERE clause and does not require restructuring joins or subqueries; it can be fixed by adding the missing predicate.",
            "error_type": "Local: missing WHERE predicate"
        },
        "0dc83447bac46f820dda4a5f23a89502": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients born before 2078 are discharged to short term hospital? (Values: SHORT TERM HOSPITAL)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DISCHARGE_LOCATION\" = \"SHORT TERM HOSPITAL\" AND DEMOGRAPHIC.\"DOB_YEAR\" < \"2078\"",
            "pred_sql": "SELECT count(subject_id) FROM demographic WHERE dob_year < 2078",
            "gold_answer": "[['0.0']]",
            "pred_answer": "[['34.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only applies the dob_year filter and omits the discharge_location condition entirely. This is an error confined to the WHERE clause (missing filter) and does not require restructuring joins or subqueries.",
            "error_type": "Local: missing where condition"
        },
        "a042f037d40f6ca5ddaa6b3b1cd2d4fb": {
            "db_id": "mimicsql",
            "generator_name": "codes",
            "question": "how many patients were tested for triiodothyronine (t3)? (Values: Triiodothyronine (T3))",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC INNER JOIN LAB on DEMOGRAPHIC.HADM_ID = LAB.HADM_ID WHERE LAB.\"LABEL\" = \"Triiodothyronine (T3)\"",
            "pred_sql": "SELECT count(subject_id) FROM lab WHERE label = 'Triiodothyronine (T3)'",
            "gold_answer": "[['2.0']]",
            "pred_answer": "[['4.0']]",
            "is_correct": false,
            "reasoning": "The predicted query counts all lab records for Triiodothyronine (T3) (count(subject_id)) rather than the number of unique patients. It omits the DISTINCT qualifier on subject_id, leading to duplicate counts, but the overall query structure (one table, one WHERE clause) remains correct. This is a localized mistake in the aggregation rather than a flaw in the query\u2019s logic or joins.",
            "error_type": "Local: missing-distinct error"
        }
    },
    "deepseek": {
        "827507e01ab3afc178dc211fd3c77e6e": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "How many patients with an american indian/alaska native ethnic background were born before 2129? (Values: AMERICAN INDIAN/ALASKA NATIVE)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ETHNICITY\" = \"AMERICAN INDIAN/ALASKA NATIVE\" AND DEMOGRAPHIC.\"DOB_YEAR\" < \"2129\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DEMOGRAPHIC WHERE ETHNICITY = 'AMERICAN INDIAN/ALASKA NATIVE' AND YEAR(DOB) < 2129;",
            "gold_answer": "[['0.0']]",
            "pred_answer": "no such function: YEAR",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the YEAR(DOB) function, which does not exist in SQLite, resulting in a 'no such function: YEAR' error. This is a localized issue within the WHERE clause\u2019s date handling and does not affect the overall query structure or table relationships.",
            "error_type": "Local: other-temporal error"
        },
        "9f47c8570c1f03b0c2ced60a72ab7677": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "find the diagnostic decription of diagnoses icd9 code v202. (Values: V202)",
            "gold_sql": "SELECT DIAGNOSES.\"LONG_TITLE\" FROM DIAGNOSES WHERE DIAGNOSES.\"ICD9_CODE\" = \"V202\"",
            "pred_sql": "SELECT SHORT_TITLE, LONG_TITLE FROM DIAGNOSES WHERE ICD9_CODE = 'V202';",
            "gold_answer": "[['Routine infant or child health check'], ['Routine infant or child health check']]",
            "pred_answer": "[['Routin child health exam', 'Routine infant or child health check'], ['Routin child health exam', 'Routine infant or child health check']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only differs from the ground truth in the SELECT clause: it returns both SHORT_TITLE and LONG_TITLE instead of only LONG_TITLE. The WHERE clause and table are correct, and no joins or logic are altered. This is a localized mistake in the selected columns and does not affect the overall query structure or relationships.",
            "error_type": "Local: wrong-selection error"
        },
        "089d4aad2ec39bb2d761af30e107414a": {
            "db_id": "mimicsql",
            "generator_name": "deepseek",
            "question": "Get me the number of white russian patients born before year 2103. (Values: WHITE - RUSSIAN)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"ETHNICITY\" = \"WHITE - RUSSIAN\" AND DEMOGRAPHIC.\"DOB_YEAR\" < \"2103\"",
            "pred_sql": "SELECT COUNT(SUBJECT_ID) AS NUMBER_OF_PATIENTS FROM DEMOGRAPHIC WHERE ETHNICITY = 'WHITE' AND DOB_YEAR < 2103;",
            "gold_answer": "[['1.0']]",
            "pred_answer": "[['41.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL only filters for ETHNICITY = 'WHITE' instead of the exact value 'WHITE - RUSSIAN' specified in the question. This is a mistake in the WHERE clause literal value and does not alter the overall query structure or join logic. It can be fixed by changing the string literal to the correct ethnicity value.",
            "error_type": "Local: value parsing error"
        }
    },
    "o4-mini": {
        "895ca1f9dc05114c51436d4c28f1dbaa": {
            "db_id": "mimicsql",
            "generator_name": "o4-mini",
            "question": "specify complete details of icd9 code 4591",
            "gold_sql": "SELECT PROCEDURES.\"SHORT_TITLE\",PROCEDURES.\"LONG_TITLE\" FROM PROCEDURES WHERE PROCEDURES.\"ICD9_CODE\" = \"4591\"",
            "pred_sql": "SELECT * FROM DIAGNOSES WHERE ICD9_CODE = '4591';",
            "gold_answer": "[['Sm-to-sm bowel anastom', 'Small-to-small intestinal anastomosis']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL queries the DIAGNOSES table instead of the PROCEDURES table specified by the question. This is a simple table reference error: changing the table name to PROCEDURES would fix the query without altering its overall structure or logic.",
            "error_type": "Local: table reference error"
        }
    },
    "dinsql": {
        "0cb83c2bc10e573ed3e25a658d8318e4": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "what number of patients have been diagnosed with hyperglycemia? (Values: HYPERGLYCEMIA)",
            "gold_sql": "SELECT COUNT ( DISTINCT DEMOGRAPHIC.\"SUBJECT_ID\" ) FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"DIAGNOSIS\" = \"HYPERGLYCEMIA\"",
            "pred_sql": "SELECT COUNT(DISTINCT SUBJECT_ID) FROM DIAGNOSES WHERE LONG_TITLE LIKE '%HYPERGLYCEMIA%'",
            "gold_answer": "[['3.0']]",
            "pred_answer": "[['0.0']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the DIAGNOSES table and filters on LONG_TITLE with a LIKE condition, while the ground truth uses the DEMOGRAPHIC table\u2019s DIAGNOSIS column for an exact match. This is not a simple fix within a clause\u2014it fundamentally changes which table is queried and how diagnoses are counted, altering the overall query logic.",
            "error_type": "Global: incorrect table selection"
        },
        "0a7ebbf361bf96cd1fcfb073368908b5": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "find the primary disease of robert clayton. (Values: Robert Clayton)",
            "gold_sql": "SELECT DEMOGRAPHIC.\"DIAGNOSIS\" FROM DEMOGRAPHIC WHERE DEMOGRAPHIC.\"NAME\" = \"Robert Clayton\"",
            "pred_sql": "SELECT d.LONG_TITLE FROM DEMOGRAPHIC dem JOIN DIAGNOSES d ON dem.SUBJECT_ID = d.SUBJECT_ID AND dem.HADM_ID = d.HADM_ID WHERE dem.NAME = 'Robert Clayton' GROUP BY d.LONG_TITLE ORDER BY COUNT(*) DESC LIMIT 1",
            "gold_answer": "[['ATRIAL FIBRILLATION\\\\THORACOSCOPIC MAZE PROCEDURE BILATERAL/SDA']]",
            "pred_answer": "[['Personal history of surgery to other organs']]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the DIAGNOSES table and aggregates LONG_TITLE via a JOIN and GROUP BY, whereas the ground truth simply selects the DIAGNOSIS column from the DEMOGRAPHIC table. This is not a minor syntax or column reference mistake but a fundamentally different strategy: it joins an unrelated table, groups results, and picks the most frequent LONG_TITLE rather than directly retrieving the DEMOGRAPHIC.DIAGNOSIS. This alters the intended logic and table relationships, requiring a restructuring of the query beyond a single clause fix.",
            "error_type": "Global: join error"
        },
        "8e58c53ed2c7d9da3e3d7bb4d73cfdbe": {
            "db_id": "mimicsql",
            "generator_name": "dinsql",
            "question": "find out mor10l medications type and route of administration. (Values: MOR10L)",
            "gold_sql": "SELECT PRESCRIPTIONS.\"DRUG_TYPE\",PRESCRIPTIONS.\"ROUTE\" FROM PRESCRIPTIONS WHERE PRESCRIPTIONS.\"FORMULARY_DRUG_CD\" = \"MOR10L\"",
            "pred_sql": "SELECT DISTINCT DRUG_TYPE, ROUTE FROM PRESCRIPTIONS WHERE DRUG = 'MOR10L'",
            "gold_answer": "[['MAIN', 'PO'], ['MAIN', 'PO'], ['MAIN', 'PO/NG']]",
            "pred_answer": "[]",
            "is_correct": false,
            "reasoning": "The predicted SQL uses the DRUG column in the WHERE clause instead of the FORMULARY_DRUG_CD column specified by the question. This is a column reference error in a single clause and does not require changing the overall structure or logic of the query.",
            "error_type": "Local: table/column reference error"
        }
    }
}