[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Autoimmune hepatitis (AIH)",
            "Rheumatoid arthritis (RA)",
            "Systemic lupus erythematosus (SLE)",
            "Multiple sclerosis (MS)",
            "Type 1 diabetes mellitus (T1DM)",
            "Graves' disease",
            "Hashimoto's thyroiditis",
            "Vitiligo",
            "Pernicious anemia",
            "Myasthenia gravis",
            "Sj\u00f6gren's syndrome",
            "Psoriasis",
            "Addison's disease",
            "Ulcerative colitis",
            "Crohn's disease",
            "Chronic lymphocytic thyroiditis",
            "Primary biliary cholangitis (PBC)",
            "Primary sclerosing cholangitis (PSC)",
            "Idiopathic thrombocytopenic purpura (ITP)",
            "Autoimmune hemolytic anemia (AIHA)",
            "Autoimmune thrombocytopenia",
            "Autoimmune nephritis",
            "Autoimmune hepatitis overlap syndrome",
            "Autoimmune pancreatitis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Autoimmune hepatitis (AIH)",
                "Rheumatoid arthritis (RA)",
                "Systemic lupus erythematosus (SLE)",
                "Multiple sclerosis (MS)",
                "Type 1 diabetes mellitus (T1DM)",
                "Graves' disease",
                "Hashimoto's thyroiditis",
                "Vitiligo",
                "Pernicious anemia",
                "Myasthenia gravis",
                "Sj\u00f6gren's syndrome",
                "Psoriasis",
                "Addison's disease",
                "Ulcerative colitis",
                "Crohn's disease",
                "Chronic lymphocytic thyroiditis",
                "Primary biliary cholangitis (PBC)",
                "Primary sclerosing cholangitis (PSC)",
                "Idiopathic thrombocytopenic purpura (ITP)",
                "Autoimmune hemolytic anemia (AIHA)"
            ],
            "mismatches": [
                "Autoimmune thrombocytopenia",
                "Autoimmune nephritis",
                "Autoimmune hepatitis overlap syndrome",
                "Autoimmune pancreatitis"
            ],
            "true_referents": [
                "Addison's disease",
                "Autoimmune hemolytic anemia (AIHA)",
                "Autoimmune hepatitis (AIH)",
                "Autoimmune hepatitis overlap syndrome",
                "Autoimmune nephritis",
                "Autoimmune pancreatitis",
                "Autoimmune thrombocytopenia",
                "Chronic lymphocytic thyroiditis",
                "Crohn's disease",
                "Graves' disease",
                "Hashimoto's thyroiditis",
                "Idiopathic thrombocytopenic purpura (ITP)",
                "Multiple sclerosis (MS)",
                "Myasthenia gravis",
                "Pernicious anemia",
                "Primary biliary cholangitis (PBC)",
                "Primary sclerosing cholangitis (PSC)",
                "Psoriasis",
                "Rheumatoid arthritis (RA)",
                "Sj\u00f6gren's syndrome",
                "Systemic lupus erythematosus (SLE)",
                "Type 1 diabetes mellitus (T1DM)",
                "Ulcerative colitis",
                "Vitiligo"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Type 1 Diabetes Mellitus (T1DM)",
            "Multiple Sclerosis (MS)",
            "Graves' Disease",
            "Myasthenia Gravis",
            "Inflammatory Bowel Disease (IBD)",
            "Hashimoto's Thyroiditis",
            "Sj\u00f6gren's Syndrome",
            "Vitiligo",
            "Psoriasis",
            "Addison's Disease",
            "Scleroderma",
            "Polymyositis",
            "Dermatomyositis",
            "Antiphospholipid Syndrome (APS)",
            "Guillain-Barr\u00e9 Syndrome",
            "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
            "Bullous Pemphigoid",
            "Pemphigus Vulgaris",
            "Celiac Disease",
            "Ulcerative Colitis",
            "Crohn's Disease",
            "Autoimmune Hepatitis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Multiple Sclerosis (MS)",
                "Graves' Disease",
                "Myasthenia Gravis",
                "Inflammatory Bowel Disease (IBD)",
                "Hashimoto's Thyroiditis",
                "Sj\u00f6gren's Syndrome",
                "Vitiligo",
                "Psoriasis",
                "Addison's Disease",
                "Scleroderma",
                "Polymyositis",
                "Dermatomyositis",
                "Antiphospholipid Syndrome (APS)",
                "Guillain-Barr\u00e9 Syndrome",
                "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
                "Bullous Pemphigoid",
                "Pemphigus Vulgaris",
                "Celiac Disease",
                "Ulcerative Colitis",
                "Crohn's Disease",
                "Autoimmune Hepatitis"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's Disease",
                "Antiphospholipid Syndrome (APS)",
                "Autoimmune Hepatitis",
                "Bullous Pemphigoid",
                "Celiac Disease",
                "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
                "Crohn's Disease",
                "Dermatomyositis",
                "Graves' Disease",
                "Guillain-Barr\u00e9 Syndrome",
                "Hashimoto's Thyroiditis",
                "Inflammatory Bowel Disease (IBD)",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis",
                "Pemphigus Vulgaris",
                "Polymyositis",
                "Psoriasis",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's Syndrome",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Ulcerative Colitis",
                "Vitiligo"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Type 1 Diabetes Mellitus",
            "Hashimoto's Thyroiditis",
            "Graves' Disease",
            "Multiple Sclerosis (MS)",
            "Sj\u00f6gren's Syndrome",
            "Autoimmune Hemolytic Anemia (AIHA)",
            "Myasthenia Gravis",
            "Pernicious Anemia",
            "Celiac Disease",
            "Addison's Disease",
            "Autoimmune Hepatitis",
            "Guillain-Barr\u00e9 Syndrome",
            "Vasculitis",
            "Goodpasture Syndrome",
            "Pemphigus",
            "Bullous Pemphigoid",
            "Autoimmune Thrombocytopenic Purpura (ITP)",
            "Autoimmune Oophoritis",
            "Autoimmune Orchitis",
            "Autoimmune Encephalitis",
            "Autoimmune Myocarditis",
            "Autoimmune Pancreatitis",
            "Autoimmune Uveitis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Type 1 Diabetes Mellitus",
                "Hashimoto's Thyroiditis",
                "Graves' Disease",
                "Multiple Sclerosis (MS)",
                "Sj\u00f6gren's Syndrome",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Myasthenia Gravis",
                "Pernicious Anemia",
                "Celiac Disease",
                "Addison's Disease",
                "Autoimmune Hepatitis",
                "Guillain-Barr\u00e9 Syndrome",
                "Vasculitis",
                "Goodpasture Syndrome",
                "Pemphigus",
                "Bullous Pemphigoid",
                "Autoimmune Thrombocytopenic Purpura (ITP)",
                "Autoimmune Oophoritis",
                "Autoimmune Orchitis",
                "Autoimmune Encephalitis",
                "Autoimmune Myocarditis",
                "Autoimmune Pancreatitis"
            ],
            "mismatches": [
                "Autoimmune Uveitis"
            ],
            "true_referents": [
                "Addison's Disease",
                "Autoimmune Encephalitis",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Autoimmune Hepatitis",
                "Autoimmune Myocarditis",
                "Autoimmune Oophoritis",
                "Autoimmune Orchitis",
                "Autoimmune Pancreatitis",
                "Autoimmune Thrombocytopenic Purpura (ITP)",
                "Bullous Pemphigoid",
                "Celiac Disease",
                "Goodpasture Syndrome",
                "Graves' Disease",
                "Guillain-Barr\u00e9 Syndrome",
                "Hashimoto's Thyroiditis",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis",
                "Pemphigus",
                "Pernicious Anemia",
                "Rheumatoid Arthritis (RA)",
                "Sj\u00f6gren's Syndrome",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus",
                "Vasculitis"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Type 1 Diabetes Mellitus (T1DM)",
            "Multiple Sclerosis (MS)",
            "Hashimoto's Thyroiditis (HT)",
            "Graves' Disease (GD)",
            "Psoriasis (Ps)",
            "Inflammatory Bowel Disease - Crohn's Disease (IBD-CD)",
            "Inflammatory Bowel Disease - Ulcerative Colitis (IBD-UC)",
            "Autoimmune Hemolytic Anemia (AIHA)",
            "Idiopathic Thrombocytopenic Purpura (ITP)",
            "Goodpasture's Syndrome (GPS)",
            "Myasthenia Gravis (MG)",
            "Guillain-Barr\u00e9 Syndrome (GBS)",
            "Primary Biliary Cholangitis (PBC)",
            "Primary Sclerosing Cholangitis (PSC)",
            "Sj\u00f6gren's Syndrome (SS)",
            "Addison's Disease (AD)",
            "Celiac Disease (CD)",
            "Vitiligo (Vit)",
            "Pemphigus Vulgaris (PV)",
            "Bullous Pemphigoid (BP)",
            "Antiphospholipid Syndrome (APS)",
            "Vasculitis - Granulomatosis with Polyangiitis (GPA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Multiple Sclerosis (MS)",
                "Hashimoto's Thyroiditis (HT)",
                "Graves' Disease (GD)",
                "Psoriasis (Ps)",
                "Inflammatory Bowel Disease - Crohn's Disease (IBD-CD)",
                "Inflammatory Bowel Disease - Ulcerative Colitis (IBD-UC)",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Goodpasture's Syndrome (GPS)",
                "Myasthenia Gravis (MG)",
                "Guillain-Barr\u00e9 Syndrome (GBS)",
                "Primary Biliary Cholangitis (PBC)",
                "Primary Sclerosing Cholangitis (PSC)",
                "Sj\u00f6gren's Syndrome (SS)",
                "Addison's Disease (AD)",
                "Celiac Disease (CD)",
                "Vitiligo (Vit)",
                "Pemphigus Vulgaris (PV)",
                "Bullous Pemphigoid (BP)",
                "Antiphospholipid Syndrome (APS)",
                "Vasculitis - Granulomatosis with Polyangiitis (GPA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's Disease (AD)",
                "Antiphospholipid Syndrome (APS)",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Bullous Pemphigoid (BP)",
                "Celiac Disease (CD)",
                "Goodpasture's Syndrome (GPS)",
                "Graves' Disease (GD)",
                "Guillain-Barr\u00e9 Syndrome (GBS)",
                "Hashimoto's Thyroiditis (HT)",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Inflammatory Bowel Disease - Crohn's Disease (IBD-CD)",
                "Inflammatory Bowel Disease - Ulcerative Colitis (IBD-UC)",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis (MG)",
                "Pemphigus Vulgaris (PV)",
                "Primary Biliary Cholangitis (PBC)",
                "Primary Sclerosing Cholangitis (PSC)",
                "Psoriasis (Ps)",
                "Rheumatoid Arthritis (RA)",
                "Sj\u00f6gren's Syndrome (SS)",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Vasculitis - Granulomatosis with Polyangiitis (GPA)",
                "Vitiligo (Vit)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Type 1 Diabetes Mellitus (T1DM)",
            "Graves' Disease",
            "Hashimoto's Thyroiditis",
            "Multiple Sclerosis (MS)",
            "Psoriasis",
            "Ankylosing Spondylitis",
            "Celiac Disease",
            "Sj\u00f6gren's Syndrome",
            "Myasthenia Gravis (MG)",
            "Pemphigus Vulgaris",
            "Autoimmune Hemolytic Anemia (AIHA)",
            "Idiopathic Thrombocytopenic Purpura (ITP)",
            "Addison's Disease",
            "Pernicious Anemia",
            "Vasculitis",
            "Scleroderma",
            "Polymyositis",
            "Dermatomyositis",
            "Goodpasture's Syndrome",
            "Antiphospholipid Syndrome",
            "Autoimmune Hepatitis",
            "Wegener's Granulomatosis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Graves' Disease",
                "Hashimoto's Thyroiditis",
                "Multiple Sclerosis (MS)",
                "Psoriasis",
                "Ankylosing Spondylitis",
                "Celiac Disease",
                "Sj\u00f6gren's Syndrome",
                "Myasthenia Gravis (MG)",
                "Pemphigus Vulgaris",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Addison's Disease",
                "Pernicious Anemia",
                "Vasculitis",
                "Scleroderma",
                "Polymyositis",
                "Dermatomyositis",
                "Goodpasture's Syndrome",
                "Antiphospholipid Syndrome",
                "Autoimmune Hepatitis",
                "Wegener's Granulomatosis"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's Disease",
                "Ankylosing Spondylitis",
                "Antiphospholipid Syndrome",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Autoimmune Hepatitis",
                "Celiac Disease",
                "Dermatomyositis",
                "Goodpasture's Syndrome",
                "Graves' Disease",
                "Hashimoto's Thyroiditis",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis (MG)",
                "Pemphigus Vulgaris",
                "Pernicious Anemia",
                "Polymyositis",
                "Psoriasis",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's Syndrome",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Vasculitis",
                "Wegener's Granulomatosis"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Hashimoto's Thyroiditis",
            "Graves' Disease",
            "Multiple Sclerosis (MS)",
            "Type 1 Diabetes Mellitus",
            "Pernicious Anemia",
            "Sj\u00f6gren's Syndrome",
            "Myasthenia Gravis",
            "Celiac Disease",
            "Autoimmune Hepatitis",
            "Dermatomyositis",
            "Vasculitis",
            "Psoriasis",
            "Ankylosing Spondylitis",
            "Guillain-Barr\u00e9 Syndrome",
            "Alopecia Areata",
            "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
            "Scleroderma",
            "Antiphospholipid Syndrome",
            "Beh\u00e7et's Disease",
            "Idiopathic Thrombocytopenic Purpura (ITP)",
            "Crohn's Disease",
            "Ulcerative Colitis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Hashimoto's Thyroiditis",
                "Graves' Disease",
                "Multiple Sclerosis (MS)",
                "Type 1 Diabetes Mellitus",
                "Pernicious Anemia",
                "Sj\u00f6gren's Syndrome",
                "Myasthenia Gravis",
                "Celiac Disease",
                "Autoimmune Hepatitis",
                "Dermatomyositis",
                "Vasculitis",
                "Psoriasis",
                "Ankylosing Spondylitis",
                "Guillain-Barr\u00e9 Syndrome",
                "Alopecia Areata",
                "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
                "Scleroderma",
                "Antiphospholipid Syndrome",
                "Beh\u00e7et's Disease",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Crohn's Disease",
                "Ulcerative Colitis"
            ],
            "mismatches": [],
            "true_referents": [
                "Alopecia Areata",
                "Ankylosing Spondylitis",
                "Antiphospholipid Syndrome",
                "Autoimmune Hepatitis",
                "Beh\u00e7et's Disease",
                "Celiac Disease",
                "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
                "Crohn's Disease",
                "Dermatomyositis",
                "Graves' Disease",
                "Guillain-Barr\u00e9 Syndrome",
                "Hashimoto's Thyroiditis",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis",
                "Pernicious Anemia",
                "Psoriasis",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's Syndrome",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus",
                "Ulcerative Colitis",
                "Vasculitis"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Hashimoto's Thyroiditis",
            "Graves' Disease",
            "Type 1 Diabetes Mellitus",
            "Multiple Sclerosis (MS)",
            "Psoriasis",
            "Sjogren's Syndrome",
            "Addison's Disease",
            "Pernicious Anemia",
            "Celiac Disease",
            "Vitiligo",
            "Guillain-Barre Syndrome",
            "Goodpasture's Syndrome",
            "Autoimmune Hepatitis",
            "Myasthenia Gravis",
            "Autoimmune Uveitis",
            "Autoimmune Hemolytic Anemia",
            "Autoimmune Thrombocytopenic Purpura",
            "Autoimmune Lymphoproliferative Syndrome",
            "Autoimmune Encephalitis",
            "Autoimmune Pancreatitis",
            "Autoimmune Inner Ear Disease (AIED)",
            "Scleroderma"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Hashimoto's Thyroiditis",
                "Graves' Disease",
                "Type 1 Diabetes Mellitus",
                "Multiple Sclerosis (MS)",
                "Psoriasis",
                "Sjogren's Syndrome",
                "Addison's Disease",
                "Pernicious Anemia",
                "Celiac Disease",
                "Vitiligo",
                "Guillain-Barre Syndrome",
                "Goodpasture's Syndrome",
                "Autoimmune Hepatitis",
                "Myasthenia Gravis",
                "Autoimmune Uveitis",
                "Autoimmune Hemolytic Anemia",
                "Autoimmune Thrombocytopenic Purpura",
                "Autoimmune Lymphoproliferative Syndrome",
                "Autoimmune Encephalitis",
                "Autoimmune Pancreatitis",
                "Autoimmune Inner Ear Disease (AIED)",
                "Scleroderma"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's Disease",
                "Autoimmune Encephalitis",
                "Autoimmune Hemolytic Anemia",
                "Autoimmune Hepatitis",
                "Autoimmune Inner Ear Disease (AIED)",
                "Autoimmune Lymphoproliferative Syndrome",
                "Autoimmune Pancreatitis",
                "Autoimmune Thrombocytopenic Purpura",
                "Autoimmune Uveitis",
                "Celiac Disease",
                "Goodpasture's Syndrome",
                "Graves' Disease",
                "Guillain-Barre Syndrome",
                "Hashimoto's Thyroiditis",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis",
                "Pernicious Anemia",
                "Psoriasis",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma",
                "Sjogren's Syndrome",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus",
                "Vitiligo"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Rheumatoid arthritis",
            "Systemic lupus erythematosus",
            "Type 1 diabetes",
            "Multiple sclerosis",
            "Graves' disease",
            "Hashimoto's thyroiditis",
            "Myasthenia gravis",
            "Pernicious anemia",
            "Celiac disease",
            "Ulcerative colitis",
            "Crohn's disease",
            "Psoriasis",
            "Sj\u00f6gren's syndrome",
            "Antiphospholipid syndrome",
            "Autoimmune hepatitis",
            "Vitiligo",
            "Polymyalgia rheumatica",
            "Polymyositis",
            "Dermatomyositis",
            "Scleroderma",
            "Goodpasture's syndrome",
            "Autoimmune encephalitis",
            "Autoimmune hemolytic anemia",
            "Autoimmune thrombocytopenia"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rheumatoid arthritis",
                "Systemic lupus erythematosus",
                "Type 1 diabetes",
                "Multiple sclerosis",
                "Graves' disease",
                "Hashimoto's thyroiditis",
                "Myasthenia gravis",
                "Pernicious anemia",
                "Celiac disease",
                "Ulcerative colitis",
                "Crohn's disease",
                "Psoriasis",
                "Sj\u00f6gren's syndrome",
                "Antiphospholipid syndrome",
                "Autoimmune hepatitis",
                "Vitiligo",
                "Polymyalgia rheumatica",
                "Polymyositis",
                "Dermatomyositis",
                "Scleroderma",
                "Goodpasture's syndrome",
                "Autoimmune encephalitis",
                "Autoimmune hemolytic anemia",
                "Autoimmune thrombocytopenia"
            ],
            "mismatches": [],
            "true_referents": [
                "Antiphospholipid syndrome",
                "Autoimmune encephalitis",
                "Autoimmune hemolytic anemia",
                "Autoimmune hepatitis",
                "Autoimmune thrombocytopenia",
                "Celiac disease",
                "Crohn's disease",
                "Dermatomyositis",
                "Goodpasture's syndrome",
                "Graves' disease",
                "Hashimoto's thyroiditis",
                "Multiple sclerosis",
                "Myasthenia gravis",
                "Pernicious anemia",
                "Polymyalgia rheumatica",
                "Polymyositis",
                "Psoriasis",
                "Rheumatoid arthritis",
                "Scleroderma",
                "Sj\u00f6gren's syndrome",
                "Systemic lupus erythematosus",
                "Type 1 diabetes",
                "Ulcerative colitis",
                "Vitiligo"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Rheumatoid arthritis (RA)",
            "Systemic lupus erythematosus (SLE)",
            "Multiple sclerosis (MS)",
            "Type 1 diabetes mellitus (T1D)",
            "Hashimoto's thyroiditis",
            "Graves' disease",
            "Celiac disease",
            "Psoriasis",
            "Inflammatory bowel disease (IBD)",
            "Ankylosing spondylitis",
            "Sj\u00f6gren's syndrome",
            "Addison's disease",
            "Autoimmune hepatitis",
            "Pemphigus vulgaris",
            "Goodpasture's syndrome",
            "Autoimmune uveitis",
            "Vasculitis",
            "Pernicious anemia",
            "Guillain-Barr\u00e9 syndrome",
            "Myasthenia gravis",
            "Scleroderma (Systemic sclerosis)",
            "Autoimmune myocarditis",
            "Autoimmune thrombocytopenia",
            "Dermatitis herpetiformis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rheumatoid arthritis (RA)",
                "Systemic lupus erythematosus (SLE)",
                "Multiple sclerosis (MS)",
                "Type 1 diabetes mellitus (T1D)",
                "Hashimoto's thyroiditis",
                "Graves' disease",
                "Celiac disease",
                "Psoriasis",
                "Inflammatory bowel disease (IBD)",
                "Ankylosing spondylitis",
                "Sj\u00f6gren's syndrome",
                "Addison's disease",
                "Autoimmune hepatitis",
                "Pemphigus vulgaris",
                "Goodpasture's syndrome",
                "Autoimmune uveitis",
                "Vasculitis",
                "Pernicious anemia",
                "Guillain-Barr\u00e9 syndrome",
                "Myasthenia gravis",
                "Scleroderma (Systemic sclerosis)",
                "Autoimmune myocarditis",
                "Autoimmune thrombocytopenia",
                "Dermatitis herpetiformis"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's disease",
                "Ankylosing spondylitis",
                "Autoimmune hepatitis",
                "Autoimmune myocarditis",
                "Autoimmune thrombocytopenia",
                "Autoimmune uveitis",
                "Celiac disease",
                "Dermatitis herpetiformis",
                "Goodpasture's syndrome",
                "Graves' disease",
                "Guillain-Barr\u00e9 syndrome",
                "Hashimoto's thyroiditis",
                "Inflammatory bowel disease (IBD)",
                "Multiple sclerosis (MS)",
                "Myasthenia gravis",
                "Pemphigus vulgaris",
                "Pernicious anemia",
                "Psoriasis",
                "Rheumatoid arthritis (RA)",
                "Scleroderma (Systemic sclerosis)",
                "Sj\u00f6gren's syndrome",
                "Systemic lupus erythematosus (SLE)",
                "Type 1 diabetes mellitus (T1D)",
                "Vasculitis"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic Lupus Erythematosus (SLE)",
            "Rheumatoid Arthritis (RA)",
            "Multiple Sclerosis (MS)",
            "Type 1 Diabetes Mellitus",
            "Graves' Disease",
            "Hashimoto's Thyroiditis",
            "Myasthenia Gravis",
            "Sj\u00f6gren's Syndrome",
            "Celiac Disease",
            "Addison's Disease",
            "Pernicious Anemia",
            "Pemphigus Vulgaris",
            "Bullous Pemphigoid",
            "Goodpasture's Syndrome",
            "Antiphospholipid Syndrome",
            "Polymyositis",
            "Dermatomyositis",
            "Scleroderma",
            "Primary Biliary Cholangitis (PBC)",
            "Autoimmune Hepatitis",
            "Vasculitis",
            "Guillain-Barr\u00e9 Syndrome",
            "Psoriasis",
            "Vitiligo"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic Lupus Erythematosus (SLE)",
                "Rheumatoid Arthritis (RA)",
                "Multiple Sclerosis (MS)",
                "Type 1 Diabetes Mellitus",
                "Graves' Disease",
                "Hashimoto's Thyroiditis",
                "Myasthenia Gravis",
                "Sj\u00f6gren's Syndrome",
                "Celiac Disease",
                "Addison's Disease",
                "Pernicious Anemia",
                "Pemphigus Vulgaris",
                "Bullous Pemphigoid",
                "Goodpasture's Syndrome",
                "Antiphospholipid Syndrome",
                "Polymyositis",
                "Dermatomyositis",
                "Scleroderma",
                "Primary Biliary Cholangitis (PBC)",
                "Autoimmune Hepatitis",
                "Vasculitis",
                "Guillain-Barr\u00e9 Syndrome",
                "Psoriasis",
                "Vitiligo"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's Disease",
                "Antiphospholipid Syndrome",
                "Autoimmune Hepatitis",
                "Bullous Pemphigoid",
                "Celiac Disease",
                "Dermatomyositis",
                "Goodpasture's Syndrome",
                "Graves' Disease",
                "Guillain-Barr\u00e9 Syndrome",
                "Hashimoto's Thyroiditis",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis",
                "Pemphigus Vulgaris",
                "Pernicious Anemia",
                "Polymyositis",
                "Primary Biliary Cholangitis (PBC)",
                "Psoriasis",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's Syndrome",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus",
                "Vasculitis",
                "Vitiligo"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Systemic lupus erythematosus (SLE)",
            "Rheumatoid arthritis (RA)",
            "Type 1 diabetes mellitus (T1DM)",
            "Multiple sclerosis (MS)",
            "Graves' disease",
            "Hashimoto's thyroiditis",
            "Myasthenia gravis (MG)",
            "Pernicious anemia",
            "Sj\u00f6gren's syndrome",
            "Goodpasture syndrome",
            "Autoimmune hepatitis",
            "Primary biliary cholangitis (PBC)",
            "Celiac disease",
            "Inflammatory bowel disease (IBD)",
            "Psoriasis",
            "Scleroderma",
            "Dermatomyositis",
            "Polymyositis",
            "Antiphospholipid syndrome (APS)",
            "Autoimmune vasculitis",
            "Autoimmune hemolytic anemia (AIHA)",
            "Idiopathic thrombocytopenic purpura (ITP)",
            "Autoimmune neutropenia",
            "Autoimmune polyglandular syndrome (APS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Systemic lupus erythematosus (SLE)",
                "Rheumatoid arthritis (RA)",
                "Type 1 diabetes mellitus (T1DM)",
                "Multiple sclerosis (MS)",
                "Graves' disease",
                "Hashimoto's thyroiditis",
                "Myasthenia gravis (MG)",
                "Pernicious anemia",
                "Sj\u00f6gren's syndrome",
                "Goodpasture syndrome",
                "Autoimmune hepatitis",
                "Primary biliary cholangitis (PBC)",
                "Celiac disease",
                "Inflammatory bowel disease (IBD)",
                "Psoriasis",
                "Scleroderma",
                "Dermatomyositis",
                "Polymyositis",
                "Antiphospholipid syndrome (APS)",
                "Autoimmune vasculitis",
                "Autoimmune hemolytic anemia (AIHA)",
                "Idiopathic thrombocytopenic purpura (ITP)",
                "Autoimmune neutropenia",
                "Autoimmune polyglandular syndrome (APS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Antiphospholipid syndrome (APS)",
                "Autoimmune hemolytic anemia (AIHA)",
                "Autoimmune hepatitis",
                "Autoimmune neutropenia",
                "Autoimmune polyglandular syndrome (APS)",
                "Autoimmune vasculitis",
                "Celiac disease",
                "Dermatomyositis",
                "Goodpasture syndrome",
                "Graves' disease",
                "Hashimoto's thyroiditis",
                "Idiopathic thrombocytopenic purpura (ITP)",
                "Inflammatory bowel disease (IBD)",
                "Multiple sclerosis (MS)",
                "Myasthenia gravis (MG)",
                "Pernicious anemia",
                "Polymyositis",
                "Primary biliary cholangitis (PBC)",
                "Psoriasis",
                "Rheumatoid arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's syndrome",
                "Systemic lupus erythematosus (SLE)",
                "Type 1 diabetes mellitus (T1DM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Rheumatoid arthritis (RA)",
            "Systemic lupus erythematosus (SLE)",
            "Multiple sclerosis (MS)",
            "Type 1 diabetes mellitus",
            "Hashimoto's thyroiditis",
            "Graves' disease",
            "Myasthenia gravis",
            "Pernicious anemia",
            "Addison's disease",
            "Vitiligo",
            "Sj\u00f6gren's syndrome",
            "Antiphospholipid syndrome",
            "Autoimmune hepatitis",
            "Inflammatory bowel disease (IBD)",
            "Psoriasis",
            "Scleroderma",
            "Polymyositis",
            "Dermatomyositis",
            "Autoimmune hemolytic anemia",
            "Autoimmune thrombocytopenic purpura (ATP)",
            "Guillain-Barr\u00e9 syndrome",
            "Goodpasture's syndrome",
            "Pemphigus vulgaris",
            "Autoimmune polyendocrine syndrome"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rheumatoid arthritis (RA)",
                "Systemic lupus erythematosus (SLE)",
                "Multiple sclerosis (MS)",
                "Type 1 diabetes mellitus",
                "Hashimoto's thyroiditis",
                "Graves' disease",
                "Myasthenia gravis",
                "Pernicious anemia",
                "Addison's disease",
                "Vitiligo",
                "Sj\u00f6gren's syndrome",
                "Antiphospholipid syndrome",
                "Autoimmune hepatitis",
                "Inflammatory bowel disease (IBD)",
                "Psoriasis",
                "Scleroderma",
                "Polymyositis",
                "Dermatomyositis",
                "Autoimmune hemolytic anemia",
                "Autoimmune thrombocytopenic purpura (ATP)",
                "Guillain-Barr\u00e9 syndrome",
                "Goodpasture's syndrome",
                "Pemphigus vulgaris",
                "Autoimmune polyendocrine syndrome"
            ],
            "mismatches": [],
            "true_referents": [
                "Addison's disease",
                "Antiphospholipid syndrome",
                "Autoimmune hemolytic anemia",
                "Autoimmune hepatitis",
                "Autoimmune polyendocrine syndrome",
                "Autoimmune thrombocytopenic purpura (ATP)",
                "Dermatomyositis",
                "Goodpasture's syndrome",
                "Graves' disease",
                "Guillain-Barr\u00e9 syndrome",
                "Hashimoto's thyroiditis",
                "Inflammatory bowel disease (IBD)",
                "Multiple sclerosis (MS)",
                "Myasthenia gravis",
                "Pemphigus vulgaris",
                "Pernicious anemia",
                "Polymyositis",
                "Psoriasis",
                "Rheumatoid arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's syndrome",
                "Systemic lupus erythematosus (SLE)",
                "Type 1 diabetes mellitus",
                "Vitiligo"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Autoimmune Hepatitis (AIH)",
            "Graves' Disease (GD)",
            "Hashimoto's Thyroiditis (HT)",
            "Rheumatoid Arthritis (RA)",
            "Systemic Lupus Erythematosus (SLE)",
            "Multiple Sclerosis (MS)",
            "Type 1 Diabetes Mellitus (T1DM)",
            "Myasthenia Gravis (MG)",
            "Guillain-Barr\u00e9 Syndrome (GBS)",
            "Pemphigus Vulgaris (PV)",
            "Scleroderma (SSc)",
            "Sj\u00f6gren's Syndrome (SS)",
            "Antiphospholipid Syndrome (APS)",
            "Inflammatory Bowel Disease (IBD)",
            "Celiac Disease (CD)",
            "Vitiligo (VIT)",
            "Psoriasis (PSO)",
            "Alopecia Areata (AA)",
            "Autoimmune Hemolytic Anemia (AIHA)",
            "Idiopathic Thrombocytopenic Purpura (ITP)",
            "Goodpasture's Syndrome (GS)",
            "Autoimmune Encephalitis (AIE)",
            "Autoimmune Nephritis (AIN)",
            "Autoimmune Neuropathy (AIN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Autoimmune Hepatitis (AIH)",
                "Graves' Disease (GD)",
                "Hashimoto's Thyroiditis (HT)",
                "Rheumatoid Arthritis (RA)",
                "Systemic Lupus Erythematosus (SLE)",
                "Multiple Sclerosis (MS)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Myasthenia Gravis (MG)",
                "Guillain-Barr\u00e9 Syndrome (GBS)",
                "Pemphigus Vulgaris (PV)",
                "Scleroderma (SSc)",
                "Sj\u00f6gren's Syndrome (SS)",
                "Antiphospholipid Syndrome (APS)",
                "Inflammatory Bowel Disease (IBD)",
                "Celiac Disease (CD)",
                "Vitiligo (VIT)",
                "Psoriasis (PSO)",
                "Alopecia Areata (AA)",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Goodpasture's Syndrome (GS)",
                "Autoimmune Encephalitis (AIE)"
            ],
            "mismatches": [
                "Autoimmune Nephritis (AIN)",
                "Autoimmune Neuropathy (AIN)"
            ],
            "true_referents": [
                "Alopecia Areata (AA)",
                "Antiphospholipid Syndrome (APS)",
                "Autoimmune Encephalitis (AIE)",
                "Autoimmune Hemolytic Anemia (AIHA)",
                "Autoimmune Hepatitis (AIH)",
                "Autoimmune Nephritis (AIN)",
                "Autoimmune Neuropathy (AIN)",
                "Celiac Disease (CD)",
                "Goodpasture's Syndrome (GS)",
                "Graves' Disease (GD)",
                "Guillain-Barr\u00e9 Syndrome (GBS)",
                "Hashimoto's Thyroiditis (HT)",
                "Idiopathic Thrombocytopenic Purpura (ITP)",
                "Inflammatory Bowel Disease (IBD)",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis (MG)",
                "Pemphigus Vulgaris (PV)",
                "Psoriasis (PSO)",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma (SSc)",
                "Sj\u00f6gren's Syndrome (SS)",
                "Systemic Lupus Erythematosus (SLE)",
                "Type 1 Diabetes Mellitus (T1DM)",
                "Vitiligo (VIT)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Autoimmune Hemolytic Anemia (AIHA) (1)",
            "Goodpasture's Syndrome (2)",
            "Pernicious Anemia (3)",
            "Rheumatoid Arthritis (4)",
            "Systemic Lupus Erythematosus (5)",
            "Hashimoto's Thyroiditis (6)",
            "Graves' Disease (7)",
            "Type 1 Diabetes (8)",
            "Multiple Sclerosis (9)",
            "Guillain-Barr\u00e9 Syndrome (10)",
            "Psoriasis (11)",
            "Vitiligo (12)",
            "Pemphigus (13)",
            "Pemphigoid (14)",
            "Epidermolysis Bullosa Acquisita (15)",
            "Chronic Active Hepatitis (16)",
            "Primary Biliary Cirrhosis (17)",
            "Primary Sclerosing Cholangitis (18)",
            "Crohn's Disease (19)",
            "Ulcerative Colitis (20)",
            "Psoriatic Arthritis (21)",
            "Lupus Nephritis (22)",
            "Kawasaki Disease (23)",
            "Stevens-Johnson Syndrome (24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Autoimmune Hemolytic Anemia (AIHA) (1)",
                "Goodpasture's Syndrome (2)",
                "Pernicious Anemia (3)",
                "Rheumatoid Arthritis (4)",
                "Systemic Lupus Erythematosus (5)",
                "Hashimoto's Thyroiditis (6)",
                "Graves' Disease (7)",
                "Type 1 Diabetes (8)",
                "Multiple Sclerosis (9)",
                "Guillain-Barr\u00e9 Syndrome (10)",
                "Psoriasis (11)",
                "Vitiligo (12)",
                "Pemphigus (13)",
                "Pemphigoid (14)",
                "Epidermolysis Bullosa Acquisita (15)",
                "Chronic Active Hepatitis (16)",
                "Primary Biliary Cirrhosis (17)",
                "Primary Sclerosing Cholangitis (18)",
                "Crohn's Disease (19)",
                "Ulcerative Colitis (20)",
                "Psoriatic Arthritis (21)",
                "Lupus Nephritis (22)",
                "Kawasaki Disease (23)",
                "Stevens-Johnson Syndrome (24)"
            ],
            "mismatches": [],
            "true_referents": [
                "Autoimmune Hemolytic Anemia (AIHA) (1)",
                "Chronic Active Hepatitis (16)",
                "Crohn's Disease (19)",
                "Epidermolysis Bullosa Acquisita (15)",
                "Goodpasture's Syndrome (2)",
                "Graves' Disease (7)",
                "Guillain-Barr\u00e9 Syndrome (10)",
                "Hashimoto's Thyroiditis (6)",
                "Kawasaki Disease (23)",
                "Lupus Nephritis (22)",
                "Multiple Sclerosis (9)",
                "Pemphigoid (14)",
                "Pemphigus (13)",
                "Pernicious Anemia (3)",
                "Primary Biliary Cirrhosis (17)",
                "Primary Sclerosing Cholangitis (18)",
                "Psoriasis (11)",
                "Psoriatic Arthritis (21)",
                "Rheumatoid Arthritis (4)",
                "Stevens-Johnson Syndrome (24)",
                "Systemic Lupus Erythematosus (5)",
                "Type 1 Diabetes (8)",
                "Ulcerative Colitis (20)",
                "Vitiligo (12)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            "Rheumatoid Arthritis (RA)",
            "Lupus Erythematosus (SLE)",
            "Hashimoto's Thyroiditis",
            "Type 1 Diabetes",
            "Multiple Sclerosis (MS)",
            "Guillain-Barr\u00e9 Syndrome",
            "Pernicious Anemia",
            "Vitiligo",
            "Pemphigus Vulgaris",
            "Alopecia Areata",
            "Crohn's Disease",
            "Ulcerative Colitis",
            "Psoriasis",
            "Sj\u00f6gren's Syndrome",
            "Raynaud's Phenomenon",
            "Scleroderma",
            "Dermatomyositis",
            "Polymyositis",
            "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
            "Graves' Disease",
            "Myasthenia Gravis",
            "Pernicious Anemia",
            "Wegener's Granulomatosis",
            "Microscopic Polyangiitis",
            "Churg-Strauss Syndrome"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rheumatoid Arthritis (RA)",
                "Lupus Erythematosus (SLE)",
                "Hashimoto's Thyroiditis",
                "Type 1 Diabetes",
                "Multiple Sclerosis (MS)",
                "Guillain-Barr\u00e9 Syndrome",
                "Pernicious Anemia",
                "Vitiligo",
                "Pemphigus Vulgaris",
                "Alopecia Areata",
                "Crohn's Disease",
                "Ulcerative Colitis",
                "Psoriasis",
                "Sj\u00f6gren's Syndrome",
                "Raynaud's Phenomenon",
                "Scleroderma",
                "Dermatomyositis",
                "Polymyositis",
                "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
                "Graves' Disease",
                "Myasthenia Gravis",
                "Wegener's Granulomatosis",
                "Microscopic Polyangiitis"
            ],
            "mismatches": [
                "Churg-Strauss Syndrome"
            ],
            "true_referents": [
                "Alopecia Areata",
                "Chronic Inflammatory Demyelinating Polyneuropathy (CIDP)",
                "Crohn's Disease",
                "Dermatomyositis",
                "Graves' Disease",
                "Guillain-Barr\u00e9 Syndrome",
                "Hashimoto's Thyroiditis",
                "Lupus Erythematosus (SLE)",
                "Microscopic Polyangiitis",
                "Multiple Sclerosis (MS)",
                "Myasthenia Gravis",
                "Pemphigus Vulgaris",
                "Pernicious Anemia",
                "Polymyositis",
                "Psoriasis",
                "Raynaud's Phenomenon",
                "Rheumatoid Arthritis (RA)",
                "Scleroderma",
                "Sj\u00f6gren's Syndrome",
                "Type 1 Diabetes",
                "Ulcerative Colitis",
                "Vitiligo",
                "Wegener's Granulomatosis"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "autoimmune disease",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Anemia",
                "Canonical Name": "Anemia"
            },
            {
                "Referent": "Cancer",
                "Canonical Name": "Cancer"
            },
            {
                "Referent": "Celiac disease",
                "Canonical Name": "Celiac disease"
            },
            {
                "Referent": "Eczema",
                "Canonical Name": "Eczema"
            },
            {
                "Referent": "Gout",
                "Canonical Name": "Gout"
            },
            {
                "Referent": "Hashimoto's thyroiditis",
                "Canonical Name": "Hashimoto's thyroiditis"
            },
            {
                "Referent": "Hypothyroidism",
                "Canonical Name": "Hypothyroidism"
            },
            {
                "Referent": "Hyperthyroidism",
                "Canonical Name": "Hyperthyroidism"
            },
            {
                "Referent": "Inflammatory bowel disease",
                "Canonical Name": "Inflammatory bowel disease"
            },
            {
                "Referent": "Multiple sclerosis",
                "Canonical Name": "Multiple sclerosis"
            },
            {
                "Referent": "Rheumatoid arthritis",
                "Canonical Name": "Rheumatoid arthritis"
            },
            {
                "Referent": "Systemic lupus erythematosus",
                "Canonical Name": "Systemic lupus erythematosus"
            },
            {
                "Referent": "Ulcerative colitis",
                "Canonical Name": "Ulcerative colitis"
            },
            {
                "Referent": "Vitiligo",
                "Canonical Name": "Vitiligo"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Anemia",
                "Cancer",
                "Celiac disease",
                "Eczema",
                "Gout",
                "Hashimoto's thyroiditis",
                "Hypothyroidism",
                "Hyperthyroidism",
                "Inflammatory bowel disease",
                "Multiple sclerosis",
                "Rheumatoid arthritis",
                "Systemic lupus erythematosus",
                "Ulcerative colitis",
                "Vitiligo"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Anemia\", \"Canonical Name\": \"Anemia\"}",
                "{\"Referent\": \"Cancer\", \"Canonical Name\": \"Cancer\"}",
                "{\"Referent\": \"Celiac disease\", \"Canonical Name\": \"Celiac disease\"}",
                "{\"Referent\": \"Eczema\", \"Canonical Name\": \"Eczema\"}",
                "{\"Referent\": \"Gout\", \"Canonical Name\": \"Gout\"}",
                "{\"Referent\": \"Hashimoto's thyroiditis\", \"Canonical Name\": \"Hashimoto's thyroiditis\"}",
                "{\"Referent\": \"Hyperthyroidism\", \"Canonical Name\": \"Hyperthyroidism\"}",
                "{\"Referent\": \"Hypothyroidism\", \"Canonical Name\": \"Hypothyroidism\"}",
                "{\"Referent\": \"Inflammatory bowel disease\", \"Canonical Name\": \"Inflammatory bowel disease\"}",
                "{\"Referent\": \"Multiple sclerosis\", \"Canonical Name\": \"Multiple sclerosis\"}",
                "{\"Referent\": \"Rheumatoid arthritis\", \"Canonical Name\": \"Rheumatoid arthritis\"}",
                "{\"Referent\": \"Systemic lupus erythematosus\", \"Canonical Name\": \"Systemic lupus erythematosus\"}",
                "{\"Referent\": \"Ulcerative colitis\", \"Canonical Name\": \"Ulcerative colitis\"}",
                "{\"Referent\": \"Vitiligo\", \"Canonical Name\": \"Vitiligo\"}"
            ],
            "TP": 14,
            "FP": 0,
            "FN": 0
        }
    }
]