[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage",
            "B cell",
            "Langerhans cell",
            "Interdigitating cell",
            "Epithelial cell",
            "Mast cell",
            "Neutrophil",
            "Red pulp marginal metallophilic macrophage",
            "Microglia",
            "Osteoclast",
            "Kupffer cell",
            "Alveolar macrophage",
            "Lymphoid tissue inducer cell",
            "Tumor-associated macrophage",
            "M\u00fcller cell",
            "Corneal endothelial cell",
            "Corneal stromal cell",
            "Corneal epithelial cell",
            "Retinal pigment epithelial cell",
            "Mesothelial cell",
            "Sinusoidal endothelial cell",
            "Endothelial progenitor cell",
            "Perivascular cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage",
                "B cell",
                "Langerhans cell",
                "Interdigitating cell",
                "Epithelial cell",
                "Mast cell",
                "Neutrophil",
                "Red pulp marginal metallophilic macrophage",
                "Microglia",
                "Osteoclast",
                "Kupffer cell",
                "Alveolar macrophage",
                "Lymphoid tissue inducer cell",
                "Tumor-associated macrophage",
                "M\u00fcller cell",
                "Corneal endothelial cell",
                "Corneal stromal cell",
                "Corneal epithelial cell",
                "Retinal pigment epithelial cell",
                "Mesothelial cell",
                "Sinusoidal endothelial cell",
                "Endothelial progenitor cell",
                "Perivascular cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "B cell",
                "Corneal endothelial cell",
                "Corneal epithelial cell",
                "Corneal stromal cell",
                "Dendritic cell (DC)",
                "Endothelial progenitor cell",
                "Epithelial cell",
                "Interdigitating cell",
                "Kupffer cell",
                "Langerhans cell",
                "Lymphoid tissue inducer cell",
                "Macrophage",
                "Mast cell",
                "Mesothelial cell",
                "Microglia",
                "M\u00fcller cell",
                "Neutrophil",
                "Osteoclast",
                "Perivascular cell",
                "Red pulp marginal metallophilic macrophage",
                "Retinal pigment epithelial cell",
                "Sinusoidal endothelial cell",
                "Tumor-associated macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage",
            "B cell",
            "Monocyte",
            "Conventional dendritic cell (cDC)",
            "Plasmacytoid dendritic cell (pDC)",
            "Langerhans cell",
            "Kupffer cell",
            "Microglial cell",
            "Osteoclast",
            "Follicular dendritic cell",
            "Epidermal Langerhans cell",
            "Interstitial dendritic cell",
            "Inflammatory monocyte",
            "Tissue-resident macrophage",
            "Myeloid dendritic cell",
            "Lymphoid dendritic cell",
            "Neutrophil",
            "Intravascular dendritic cell",
            "Perivascular dendritic cell",
            "Langerhans cell precursor",
            "Monocyte-derived dendritic cell",
            "Follicular dendritic cell in lymph nodes",
            "Epithelial Langerhans cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage",
                "B cell",
                "Monocyte",
                "Conventional dendritic cell (cDC)",
                "Plasmacytoid dendritic cell (pDC)",
                "Langerhans cell",
                "Kupffer cell",
                "Microglial cell",
                "Osteoclast",
                "Follicular dendritic cell",
                "Epidermal Langerhans cell",
                "Interstitial dendritic cell",
                "Inflammatory monocyte",
                "Tissue-resident macrophage",
                "Myeloid dendritic cell",
                "Lymphoid dendritic cell",
                "Neutrophil",
                "Intravascular dendritic cell",
                "Perivascular dendritic cell",
                "Langerhans cell precursor",
                "Monocyte-derived dendritic cell",
                "Follicular dendritic cell in lymph nodes",
                "Epithelial Langerhans cell"
            ],
            "mismatches": [],
            "true_referents": [
                "B cell",
                "Conventional dendritic cell (cDC)",
                "Dendritic cell (DC)",
                "Epidermal Langerhans cell",
                "Epithelial Langerhans cell",
                "Follicular dendritic cell",
                "Follicular dendritic cell in lymph nodes",
                "Inflammatory monocyte",
                "Interstitial dendritic cell",
                "Intravascular dendritic cell",
                "Kupffer cell",
                "Langerhans cell",
                "Langerhans cell precursor",
                "Lymphoid dendritic cell",
                "Macrophage",
                "Microglial cell",
                "Monocyte",
                "Monocyte-derived dendritic cell",
                "Myeloid dendritic cell",
                "Neutrophil",
                "Osteoclast",
                "Perivascular dendritic cell",
                "Plasmacytoid dendritic cell (pDC)",
                "Tissue-resident macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic Cell (DC)",
            "Macrophage",
            "B Cell",
            "Langerhans Cell",
            "Follicular Dendritic Cell",
            "Interdigitating Dendritic Cell",
            "Conventional Dendritic Cell (cDC)",
            "Plasmacytoid Dendritic Cell (pDC)",
            "Monocyte",
            "Microglial Cell",
            "Kupffer Cell",
            "Osteoclast",
            "Alveolar Macrophage",
            "Histiocyte",
            "Lymph Node Stromal Cell",
            "Marginal Zone Macrophage",
            "Red Pulp Macrophage",
            "Spleen Macrophage",
            "Peritoneal Macrophage",
            "Bone Marrow Macrophage",
            "Eosinophil",
            "Basophil",
            "Mast Cell",
            "Fibroblast",
            "Endothelial Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic Cell (DC)",
                "Macrophage",
                "B Cell",
                "Langerhans Cell",
                "Follicular Dendritic Cell",
                "Interdigitating Dendritic Cell",
                "Conventional Dendritic Cell (cDC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Monocyte",
                "Microglial Cell",
                "Kupffer Cell",
                "Osteoclast",
                "Alveolar Macrophage",
                "Histiocyte",
                "Lymph Node Stromal Cell",
                "Marginal Zone Macrophage",
                "Red Pulp Macrophage",
                "Spleen Macrophage",
                "Peritoneal Macrophage",
                "Bone Marrow Macrophage",
                "Eosinophil",
                "Basophil",
                "Mast Cell",
                "Fibroblast"
            ],
            "mismatches": [
                "Endothelial Cell"
            ],
            "true_referents": [
                "Alveolar Macrophage",
                "B Cell",
                "Basophil",
                "Bone Marrow Macrophage",
                "Conventional Dendritic Cell (cDC)",
                "Dendritic Cell (DC)",
                "Eosinophil",
                "Fibroblast",
                "Follicular Dendritic Cell",
                "Histiocyte",
                "Interdigitating Dendritic Cell",
                "Kupffer Cell",
                "Langerhans Cell",
                "Lymph Node Stromal Cell",
                "Macrophage",
                "Marginal Zone Macrophage",
                "Mast Cell",
                "Microglial Cell",
                "Monocyte",
                "Osteoclast",
                "Peritoneal Macrophage",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Red Pulp Macrophage",
                "Spleen Macrophage"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Classical Dendritic Cell (cDC)",
            "Plasmacytoid Dendritic Cell (pDC)",
            "Monocyte-Derived Dendritic Cell (moDC)",
            "Langerhans Cell (LC)",
            "Interstitial Dendritic Cell (IDC)",
            "Birbeck Cell (LC subtype)",
            "Follicular Dendritic Cell (FDC)",
            "Conventional Type 1 Dendritic Cell (cDC1)",
            "Conventional Type 2 Dendritic Cell (cDC2)",
            "Migratory Dendritic Cell (mDC)",
            "Immature Dendritic Cell (iDC)",
            "Mature Dendritic Cell (mDC - following activation)",
            "B Cell (expressing MHC II)",
            "Macrophages (M1 polarized)",
            "Macrophages (M2 polarized)",
            "Microglial Cell (CNS)",
            "Alveolar Macrophage (lung)",
            "Kupffer Cell (liver)",
            "Splenic Dendritic Cell (in white pulp)",
            "Lymph Node Dendritic Cell (in T cell zone)",
            "Intestinal Dendritic Cell (CD103+)",
            "CD8\u03b1+ Dendritic Cell (mouse)",
            "CD11b+ Dendritic Cell (mouse)",
            "Human Dendritic Adventitial Cell (hDAC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Classical Dendritic Cell (cDC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Monocyte-Derived Dendritic Cell (moDC)",
                "Langerhans Cell (LC)",
                "Interstitial Dendritic Cell (IDC)",
                "Birbeck Cell (LC subtype)",
                "Follicular Dendritic Cell (FDC)",
                "Conventional Type 1 Dendritic Cell (cDC1)",
                "Conventional Type 2 Dendritic Cell (cDC2)",
                "Migratory Dendritic Cell (mDC)",
                "Immature Dendritic Cell (iDC)",
                "Mature Dendritic Cell (mDC - following activation)",
                "B Cell (expressing MHC II)",
                "Macrophages (M1 polarized)",
                "Macrophages (M2 polarized)",
                "Microglial Cell (CNS)",
                "Alveolar Macrophage (lung)",
                "Kupffer Cell (liver)",
                "Splenic Dendritic Cell (in white pulp)",
                "Lymph Node Dendritic Cell (in T cell zone)",
                "Intestinal Dendritic Cell (CD103+)",
                "CD8\u03b1+ Dendritic Cell (mouse)",
                "CD11b+ Dendritic Cell (mouse)",
                "Human Dendritic Adventitial Cell (hDAC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage (lung)",
                "B Cell (expressing MHC II)",
                "Birbeck Cell (LC subtype)",
                "CD11b+ Dendritic Cell (mouse)",
                "CD8\u03b1+ Dendritic Cell (mouse)",
                "Classical Dendritic Cell (cDC)",
                "Conventional Type 1 Dendritic Cell (cDC1)",
                "Conventional Type 2 Dendritic Cell (cDC2)",
                "Follicular Dendritic Cell (FDC)",
                "Human Dendritic Adventitial Cell (hDAC)",
                "Immature Dendritic Cell (iDC)",
                "Interstitial Dendritic Cell (IDC)",
                "Intestinal Dendritic Cell (CD103+)",
                "Kupffer Cell (liver)",
                "Langerhans Cell (LC)",
                "Lymph Node Dendritic Cell (in T cell zone)",
                "Macrophages (M1 polarized)",
                "Macrophages (M2 polarized)",
                "Mature Dendritic Cell (mDC - following activation)",
                "Microglial Cell (CNS)",
                "Migratory Dendritic Cell (mDC)",
                "Monocyte-Derived Dendritic Cell (moDC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Splenic Dendritic Cell (in white pulp)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage",
            "B cell",
            "Langerhans cell",
            "Follicular dendritic cell (FDC)",
            "Interdigitating dendritic cell",
            "Plasmacytoid dendritic cell (pDC)",
            "Kupffer cell",
            "Microglia",
            "Alveolar macrophage",
            "Peritoneal macrophage",
            "Monocyte",
            "Osteoclast",
            "Sinusoidal endothelial cell",
            "Thymic epithelial cell",
            "Intestinal epithelial cell",
            "Mesangial cell",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Lymph node stromal cell",
            "Tingible body macrophage",
            "Epidermal Langerhans cell",
            "Glial cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage",
                "B cell",
                "Langerhans cell",
                "Follicular dendritic cell (FDC)",
                "Interdigitating dendritic cell",
                "Plasmacytoid dendritic cell (pDC)",
                "Kupffer cell",
                "Microglia",
                "Alveolar macrophage",
                "Peritoneal macrophage",
                "Monocyte",
                "Osteoclast",
                "Sinusoidal endothelial cell",
                "Thymic epithelial cell",
                "Intestinal epithelial cell",
                "Mesangial cell",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Lymph node stromal cell",
                "Tingible body macrophage",
                "Epidermal Langerhans cell",
                "Glial cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "B cell",
                "Basophil",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Epidermal Langerhans cell",
                "Follicular dendritic cell (FDC)",
                "Glial cell",
                "Interdigitating dendritic cell",
                "Intestinal epithelial cell",
                "Kupffer cell",
                "Langerhans cell",
                "Lymph node stromal cell",
                "Macrophage",
                "Mast cell",
                "Mesangial cell",
                "Microglia",
                "Monocyte",
                "Osteoclast",
                "Peritoneal macrophage",
                "Plasmacytoid dendritic cell (pDC)",
                "Sinusoidal endothelial cell",
                "Thymic epithelial cell",
                "Tingible body macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic Cell (DC)",
            "Macrophage (M\u03a6)",
            "B Cell (B lymphocyte)",
            "Langerhans Cell (LC)",
            "Monocyte (Mo)",
            "Follicular Dendritic Cell (FDC)",
            "Activated T Cell (aT)",
            "Plasmacytoid Dendritic Cell (pDC)",
            "Interdigitating Dendritic Cell (IDC)",
            "Myeloid Dendritic Cell (mDC)",
            "CD8+ T Cell (CD8+ T)",
            "CD4+ T Cell (CD4+ T)",
            "Bone Marrow-Derived Dendritic Cell (BMDC)",
            "Tissue-resident Dendritic Cell (trDC)",
            "Regulatory T Cell (Treg)",
            "Nasal Dendritic Cell (NDC)",
            "Tumor-associated Dendritic Cell (TADC)",
            "Lymphoid Dendritic Cell (LDC)",
            "Antigen-presenting B Cell (APB)",
            "Microglia (MG)",
            "Kupffer Cell (KC)",
            "Alveolar Macrophage (AM)",
            "Spleen Dendritic Cell (SDC)",
            "Mucosal Dendritic Cell (MDC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic Cell (DC)",
                "Macrophage (M\u03a6)",
                "B Cell (B lymphocyte)",
                "Langerhans Cell (LC)",
                "Monocyte (Mo)",
                "Follicular Dendritic Cell (FDC)",
                "Activated T Cell (aT)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Interdigitating Dendritic Cell (IDC)",
                "Myeloid Dendritic Cell (mDC)",
                "CD8+ T Cell (CD8+ T)",
                "CD4+ T Cell (CD4+ T)",
                "Bone Marrow-Derived Dendritic Cell (BMDC)",
                "Tissue-resident Dendritic Cell (trDC)",
                "Regulatory T Cell (Treg)",
                "Nasal Dendritic Cell (NDC)",
                "Tumor-associated Dendritic Cell (TADC)",
                "Lymphoid Dendritic Cell (LDC)",
                "Antigen-presenting B Cell (APB)",
                "Microglia (MG)",
                "Kupffer Cell (KC)",
                "Alveolar Macrophage (AM)",
                "Spleen Dendritic Cell (SDC)",
                "Mucosal Dendritic Cell (MDC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated T Cell (aT)",
                "Alveolar Macrophage (AM)",
                "Antigen-presenting B Cell (APB)",
                "B Cell (B lymphocyte)",
                "Bone Marrow-Derived Dendritic Cell (BMDC)",
                "CD4+ T Cell (CD4+ T)",
                "CD8+ T Cell (CD8+ T)",
                "Dendritic Cell (DC)",
                "Follicular Dendritic Cell (FDC)",
                "Interdigitating Dendritic Cell (IDC)",
                "Kupffer Cell (KC)",
                "Langerhans Cell (LC)",
                "Lymphoid Dendritic Cell (LDC)",
                "Macrophage (M\u03a6)",
                "Microglia (MG)",
                "Monocyte (Mo)",
                "Mucosal Dendritic Cell (MDC)",
                "Myeloid Dendritic Cell (mDC)",
                "Nasal Dendritic Cell (NDC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Regulatory T Cell (Treg)",
                "Spleen Dendritic Cell (SDC)",
                "Tissue-resident Dendritic Cell (trDC)",
                "Tumor-associated Dendritic Cell (TADC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic Cells (DCs)",
            "Macrophages",
            "B cells",
            "Monocytes",
            "Langerhans Cells",
            "Microglial Cells",
            "Kupffer Cells",
            "Osteoclasts",
            "Neutrophils",
            "Follicular Dendritic Cells",
            "Interstitial Dendritic Cells",
            "Veiled Cells",
            "Interdigitating Dendritic Cells",
            "Plasmacytoid Dendritic Cells",
            "Inflammatory Dendritic Epidermal Cells (IDECs)",
            "CD8 alpha+ Dendritic Cells",
            "CD103+ Dendritic Cells",
            "CD11c+ Dendritic Cells",
            "CD14+ Dendritic Cells",
            "CD1c (BDCA-1)+ Myeloid Dendritic Cells",
            "CD141 (BDCA-3)+ Myeloid Dendritic Cells",
            "CD123 (BDCA-2)+ Plasmacytoid Dendritic Cells",
            "CD303 (BDCA-2)+ Plasmacytoid Dendritic Cells",
            "CD304 (BDCA-4/Neuropilin-1)+ Plasmacytoid Dendritic Cells"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic Cells (DCs)",
                "Macrophages",
                "B cells",
                "Monocytes",
                "Langerhans Cells",
                "Microglial Cells",
                "Kupffer Cells",
                "Osteoclasts",
                "Neutrophils",
                "Follicular Dendritic Cells",
                "Interstitial Dendritic Cells",
                "Veiled Cells",
                "Interdigitating Dendritic Cells",
                "Plasmacytoid Dendritic Cells",
                "Inflammatory Dendritic Epidermal Cells (IDECs)",
                "CD8 alpha+ Dendritic Cells",
                "CD103+ Dendritic Cells",
                "CD11c+ Dendritic Cells",
                "CD14+ Dendritic Cells",
                "CD1c (BDCA-1)+ Myeloid Dendritic Cells",
                "CD141 (BDCA-3)+ Myeloid Dendritic Cells",
                "CD123 (BDCA-2)+ Plasmacytoid Dendritic Cells",
                "CD303 (BDCA-2)+ Plasmacytoid Dendritic Cells",
                "CD304 (BDCA-4/Neuropilin-1)+ Plasmacytoid Dendritic Cells"
            ],
            "mismatches": [],
            "true_referents": [
                "B cells",
                "CD103+ Dendritic Cells",
                "CD11c+ Dendritic Cells",
                "CD123 (BDCA-2)+ Plasmacytoid Dendritic Cells",
                "CD14+ Dendritic Cells",
                "CD141 (BDCA-3)+ Myeloid Dendritic Cells",
                "CD1c (BDCA-1)+ Myeloid Dendritic Cells",
                "CD303 (BDCA-2)+ Plasmacytoid Dendritic Cells",
                "CD304 (BDCA-4/Neuropilin-1)+ Plasmacytoid Dendritic Cells",
                "CD8 alpha+ Dendritic Cells",
                "Dendritic Cells (DCs)",
                "Follicular Dendritic Cells",
                "Inflammatory Dendritic Epidermal Cells (IDECs)",
                "Interdigitating Dendritic Cells",
                "Interstitial Dendritic Cells",
                "Kupffer Cells",
                "Langerhans Cells",
                "Macrophages",
                "Microglial Cells",
                "Monocytes",
                "Neutrophils",
                "Osteoclasts",
                "Plasmacytoid Dendritic Cells",
                "Veiled Cells"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell",
            "Macrophage",
            "B cell",
            "Langerhans cell",
            "Follicular dendritic cell",
            "Monocyte",
            "Plasmacytoid dendritic cell",
            "Fibroblast-like synoviocyte",
            "Endothelial cell",
            "Epithelial cell",
            "Osteoblast",
            "Osteoclast",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Kupffer cell",
            "Microglia",
            "Pericyte",
            "Fibroblast",
            "Schwann cell",
            "T cell",
            "Natural killer cell",
            "Lymphatic endothelial cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell",
                "Macrophage",
                "B cell",
                "Langerhans cell",
                "Follicular dendritic cell",
                "Monocyte",
                "Plasmacytoid dendritic cell",
                "Fibroblast-like synoviocyte",
                "Endothelial cell",
                "Epithelial cell",
                "Osteoblast",
                "Osteoclast",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Kupffer cell",
                "Microglia",
                "Pericyte",
                "Fibroblast",
                "Schwann cell",
                "T cell",
                "Natural killer cell",
                "Lymphatic endothelial cell"
            ],
            "mismatches": [],
            "true_referents": [
                "B cell",
                "Basophil",
                "Dendritic cell",
                "Endothelial cell",
                "Eosinophil",
                "Epithelial cell",
                "Fibroblast",
                "Fibroblast-like synoviocyte",
                "Follicular dendritic cell",
                "Kupffer cell",
                "Langerhans cell",
                "Lymphatic endothelial cell",
                "Macrophage",
                "Mast cell",
                "Microglia",
                "Monocyte",
                "Natural killer cell",
                "Neutrophil",
                "Osteoblast",
                "Osteoclast",
                "Pericyte",
                "Plasmacytoid dendritic cell",
                "Schwann cell",
                "T cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage",
            "B cell",
            "Langerhans cell",
            "Follicular dendritic cell",
            "Plasmacytoid dendritic cell (pDC)",
            "Microglia",
            "Kupffer cell",
            "Osteoclast",
            "Monocyte-derived dendritic cell",
            "Interdigitating dendritic cell",
            "CD1c+ dendritic cell",
            "CD141+ dendritic cell",
            "Skin dendritic cell",
            "Intestinal dendritic cell",
            "Neural dendritic cell",
            "Peripheral blood dendritic cell",
            "Alveolar macrophage",
            "Peritoneal macrophage",
            "Hepatic macrophage",
            "Splenic macrophage",
            "Lung dendritic cell",
            "DC-SIGN+ dendritic cell",
            "Migratory dendritic cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage",
                "B cell",
                "Langerhans cell",
                "Follicular dendritic cell",
                "Plasmacytoid dendritic cell (pDC)",
                "Microglia",
                "Kupffer cell",
                "Osteoclast",
                "Monocyte-derived dendritic cell",
                "Interdigitating dendritic cell",
                "CD1c+ dendritic cell",
                "CD141+ dendritic cell",
                "Skin dendritic cell",
                "Intestinal dendritic cell",
                "Neural dendritic cell",
                "Peripheral blood dendritic cell",
                "Alveolar macrophage",
                "Peritoneal macrophage",
                "Hepatic macrophage",
                "Splenic macrophage",
                "Lung dendritic cell",
                "DC-SIGN+ dendritic cell",
                "Migratory dendritic cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "B cell",
                "CD141+ dendritic cell",
                "CD1c+ dendritic cell",
                "DC-SIGN+ dendritic cell",
                "Dendritic cell (DC)",
                "Follicular dendritic cell",
                "Hepatic macrophage",
                "Interdigitating dendritic cell",
                "Intestinal dendritic cell",
                "Kupffer cell",
                "Langerhans cell",
                "Lung dendritic cell",
                "Macrophage",
                "Microglia",
                "Migratory dendritic cell",
                "Monocyte-derived dendritic cell",
                "Neural dendritic cell",
                "Osteoclast",
                "Peripheral blood dendritic cell",
                "Peritoneal macrophage",
                "Plasmacytoid dendritic cell (pDC)",
                "Skin dendritic cell",
                "Splenic macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage",
            "B cell",
            "Langerhans cell",
            "Monocyte",
            "Follicular dendritic cell (FDC)",
            "Kupffer cell",
            "Microglia",
            "Alveolar macrophage",
            "Plasmacytoid dendritic cell (pDC)",
            "Interdigitating dendritic cell",
            "Conventional dendritic cell (cDC)",
            "Myeloid dendritic cell (mDC)",
            "Osteoclast",
            "Sinus histiocyte",
            "Epithelial cell",
            "Fibroblast",
            "Endothelial cell",
            "Thymic epithelial cell",
            "Mast cell",
            "Neutrophil",
            "Natural killer cell (NK cell)",
            "Mesenchymal stem cell (MSC)",
            "\u03b3\u03b4 T cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage",
                "B cell",
                "Langerhans cell",
                "Monocyte",
                "Follicular dendritic cell (FDC)",
                "Kupffer cell",
                "Microglia",
                "Alveolar macrophage",
                "Plasmacytoid dendritic cell (pDC)",
                "Interdigitating dendritic cell",
                "Conventional dendritic cell (cDC)",
                "Myeloid dendritic cell (mDC)",
                "Osteoclast",
                "Sinus histiocyte",
                "Epithelial cell",
                "Fibroblast",
                "Endothelial cell",
                "Thymic epithelial cell",
                "Mast cell",
                "Neutrophil",
                "Natural killer cell (NK cell)",
                "Mesenchymal stem cell (MSC)",
                "\u03b3\u03b4 T cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "B cell",
                "Conventional dendritic cell (cDC)",
                "Dendritic cell (DC)",
                "Endothelial cell",
                "Epithelial cell",
                "Fibroblast",
                "Follicular dendritic cell (FDC)",
                "Interdigitating dendritic cell",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage",
                "Mast cell",
                "Mesenchymal stem cell (MSC)",
                "Microglia",
                "Monocyte",
                "Myeloid dendritic cell (mDC)",
                "Natural killer cell (NK cell)",
                "Neutrophil",
                "Osteoclast",
                "Plasmacytoid dendritic cell (pDC)",
                "Sinus histiocyte",
                "Thymic epithelial cell",
                "\u03b3\u03b4 T cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage",
            "B cell",
            "Monocyte",
            "Langerhans cell",
            "Interdigitating dendritic cell (IDC)",
            "Follicular dendritic cell (FDC)",
            "Plasmacytoid dendritic cell (pDC)",
            "Myeloid dendritic cell (mDC)",
            "Microglia",
            "Kupffer cell",
            "Alveolar macrophage",
            "Peritoneal macrophage",
            "Osteoclast",
            "Epithelioid cell",
            "Multinucleated giant cell",
            "Veiled cell",
            "Interstitial dendritic cell",
            "Dermal dendritic cell",
            "Thymic dendritic cell",
            "Splenic dendritic cell",
            "Lymph node dendritic cell",
            "Intestinal dendritic cell",
            "Liver sinusoidal endothelial cell (LSEC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage",
                "B cell",
                "Monocyte",
                "Langerhans cell",
                "Interdigitating dendritic cell (IDC)",
                "Follicular dendritic cell (FDC)",
                "Plasmacytoid dendritic cell (pDC)",
                "Myeloid dendritic cell (mDC)",
                "Microglia",
                "Kupffer cell",
                "Alveolar macrophage",
                "Peritoneal macrophage",
                "Osteoclast",
                "Epithelioid cell",
                "Multinucleated giant cell",
                "Veiled cell",
                "Interstitial dendritic cell",
                "Dermal dendritic cell",
                "Thymic dendritic cell",
                "Splenic dendritic cell",
                "Lymph node dendritic cell",
                "Intestinal dendritic cell",
                "Liver sinusoidal endothelial cell (LSEC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "B cell",
                "Dendritic cell (DC)",
                "Dermal dendritic cell",
                "Epithelioid cell",
                "Follicular dendritic cell (FDC)",
                "Interdigitating dendritic cell (IDC)",
                "Interstitial dendritic cell",
                "Intestinal dendritic cell",
                "Kupffer cell",
                "Langerhans cell",
                "Liver sinusoidal endothelial cell (LSEC)",
                "Lymph node dendritic cell",
                "Macrophage",
                "Microglia",
                "Monocyte",
                "Multinucleated giant cell",
                "Myeloid dendritic cell (mDC)",
                "Osteoclast",
                "Peritoneal macrophage",
                "Plasmacytoid dendritic cell (pDC)",
                "Splenic dendritic cell",
                "Thymic dendritic cell",
                "Veiled cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic Cell (DC)",
            "Macrophage",
            "B Cell",
            "Langerhans Cell",
            "Monocyte",
            "Follicular Dendritic Cell (FDC)",
            "Thymic Epithelial Cell",
            "Kupffer Cell",
            "Microglia",
            "Osteoclast",
            "Endothelial Cell",
            "Fibroblast",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Mast Cell",
            "Natural Killer Cell (NK Cell)",
            "Gamma Delta T Cell (\u03b3\u03b4 T Cell)",
            "Mucosal Lymphoid Cell",
            "Hepatocyte",
            "Keratinocyte",
            "Mesangial Cell",
            "Retinal Pigment Epithelial Cell",
            "Adipocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic Cell (DC)",
                "Macrophage",
                "B Cell",
                "Langerhans Cell",
                "Monocyte",
                "Follicular Dendritic Cell (FDC)",
                "Thymic Epithelial Cell",
                "Kupffer Cell",
                "Microglia",
                "Osteoclast",
                "Endothelial Cell",
                "Fibroblast",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Mast Cell",
                "Natural Killer Cell (NK Cell)",
                "Gamma Delta T Cell (\u03b3\u03b4 T Cell)",
                "Mucosal Lymphoid Cell",
                "Hepatocyte",
                "Keratinocyte",
                "Mesangial Cell",
                "Retinal Pigment Epithelial Cell",
                "Adipocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "B Cell",
                "Basophil",
                "Dendritic Cell (DC)",
                "Endothelial Cell",
                "Eosinophil",
                "Fibroblast",
                "Follicular Dendritic Cell (FDC)",
                "Gamma Delta T Cell (\u03b3\u03b4 T Cell)",
                "Hepatocyte",
                "Keratinocyte",
                "Kupffer Cell",
                "Langerhans Cell",
                "Macrophage",
                "Mast Cell",
                "Mesangial Cell",
                "Microglia",
                "Monocyte",
                "Mucosal Lymphoid Cell",
                "Natural Killer Cell (NK Cell)",
                "Neutrophil",
                "Osteoclast",
                "Retinal Pigment Epithelial Cell",
                "Thymic Epithelial Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic Cell (DC)",
            "Macrophage (M\u03c6)",
            "B Lymphocyte (B Cell)",
            "Langerhans Cell (LC)",
            "Interdigitating Dendritic Cell (IDC)",
            "Follicular Dendritic Cell (FDC)",
            "Monocyte (Mo)",
            "Microglia (MG)",
            "Kupffer Cell (KC)",
            "Alveolar Macrophage (AM)",
            "Osteoclast (OC)",
            "Myeloid Dendritic Cell (mDC)",
            "Plasmacytoid Dendritic Cell (pDC)",
            "Intestinal Epithelial Cell (IEC)",
            "Thymic Epithelial Cell (TEC)",
            "Glomerular Mesangial Cell (GMC)",
            "Retinal Pigment Epithelial Cell (RPEC)",
            "Liver Sinusoidal Endothelial Cell (LSEC)",
            "Endothelial Cell (EC)",
            "Fibroblast (Fb)",
            "Astrocyte (AC)",
            "Microvascular Pericyte (MP)",
            "Adipocyte (Ad)",
            "Keratinocyte (KC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic Cell (DC)",
                "Macrophage (M\u03d5)",
                "B Lymphocyte (B Cell)",
                "Langerhans Cell (LC)",
                "Interdigitating Dendritic Cell (IDC)",
                "Follicular Dendritic Cell (FDC)",
                "Monocyte (Mo)",
                "Microglia (MG)",
                "Kupffer Cell (KC)",
                "Alveolar Macrophage (AM)",
                "Osteoclast (OC)",
                "Myeloid Dendritic Cell (mDC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Intestinal Epithelial Cell (IEC)",
                "Thymic Epithelial Cell (TEC)",
                "Glomerular Mesangial Cell (GMC)",
                "Retinal Pigment Epithelial Cell (RPEC)",
                "Liver Sinusoidal Endothelial Cell (LSEC)",
                "Endothelial Cell (EC)",
                "Fibroblast (Fb)",
                "Astrocyte (AC)",
                "Microvascular Pericyte (MP)",
                "Adipocyte (Ad)",
                "Keratinocyte (KC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (Ad)",
                "Alveolar Macrophage (AM)",
                "Astrocyte (AC)",
                "B Lymphocyte (B Cell)",
                "Dendritic Cell (DC)",
                "Endothelial Cell (EC)",
                "Fibroblast (Fb)",
                "Follicular Dendritic Cell (FDC)",
                "Glomerular Mesangial Cell (GMC)",
                "Interdigitating Dendritic Cell (IDC)",
                "Intestinal Epithelial Cell (IEC)",
                "Keratinocyte (KC)",
                "Kupffer Cell (KC)",
                "Langerhans Cell (LC)",
                "Liver Sinusoidal Endothelial Cell (LSEC)",
                "Macrophage (M\u03c6)",
                "Microglia (MG)",
                "Microvascular Pericyte (MP)",
                "Monocyte (Mo)",
                "Myeloid Dendritic Cell (mDC)",
                "Osteoclast (OC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Retinal Pigment Epithelial Cell (RPEC)",
                "Thymic Epithelial Cell (TEC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cells (DCs) (DC)",
            "Macrophages (M\u03a6)",
            "Monocytes (Mo)",
            "Langerhans cells (LC)",
            "Follicular dendritic cells (FDC)",
            "Interdigitating dendritic cells (IDC)",
            "Plasmacytoid dendritic cells (pDC)",
            "M2 macrophages",
            "M1 macrophages",
            "Tumor-associated macrophages (TAM)",
            "Tumor-infiltrating macrophages (TIM)",
            "Microglia",
            "Osteoclasts",
            "Kupffer cells",
            "Alveolar macrophages",
            "Spleen macrophages",
            "Peritoneal macrophages",
            "Liver sinusoidal macrophages",
            "Bone marrow-derived macrophages",
            "Blood-borne macrophages",
            "Splenic dendritic cells",
            "Lymph node dendritic cells",
            "Peyer's patch dendritic cells",
            "Intestinal lamina propria dendritic cells",
            "Skin dendritic cells"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cells (DCs) (DC)",
                "Macrophages (M\u03a6)",
                "Monocytes (Mo)",
                "Langerhans cells (LC)",
                "Follicular dendritic cells (FDC)",
                "Interdigitating dendritic cells (IDC)",
                "Plasmacytoid dendritic cells (pDC)",
                "M2 macrophages",
                "M1 macrophages",
                "Tumor-associated macrophages (TAM)",
                "Tumor-infiltrating macrophages (TIM)",
                "Microglia",
                "Osteoclasts",
                "Kupffer cells",
                "Alveolar macrophages",
                "Spleen macrophages",
                "Peritoneal macrophages",
                "Liver sinusoidal macrophages",
                "Bone marrow-derived macrophages",
                "Blood-borne macrophages",
                "Splenic dendritic cells",
                "Lymph node dendritic cells",
                "Peyer's patch dendritic cells",
                "Intestinal lamina propria dendritic cells"
            ],
            "mismatches": [
                "Skin dendritic cells"
            ],
            "true_referents": [
                "Alveolar macrophages",
                "Blood-borne macrophages",
                "Bone marrow-derived macrophages",
                "Dendritic cells (DCs) (DC)",
                "Follicular dendritic cells (FDC)",
                "Interdigitating dendritic cells (IDC)",
                "Intestinal lamina propria dendritic cells",
                "Kupffer cells",
                "Langerhans cells (LC)",
                "Liver sinusoidal macrophages",
                "Lymph node dendritic cells",
                "M1 macrophages",
                "M2 macrophages",
                "Macrophages (M\u03a6)",
                "Microglia",
                "Monocytes (Mo)",
                "Osteoclasts",
                "Peritoneal macrophages",
                "Peyer's patch dendritic cells",
                "Plasmacytoid dendritic cells (pDC)",
                "Spleen macrophages",
                "Splenic dendritic cells",
                "Tumor-associated macrophages (TAM)",
                "Tumor-infiltrating macrophages (TIM)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "Dendritic cell (DC)",
            "Macrophage (M\u03c6)",
            "B cell",
            "Langerhans cell",
            "Kupffer cell",
            "Microglia",
            "Follicular dendritic cell (FDC)",
            "Interdigitating dendritic cell (IDC)",
            "Myeloid dendritic cell (mDC)",
            "Plasmacytoid dendritic cell (pDC)",
            "Monocyte",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Thymic epithelial cell",
            "Epidermal cell",
            "Endothelial cell",
            " Fibroblast",
            "Osteoclast",
            "Chondrocyte",
            "Keratinocyte",
            "Adipocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cell (DC)",
                "Macrophage (M\u03d5)",
                "B cell",
                "Langerhans cell",
                "Kupffer cell",
                "Microglia",
                "Follicular dendritic cell (FDC)",
                "Interdigitating dendritic cell (IDC)",
                "Myeloid dendritic cell (mDC)",
                "Plasmacytoid dendritic cell (pDC)",
                "Monocyte",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Thymic epithelial cell",
                "Epidermal cell",
                "Endothelial cell",
                " Fibroblast",
                "Osteoclast",
                "Chondrocyte",
                "Keratinocyte",
                "Adipocyte"
            ],
            "mismatches": [],
            "true_referents": [
                " Fibroblast",
                "Adipocyte",
                "B cell",
                "Basophil",
                "Chondrocyte",
                "Dendritic cell (DC)",
                "Endothelial cell",
                "Eosinophil",
                "Epidermal cell",
                "Follicular dendritic cell (FDC)",
                "Interdigitating dendritic cell (IDC)",
                "Keratinocyte",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage (M\u03c6)",
                "Mast cell",
                "Microglia",
                "Monocyte",
                "Myeloid dendritic cell (mDC)",
                "Neutrophil",
                "Osteoclast",
                "Plasmacytoid dendritic cell (pDC)",
                "Thymic epithelial cell"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "antigen-presenting cell",
        "domain": "biology",
        "response": [
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)",
            "antigen-presenting cell (APC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "antigen-presenting cell (APC)"
            ],
            "mismatches": [],
            "true_referents": [
                "antigen-presenting cell (APC)"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]