[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage",
            "Dendritic cell",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Alveolar macrophage",
            "Kupffer cell",
            "Microglia",
            "Langerhans cell",
            "Histiocyte",
            "Osteoclast",
            "Zebra fish macrophage",
            "Plasmodium falciparum infected red blood cell",
            "Drosophila melanogaster hemocyte",
            "C. elegans phagocytic cell",
            "Amoeba",
            "Dictyostelium discoideum",
            "Entamoeba histolytica",
            "Leishmania donovani amastigote-containing macrophage",
            "Mycobacterium tuberculosis-infected macrophage",
            "Cryptococcus neoformans-infected macrophage",
            "Pseudomonas aeruginosa-infected macrophage",
            "Escherichia coli-infected neutrophil"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage",
                "Dendritic cell",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Alveolar macrophage",
                "Kupffer cell",
                "Microglia",
                "Langerhans cell",
                "Histiocyte",
                "Osteoclast",
                "Zebra fish macrophage",
                "Plasmodium falciparum infected red blood cell",
                "Drosophila melanogaster hemocyte",
                "C. elegans phagocytic cell",
                "Amoeba",
                "Dictyostelium discoideum",
                "Entamoeba histolytica",
                "Leishmania donovani amastigote-containing macrophage",
                "Mycobacterium tuberculosis-infected macrophage",
                "Cryptococcus neoformans-infected macrophage",
                "Pseudomonas aeruginosa-infected macrophage",
                "Escherichia coli-infected neutrophil"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Amoeba",
                "Basophil",
                "C. elegans phagocytic cell",
                "Cryptococcus neoformans-infected macrophage",
                "Dendritic cell",
                "Dictyostelium discoideum",
                "Drosophila melanogaster hemocyte",
                "Entamoeba histolytica",
                "Eosinophil",
                "Escherichia coli-infected neutrophil",
                "Histiocyte",
                "Kupffer cell",
                "Langerhans cell",
                "Leishmania donovani amastigote-containing macrophage",
                "Macrophage",
                "Mast cell",
                "Microglia",
                "Mycobacterium tuberculosis-infected macrophage",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Plasmodium falciparum infected red blood cell",
                "Pseudomonas aeruginosa-infected macrophage",
                "Zebra fish macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage",
            "Monocyte",
            "Dendritic cell",
            "Eosinophil",
            "Basophil",
            "Microglia",
            "Kupffer cell",
            "Histiocyte",
            "Osteoclast",
            "Follicular dendritic cell",
            "Langerhans cell",
            "Neutrophil granulocyte",
            "Alveolar macrophage",
            "Splenic macrophage",
            "Peritoneal macrophage",
            "Mesangial cell",
            "Histiocytic sarcoma cell",
            "Sinusoidal endothelial cell",
            "Epithelioid cell",
            "Mast cell",
            "Natural killer cell",
            "Lymphocyte",
            "Neutrophil extracellular trap (NET)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage",
                "Monocyte",
                "Dendritic cell",
                "Eosinophil",
                "Basophil",
                "Microglia",
                "Kupffer cell",
                "Histiocyte",
                "Osteoclast",
                "Follicular dendritic cell",
                "Langerhans cell",
                "Neutrophil granulocyte",
                "Alveolar macrophage",
                "Splenic macrophage",
                "Peritoneal macrophage",
                "Mesangial cell",
                "Histiocytic sarcoma cell",
                "Sinusoidal endothelial cell",
                "Epithelioid cell",
                "Mast cell",
                "Natural killer cell",
                "Lymphocyte",
                "Neutrophil extracellular trap (NET)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Basophil",
                "Dendritic cell",
                "Eosinophil",
                "Epithelioid cell",
                "Follicular dendritic cell",
                "Histiocyte",
                "Histiocytic sarcoma cell",
                "Kupffer cell",
                "Langerhans cell",
                "Lymphocyte",
                "Macrophage",
                "Mast cell",
                "Mesangial cell",
                "Microglia",
                "Monocyte",
                "Natural killer cell",
                "Neutrophil (PMN)",
                "Neutrophil extracellular trap (NET)",
                "Neutrophil granulocyte",
                "Osteoclast",
                "Peritoneal macrophage",
                "Sinusoidal endothelial cell",
                "Splenic macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage",
            "Monocyte",
            "Eosinophil",
            "Basophil",
            "Dendritic Cell",
            "Mast Cell",
            "Kupffer Cell (Liver Macrophage)",
            "Alveolar Macrophage",
            "Microglia",
            "Histiocyte",
            "Langerhans Cell",
            "Osteoclast",
            "Microfold Cell (M Cell)",
            "Giant Cell",
            "Epithelioid Cell",
            "Hoechst Cell",
            "Foam Cell",
            "Dust Cell",
            "Tissue Macrophage",
            "Peritoneal Macrophage",
            "Splenic Macrophage",
            "Bone Marrow Macrophage",
            "Hepatic Stellate Cell (Ito Cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage",
                "Monocyte",
                "Eosinophil",
                "Basophil",
                "Dendritic Cell",
                "Mast Cell",
                "Kupffer Cell (Liver Macrophage)",
                "Alveolar Macrophage",
                "Microglia",
                "Histiocyte",
                "Langerhans Cell",
                "Osteoclast",
                "Microfold Cell (M Cell)",
                "Giant Cell",
                "Epithelioid Cell",
                "Hoechst Cell",
                "Foam Cell",
                "Dust Cell",
                "Tissue Macrophage",
                "Peritoneal Macrophage",
                "Splenic Macrophage",
                "Bone Marrow Macrophage",
                "Hepatic Stellate Cell (Ito Cell)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage",
                "Basophil",
                "Bone Marrow Macrophage",
                "Dendritic Cell",
                "Dust Cell",
                "Eosinophil",
                "Epithelioid Cell",
                "Foam Cell",
                "Giant Cell",
                "Hepatic Stellate Cell (Ito Cell)",
                "Histiocyte",
                "Hoechst Cell",
                "Kupffer Cell (Liver Macrophage)",
                "Langerhans Cell",
                "Macrophage",
                "Mast Cell",
                "Microfold Cell (M Cell)",
                "Microglia",
                "Monocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Peritoneal Macrophage",
                "Splenic Macrophage",
                "Tissue Macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage (M\u03a6)",
            "Dendritic Cell (DC)",
            "Monocyte",
            "Eosinophil",
            "Basophil",
            "Mast Cell",
            "Kupffer Cell (KC)",
            "Alveolar Macrophage",
            "Microglial Cell",
            "Peritoneal Macrophage",
            "Osteoclast",
            "Splenic Macrophage",
            "Histiocyte",
            "Langerhans Cell",
            "Fibroblast (under certain conditions)",
            "Natural Killer Cell (NK cell - limited phagocytosis)",
            "B Cell (antibody-mediated phagocytosis)",
            "T Cell (limited phagocytosis)",
            "Circulating Precursor Cell (granulocyte-macrophage progenitor)",
            "Bone Marrow Derived Macrophage",
            "M1 Macrophage",
            "M2 Macrophage",
            "Foam Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage (M\u03a6)",
                "Dendritic Cell (DC)",
                "Monocyte",
                "Eosinophil",
                "Basophil",
                "Mast Cell",
                "Kupffer Cell (KC)",
                "Alveolar Macrophage",
                "Microglial Cell",
                "Peritoneal Macrophage",
                "Osteoclast",
                "Splenic Macrophage",
                "Histiocyte",
                "Langerhans Cell",
                "Fibroblast (under certain conditions)",
                "Natural Killer Cell (NK cell - limited phagocytosis)",
                "B Cell (antibody-mediated phagocytosis)",
                "T Cell (limited phagocytosis)",
                "Circulating Precursor Cell (granulocyte-macrophage progenitor)",
                "Bone Marrow Derived Macrophage",
                "M1 Macrophage",
                "M2 Macrophage",
                "Foam Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage",
                "B Cell (antibody-mediated phagocytosis)",
                "Basophil",
                "Bone Marrow Derived Macrophage",
                "Circulating Precursor Cell (granulocyte-macrophage progenitor)",
                "Dendritic Cell (DC)",
                "Eosinophil",
                "Fibroblast (under certain conditions)",
                "Foam Cell",
                "Histiocyte",
                "Kupffer Cell (KC)",
                "Langerhans Cell",
                "M1 Macrophage",
                "M2 Macrophage",
                "Macrophage (M\u03a6)",
                "Mast Cell",
                "Microglial Cell",
                "Monocyte",
                "Natural Killer Cell (NK cell - limited phagocytosis)",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Peritoneal Macrophage",
                "Splenic Macrophage",
                "T Cell (limited phagocytosis)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage",
            "Monocyte",
            "Dendritic cell (DC)",
            "Kupffer cell",
            "Alveolar macrophage",
            "Microglia",
            "Osteoclast",
            "Eosinophil",
            "Basophil",
            "Langerhans cell",
            "Peritoneal macrophage",
            "Splenic macrophage",
            "Histiocyte",
            "Foam cell",
            "Giant cell",
            "M1 macrophage",
            "M2 macrophage",
            "Tingible body macrophage",
            "Epithelioid cell",
            "Serosal macrophage",
            "Adipose tissue macrophage",
            "Pigment cell",
            "Intestinal macrophage"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage",
                "Monocyte",
                "Dendritic cell (DC)",
                "Kupffer cell",
                "Alveolar macrophage",
                "Microglia",
                "Osteoclast",
                "Eosinophil",
                "Basophil",
                "Langerhans cell",
                "Peritoneal macrophage",
                "Splenic macrophage",
                "Histiocyte",
                "Foam cell",
                "Giant cell",
                "M1 macrophage",
                "M2 macrophage",
                "Tingible body macrophage",
                "Epithelioid cell",
                "Serosal macrophage",
                "Adipose tissue macrophage",
                "Pigment cell",
                "Intestinal macrophage"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipose tissue macrophage",
                "Alveolar macrophage",
                "Basophil",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Epithelioid cell",
                "Foam cell",
                "Giant cell",
                "Histiocyte",
                "Intestinal macrophage",
                "Kupffer cell",
                "Langerhans cell",
                "M1 macrophage",
                "M2 macrophage",
                "Macrophage",
                "Microglia",
                "Monocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Peritoneal macrophage",
                "Pigment cell",
                "Serosal macrophage",
                "Splenic macrophage",
                "Tingible body macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage (M\u03a6)",
            "Dendritic cell (DC)",
            "Monocyte (Mo)",
            "Eosinophil (Eo)",
            "Basophil (Ba)",
            "Kupffer cell (KC)",
            "Microglia (MG)",
            "Alveolar macrophage (AM)",
            "Langerhans cell (LC)",
            "Osteoclast (OC)",
            "Mast cell (MC)",
            "Peritoneal macrophage (PM)",
            "Bone marrow-derived macrophage (BMDM)",
            "Tissue-resident macrophage (TRM)",
            "Foam cell (FC)",
            "Neutrophil extracellular trap (NET)",
            "Giant cell (GC)",
            "Synovial macrophage (SM)",
            "Inflammatory monocyte (IM)",
            "Thymic macrophage (TM)",
            "Tumor-associated macrophage (TAM)",
            "Regulatory macrophage (RM)",
            "Antigen-presenting cell (APC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage (M\u03a6)",
                "Dendritic cell (DC)",
                "Monocyte (Mo)",
                "Eosinophil (Eo)",
                "Basophil (Ba)",
                "Kupffer cell (KC)",
                "Microglia (MG)",
                "Alveolar macrophage (AM)",
                "Langerhans cell (LC)",
                "Osteoclast (OC)",
                "Mast cell (MC)",
                "Peritoneal macrophage (PM)",
                "Bone marrow-derived macrophage (BMDM)",
                "Tissue-resident macrophage (TRM)",
                "Foam cell (FC)",
                "Neutrophil extracellular trap (NET)",
                "Giant cell (GC)",
                "Synovial macrophage (SM)",
                "Inflammatory monocyte (IM)",
                "Thymic macrophage (TM)",
                "Tumor-associated macrophage (TAM)",
                "Regulatory macrophage (RM)",
                "Antigen-presenting cell (APC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage (AM)",
                "Antigen-presenting cell (APC)",
                "Basophil (Ba)",
                "Bone marrow-derived macrophage (BMDM)",
                "Dendritic cell (DC)",
                "Eosinophil (Eo)",
                "Foam cell (FC)",
                "Giant cell (GC)",
                "Inflammatory monocyte (IM)",
                "Kupffer cell (KC)",
                "Langerhans cell (LC)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Microglia (MG)",
                "Monocyte (Mo)",
                "Neutrophil (PMN)",
                "Neutrophil extracellular trap (NET)",
                "Osteoclast (OC)",
                "Peritoneal macrophage (PM)",
                "Regulatory macrophage (RM)",
                "Synovial macrophage (SM)",
                "Thymic macrophage (TM)",
                "Tissue-resident macrophage (TRM)",
                "Tumor-associated macrophage (TAM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophils (PMN)",
            "Macrophages (M\u03a6)",
            "Dendritic Cells (DCs)",
            "Monocytes (MO)",
            "Microglia (MG)",
            "Osteoclasts (OC)",
            "Mast Cells (MC)",
            "Eosinophils (EO)",
            "Basophils (BA)",
            "Kupffer Cells (KC)",
            "Epithelial Cells (EC)",
            "Endothelial Cells (EndoC)",
            "Natural Killer Cells (NK)",
            "Langerhans Cells (LC)",
            "Peritoneal Macrophages (PM)",
            "Alveolar Macrophages (AM)",
            "Interstitial Macrophages (IM)",
            "Resident Macrophages (RM)",
            "Inflammatory Macrophages (InfM)",
            "Mucosal Macrophages (MM)",
            "Brain Microglia (BMG)",
            "Retinal Microglia (RMG)",
            "Splenic Macrophages (SM)",
            "Bone Marrow Macrophages (BMM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophils (PMN)",
                "Macrophages (M\u03a6)",
                "Dendritic Cells (DCs)",
                "Monocytes (MO)",
                "Microglia (MG)",
                "Osteoclasts (OC)",
                "Mast Cells (MC)",
                "Eosinophils (EO)",
                "Basophils (BA)",
                "Kupffer Cells (KC)",
                "Epithelial Cells (EC)",
                "Endothelial Cells (EndoC)",
                "Natural Killer Cells (NK)",
                "Langerhans Cells (LC)",
                "Peritoneal Macrophages (PM)",
                "Alveolar Macrophages (AM)",
                "Interstitial Macrophages (IM)",
                "Resident Macrophages (RM)",
                "Inflammatory Macrophages (InfM)",
                "Mucosal Macrophages (MM)",
                "Brain Microglia (BMG)",
                "Retinal Microglia (RMG)",
                "Splenic Macrophages (SM)",
                "Bone Marrow Macrophages (BMM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophages (AM)",
                "Basophils (BA)",
                "Bone Marrow Macrophages (BMM)",
                "Brain Microglia (BMG)",
                "Dendritic Cells (DCs)",
                "Endothelial Cells (EndoC)",
                "Eosinophils (EO)",
                "Epithelial Cells (EC)",
                "Inflammatory Macrophages (InfM)",
                "Interstitial Macrophages (IM)",
                "Kupffer Cells (KC)",
                "Langerhans Cells (LC)",
                "Macrophages (M\u03a6)",
                "Mast Cells (MC)",
                "Microglia (MG)",
                "Monocytes (MO)",
                "Mucosal Macrophages (MM)",
                "Natural Killer Cells (NK)",
                "Neutrophils (PMN)",
                "Osteoclasts (OC)",
                "Peritoneal Macrophages (PM)",
                "Resident Macrophages (RM)",
                "Retinal Microglia (RMG)",
                "Splenic Macrophages (SM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil",
            "Macrophage",
            "Dendritic cell",
            "Monocyte",
            "Microglia",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Kupffer cell",
            "Osteoclast",
            "Langerhans cell",
            "Alveolar macrophage",
            "Natural killer cell",
            "Peritoneal macrophage",
            "Splenic macrophage",
            "Hepatic macrophage",
            "Intestinal macrophage",
            "Microphage",
            "Pulmonary macrophage",
            "Mononuclear phagocyte",
            "Amoebocyte",
            "Granulocyte",
            "Phagocytic leukocyte",
            "Histiocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil",
                "Macrophage",
                "Dendritic cell",
                "Monocyte",
                "Microglia",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Kupffer cell",
                "Osteoclast",
                "Langerhans cell",
                "Alveolar macrophage",
                "Natural killer cell",
                "Peritoneal macrophage",
                "Splenic macrophage",
                "Hepatic macrophage",
                "Intestinal macrophage",
                "Microphage",
                "Pulmonary macrophage",
                "Mononuclear phagocyte",
                "Amoebocyte",
                "Granulocyte",
                "Phagocytic leukocyte",
                "Histiocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Amoebocyte",
                "Basophil",
                "Dendritic cell",
                "Eosinophil",
                "Granulocyte",
                "Hepatic macrophage",
                "Histiocyte",
                "Intestinal macrophage",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage",
                "Mast cell",
                "Microglia",
                "Microphage",
                "Monocyte",
                "Mononuclear phagocyte",
                "Natural killer cell",
                "Neutrophil",
                "Osteoclast",
                "Peritoneal macrophage",
                "Phagocytic leukocyte",
                "Pulmonary macrophage",
                "Splenic macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Macrophage (M\u03c6)",
            "Neutrophil (PMN)",
            "Dendritic Cell (DC)",
            "Monocyte",
            "Microglia",
            "Kupffer Cell",
            "Osteoclast",
            "Eosinophil",
            "Langerhans Cell",
            "Alveolar Macrophage",
            "Splenic Macrophage",
            "Reticular Cell",
            "Follicular Dendritic Cell",
            "Histiocyte",
            "Giant Cell",
            "Peritoneal Macrophage",
            "Bone Marrow Macrophage",
            "Intestinal Macrophage",
            "Sertoli Cell",
            "Astrocyte",
            "Paneth Cell",
            "Resident Macrophage",
            "Liver Macrophage",
            "Resident Dendritic Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Macrophage (M\u03c6)",
                "Neutrophil (PMN)",
                "Dendritic Cell (DC)",
                "Monocyte",
                "Microglia",
                "Kupffer Cell",
                "Osteoclast",
                "Eosinophil",
                "Langerhans Cell",
                "Alveolar Macrophage",
                "Splenic Macrophage",
                "Reticular Cell",
                "Follicular Dendritic Cell",
                "Histiocyte",
                "Giant Cell",
                "Peritoneal Macrophage",
                "Bone Marrow Macrophage",
                "Intestinal Macrophage",
                "Sertoli Cell",
                "Astrocyte",
                "Paneth Cell",
                "Resident Macrophage",
                "Liver Macrophage",
                "Resident Dendritic Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage",
                "Astrocyte",
                "Bone Marrow Macrophage",
                "Dendritic Cell (DC)",
                "Eosinophil",
                "Follicular Dendritic Cell",
                "Giant Cell",
                "Histiocyte",
                "Intestinal Macrophage",
                "Kupffer Cell",
                "Langerhans Cell",
                "Liver Macrophage",
                "Macrophage (M\u03c6)",
                "Microglia",
                "Monocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Paneth Cell",
                "Peritoneal Macrophage",
                "Resident Dendritic Cell",
                "Resident Macrophage",
                "Reticular Cell",
                "Sertoli Cell",
                "Splenic Macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage",
            "Monocyte",
            "Dendritic cell (DC)",
            "Eosinophil",
            "Mast cell",
            "Natural killer cell (NK cell)",
            "Kupffer cell",
            "Microglial cell",
            "Osteoclast",
            "Alveolar macrophage",
            "Langerhans cell",
            "Histiocyte",
            "Epithelioid cell",
            "Foam cell",
            "Multinucleated giant cell",
            "Tingible body macrophage",
            "Sinus histiocyte",
            "Perivascular macrophage",
            "Mesangial cell",
            "Microglia-like cell",
            "Hemocyte",
            "Amoebocyte",
            "Plasmatocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage",
                "Monocyte",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Mast cell",
                "Natural killer cell (NK cell)",
                "Kupffer cell",
                "Microglial cell",
                "Osteoclast",
                "Alveolar macrophage",
                "Langerhans cell",
                "Histiocyte",
                "Epithelioid cell",
                "Foam cell",
                "Multinucleated giant cell",
                "Tingible body macrophage",
                "Sinus histiocyte",
                "Perivascular macrophage",
                "Mesangial cell"
            ],
            "mismatches": [
                "Microglia-like cell",
                "Hemocyte",
                "Amoebocyte",
                "Plasmatocyte"
            ],
            "true_referents": [
                "Alveolar macrophage",
                "Amoebocyte",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Epithelioid cell",
                "Foam cell",
                "Hemocyte",
                "Histiocyte",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage",
                "Mast cell",
                "Mesangial cell",
                "Microglia-like cell",
                "Microglial cell",
                "Monocyte",
                "Multinucleated giant cell",
                "Natural killer cell (NK cell)",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Perivascular macrophage",
                "Plasmatocyte",
                "Sinus histiocyte",
                "Tingible body macrophage"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage (M\u03c6)",
            "Dendritic cell (DC)",
            "Monocyte",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Kupffer cell",
            "Alveolar macrophage (AM)",
            "Microglia",
            "Osteoclast",
            "Epithelioid cell",
            "Giant cell",
            "Langerhans cell",
            "Histiocyte",
            "Reticular cell",
            "Sinusoidal endothelial cell",
            "Dust cell",
            "Adipose tissue macrophage (ATM)",
            "Peritoneal macrophage",
            "Thymus macrophage",
            "Splenic macrophage",
            "Bone marrow macrophage",
            "Lymph node macrophage"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage (M\u03c6)",
                "Dendritic cell (DC)",
                "Monocyte",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Kupffer cell",
                "Alveolar macrophage (AM)",
                "Microglia",
                "Osteoclast",
                "Epithelioid cell",
                "Giant cell",
                "Langerhans cell",
                "Histiocyte",
                "Reticular cell",
                "Sinusoidal endothelial cell",
                "Dust cell",
                "Adipose tissue macrophage (ATM)",
                "Peritoneal macrophage",
                "Thymus macrophage",
                "Splenic macrophage",
                "Bone marrow macrophage",
                "Lymph node macrophage"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipose tissue macrophage (ATM)",
                "Alveolar macrophage (AM)",
                "Basophil",
                "Bone marrow macrophage",
                "Dendritic cell (DC)",
                "Dust cell",
                "Eosinophil",
                "Epithelioid cell",
                "Giant cell",
                "Histiocyte",
                "Kupffer cell",
                "Langerhans cell",
                "Lymph node macrophage",
                "Macrophage (M\u03c6)",
                "Mast cell",
                "Microglia",
                "Monocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Peritoneal macrophage",
                "Reticular cell",
                "Sinusoidal endothelial cell",
                "Splenic macrophage",
                "Thymus macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Monocyte",
            "Macrophage",
            "Dendritic Cell",
            "Mast Cell",
            "Basophil",
            "Eosinophil",
            "Microglia (Brain Macrophage)",
            "Kupffer Cell (Liver Macrophage)",
            "Osteoclast (Bone Macrophage)",
            "Alveolar Macrophage (Lung Macrophage)",
            "Langerhans Cell (Skin Macrophage)",
            "Histiocyte",
            "Retinal Pigment Epithelial Cell",
            "Sertoli Cell (Testicular Macrophage)",
            "Natural Killer Cell",
            "Melanophage",
            "Adipocyte (Fat Cell)",
            "Trophoblast Cell",
            "Mesangial Cell (Kidney Macrophage)",
            "Splenocyte",
            "Fibroblast",
            "Epithelioid Cell",
            "Multinucleated Giant Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Monocyte",
                "Macrophage",
                "Dendritic Cell",
                "Mast Cell",
                "Basophil",
                "Eosinophil",
                "Microglia (Brain Macrophage)",
                "Kupffer Cell (Liver Macrophage)",
                "Osteoclast (Bone Macrophage)",
                "Alveolar Macrophage (Lung Macrophage)",
                "Langerhans Cell (Skin Macrophage)",
                "Histiocyte",
                "Retinal Pigment Epithelial Cell",
                "Sertoli Cell (Testicular Macrophage)",
                "Natural Killer Cell",
                "Melanophage",
                "Adipocyte (Fat Cell)",
                "Trophoblast Cell",
                "Mesangial Cell (Kidney Macrophage)",
                "Splenocyte",
                "Fibroblast",
                "Epithelioid Cell",
                "Multinucleated Giant Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (Fat Cell)",
                "Alveolar Macrophage (Lung Macrophage)",
                "Basophil",
                "Dendritic Cell",
                "Eosinophil",
                "Epithelioid Cell",
                "Fibroblast",
                "Histiocyte",
                "Kupffer Cell (Liver Macrophage)",
                "Langerhans Cell (Skin Macrophage)",
                "Macrophage",
                "Mast Cell",
                "Melanophage",
                "Mesangial Cell (Kidney Macrophage)",
                "Microglia (Brain Macrophage)",
                "Monocyte",
                "Multinucleated Giant Cell",
                "Natural Killer Cell",
                "Neutrophil (PMN)",
                "Osteoclast (Bone Macrophage)",
                "Retinal Pigment Epithelial Cell",
                "Sertoli Cell (Testicular Macrophage)",
                "Splenocyte",
                "Trophoblast Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (NEUT)",
            "Monocyte (MONO)",
            "Macrophage (MACRO)",
            "Dendritic Cell (DC)",
            "Microglia (MG)",
            "Kupffer Cell (KC)",
            "Alveolar Macrophage (AM)",
            "Histiocyte (HIST)",
            "Osteoclast (OC)",
            "Mast Cell (MC)",
            "Eosinophil (EOS)",
            "Basophil (BASO)",
            "Langerhans Cell (LC)",
            "Splenic Macrophage (SM)",
            "Peritoneal Macrophage (PM)",
            "Lymph Node Macrophage (LNM)",
            "Bone Marrow Macrophage (BMM)",
            "Thymic Macrophage (TM)",
            "Retinal Microglia (RM)",
            "Intestinal Macrophage (IM)",
            "Kidney Macrophage (KM)",
            "Liver Macrophage (LM)",
            "Skin Macrophage (SM)",
            "Cardiac Macrophage (CM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (NEUT)",
                "Monocyte (MONO)",
                "Macrophage (MACRO)",
                "Dendritic Cell (DC)",
                "Microglia (MG)",
                "Kupffer Cell (KC)",
                "Alveolar Macrophage (AM)",
                "Histiocyte (HIST)",
                "Osteoclast (OC)",
                "Mast Cell (MC)",
                "Eosinophil (EOS)",
                "Basophil (BASO)",
                "Langerhans Cell (LC)",
                "Splenic Macrophage (SM)",
                "Peritoneal Macrophage (PM)",
                "Lymph Node Macrophage (LNM)",
                "Bone Marrow Macrophage (BMM)",
                "Thymic Macrophage (TM)",
                "Retinal Microglia (RM)",
                "Intestinal Macrophage (IM)",
                "Kidney Macrophage (KM)",
                "Liver Macrophage (LM)",
                "Skin Macrophage (SM)",
                "Cardiac Macrophage (CM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage (AM)",
                "Basophil (BASO)",
                "Bone Marrow Macrophage (BMM)",
                "Cardiac Macrophage (CM)",
                "Dendritic Cell (DC)",
                "Eosinophil (EOS)",
                "Histiocyte (HIST)",
                "Intestinal Macrophage (IM)",
                "Kidney Macrophage (KM)",
                "Kupffer Cell (KC)",
                "Langerhans Cell (LC)",
                "Liver Macrophage (LM)",
                "Lymph Node Macrophage (LNM)",
                "Macrophage (MACRO)",
                "Mast Cell (MC)",
                "Microglia (MG)",
                "Monocyte (MONO)",
                "Neutrophil (NEUT)",
                "Osteoclast (OC)",
                "Peritoneal Macrophage (PM)",
                "Retinal Microglia (RM)",
                "Skin Macrophage (SM)",
                "Splenic Macrophage (SM)",
                "Thymic Macrophage (TM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophils (PMNs) (1) in the human immune system",
            "Macrophages (2) in the human immune system",
            "Dendritic cells (3) in the human immune system",
            "Monocytes (4) in the human immune system",
            "Microglia (5) in the central nervous system",
            "Kupffer cells (6) in the liver",
            "Osteoclasts (7) in bone resorption",
            "Epithelioid cells (8) in granulomas",
            "Langhans cells (9) in granulomas",
            "Epithelial cells (10) in the skin",
            "Enterocytes (11) in the gut",
            "Epithelial cells (12) in the respiratory tract",
            "Epithelial cells (13) in the urinary tract",
            "Epithelial cells (14) in the reproductive tract",
            "Microglial cells (15) in the brain",
            "Kupffer cells (16) in the spleen",
            "Alveolar macrophages (17) in the lungs",
            "Pulmonary macrophages (18) in the lungs",
            "Peritoneal macrophages (19) in the peritoneal cavity",
            "Blood monocytes (20) in the blood",
            "Peripheral blood monocytes (21) in the blood",
            "Bone marrow-derived macrophages (22) in the bone marrow",
            "Bone marrow-derived monocytes (23) in the bone marrow",
            "Human macrophages (24) in the human immune system"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophils (PMNs) (1) in the human immune system",
                "Macrophages (2) in the human immune system",
                "Dendritic cells (3) in the human immune system",
                "Monocytes (4) in the human immune system",
                "Microglia (5) in the central nervous system",
                "Kupffer cells (6) in the liver",
                "Osteoclasts (7) in bone resorption",
                "Epithelioid cells (8) in granulomas",
                "Langhans cells (9) in granulomas",
                "Epithelial cells (10) in the skin",
                "Enterocytes (11) in the gut",
                "Epithelial cells (12) in the respiratory tract",
                "Epithelial cells (13) in the urinary tract",
                "Epithelial cells (14) in the reproductive tract",
                "Microglial cells (15) in the brain",
                "Kupffer cells (16) in the spleen",
                "Alveolar macrophages (17) in the lungs",
                "Pulmonary macrophages (18) in the lungs",
                "Peritoneal macrophages (19) in the peritoneal cavity",
                "Blood monocytes (20) in the blood",
                "Peripheral blood monocytes (21) in the blood",
                "Bone marrow-derived macrophages (22) in the bone marrow",
                "Bone marrow-derived monocytes (23) in the bone marrow",
                "Human macrophages (24) in the human immune system"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophages (17) in the lungs",
                "Blood monocytes (20) in the blood",
                "Bone marrow-derived macrophages (22) in the bone marrow",
                "Bone marrow-derived monocytes (23) in the bone marrow",
                "Dendritic cells (3) in the human immune system",
                "Enterocytes (11) in the gut",
                "Epithelial cells (10) in the skin",
                "Epithelial cells (12) in the respiratory tract",
                "Epithelial cells (13) in the urinary tract",
                "Epithelial cells (14) in the reproductive tract",
                "Epithelioid cells (8) in granulomas",
                "Human macrophages (24) in the human immune system",
                "Kupffer cells (16) in the spleen",
                "Kupffer cells (6) in the liver",
                "Langhans cells (9) in granulomas",
                "Macrophages (2) in the human immune system",
                "Microglia (5) in the central nervous system",
                "Microglial cells (15) in the brain",
                "Monocytes (4) in the human immune system",
                "Neutrophils (PMNs) (1) in the human immune system",
                "Osteoclasts (7) in bone resorption",
                "Peripheral blood monocytes (21) in the blood",
                "Peritoneal macrophages (19) in the peritoneal cavity",
                "Pulmonary macrophages (18) in the lungs"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Macrophage (M\u03c6)",
            "Dendritic cell (DC)",
            "Monocyte",
            "Eosinophil",
            "Basophil",
            "Kupffer cell",
            "Histiocyte",
            "Osteoclast",
            "Microglia",
            "Tie2-expressing monocyte (TEM)",
            "CX3CR1-expressing monocyte (CEM)",
            "Ly6C-expressing monocyte (LEM)",
            "M1 macrophage",
            "M2 macrophage",
            "Foam cell",
            "Giant cell",
            "Langhans giant cell",
            "Foreign-body giant cell",
            "Epithelioid cell",
            "Plasma cell",
            "B cell",
            "T cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Macrophage (M\u03c6)",
                "Dendritic cell (DC)",
                "Monocyte",
                "Eosinophil",
                "Basophil",
                "Kupffer cell",
                "Histiocyte",
                "Osteoclast",
                "Microglia",
                "Tie2-expressing monocyte (TEM)",
                "CX3CR1-expressing monocyte (CEM)",
                "Ly6C-expressing monocyte (LEM)",
                "M1 macrophage",
                "M2 macrophage",
                "Foam cell",
                "Giant cell",
                "Langhans giant cell",
                "Foreign-body giant cell",
                "Epithelioid cell",
                "Plasma cell",
                "B cell",
                "T cell"
            ],
            "mismatches": [],
            "true_referents": [
                "B cell",
                "Basophil",
                "CX3CR1-expressing monocyte (CEM)",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Epithelioid cell",
                "Foam cell",
                "Foreign-body giant cell",
                "Giant cell",
                "Histiocyte",
                "Kupffer cell",
                "Langhans giant cell",
                "Ly6C-expressing monocyte (LEM)",
                "M1 macrophage",
                "M2 macrophage",
                "Macrophage (M\u03c6)",
                "Microglia",
                "Monocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Plasma cell",
                "T cell",
                "Tie2-expressing monocyte (TEM)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "phagocyte",
        "domain": "biology",
        "response": [
            {
                "Referent": "Amebocyte",
                "Canonical name": "Amebocyte"
            },
            {
                "Referent": "Amoebocyte",
                "Canonical name": "Amoebocyte"
            },
            {
                "Referent": "Ameloblast",
                "Canonical name": "Ameloblast"
            },
            {
                "Referent": "Ameloblast",
                "Canonical name": "Ameloblast"
            },
            {
                "Referent": "Amelogenin",
                "Canonical name": "Amelogenin"
            },
            {
                "Referent": "Amino acid transporter",
                "Canonical name": "Amino acid transporter"
            },
            {
                "Referent": "Amoebicidal",
                "Canonical name": "Amoebicidal"
            },
            {
                "Referent": "Amoebicidal",
                "Canonical name": "Amoebicidal"
            },
            {
                "Referent": "Amoebiasis",
                "Canonical name": "Amoebiasis"
            },
            {
                "Referent": "Amoeba",
                "Canonical name": "Amoeba"
            },
            {
                "Referent": "Amoebocyte",
                "Canonical name": "Amoebocyte"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            },
            {
                "Referent": "Amoeboid",
                "Canonical name": "Amoeboid"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amebocyte",
                "Amoebocyte",
                "Ameloblast",
                "Amelogenin",
                "Amino acid transporter",
                "Amoebicidal",
                "Amoebiasis",
                "Amoeba",
                "Amoeboid"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Amebocyte\", \"Canonical name\": \"Amebocyte\"}",
                "{\"Referent\": \"Ameloblast\", \"Canonical name\": \"Ameloblast\"}",
                "{\"Referent\": \"Amelogenin\", \"Canonical name\": \"Amelogenin\"}",
                "{\"Referent\": \"Amino acid transporter\", \"Canonical name\": \"Amino acid transporter\"}",
                "{\"Referent\": \"Amoeba\", \"Canonical name\": \"Amoeba\"}",
                "{\"Referent\": \"Amoebiasis\", \"Canonical name\": \"Amoebiasis\"}",
                "{\"Referent\": \"Amoebicidal\", \"Canonical name\": \"Amoebicidal\"}",
                "{\"Referent\": \"Amoebocyte\", \"Canonical name\": \"Amoebocyte\"}",
                "{\"Referent\": \"Amoeboid\", \"Canonical name\": \"Amoeboid\"}"
            ],
            "TP": 9,
            "FP": 0,
            "FN": 0
        }
    }
]