[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "cell (C)",
            "neuron (N)",
            "red blood cell (RBC)",
            "white blood cell (WBC)",
            "sperm cell (SC)",
            "egg cell (EC)",
            "fibroblast (F)",
            "osteocyte (O)",
            "myocyte (M)",
            "keratinocyte (K)",
            "hepatocyte (H)",
            "pancreatic beta cell (PBC)",
            "endothelial cell (E)",
            "macrophage (MAC)",
            "T lymphocyte (TL)",
            "B lymphocyte (BL)",
            "platelet (PLT)",
            "reticulocyte (RT)",
            "basophil (BAS)",
            "eosinophil (EOS)",
            "neutrophil (NEU)",
            "mast cell (MC)",
            "natural killer cell (NK)",
            "stem cell (SC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Erythrocytes",
                "Leukocytes",
                "Fibroblasts",
                "Osteocytes",
                "Keratinocytes",
                "Hepatocytes",
                "Endothelial Cells",
                "Macrophages",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Blood Platelets",
                "Reticulocytes",
                "Basophils",
                "Eosinophils",
                "Neutrophils",
                "Mast Cells",
                "Natural Killer Cells",
                "Stem Cells"
            ],
            "mismatches": [
                "cell (C)",
                "sperm cell (SC)",
                "egg cell (EC)",
                "myocyte (M)",
                "pancreatic beta cell (PBC)",
                "platelet (PLT)",
                "mast cell (MC)"
            ],
            "true_referents": [
                "Adult Stem Cells",
                "B-Lymphocyte Subsets",
                "B-Lymphocytes",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Cardiac Myocytes",
                "Embryonic Germ Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "M Cells",
                "Macrophages",
                "Mast Cells",
                "Motor Neurons",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neurons",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "RAW 264.7 Cells",
                "Reticulocytes",
                "Sperm Head",
                "Spermatocytes",
                "Spermatozoa",
                "Stem Cells",
                "T-Lymphocyte Subsets",
                "T-Lymphocytes",
                "Th1 Cells"
            ],
            "TP": 19,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Human muscle cell (Myocyte)",
            "Human nerve cell (Neuron)",
            "Human red blood cell (Erythrocyte)",
            "Human white blood cell (Leukocyte)",
            "Human skin cell (Keratinocyte)",
            "Human liver cell (Hepatocyte)",
            "Human kidney cell (Nephron)",
            "Human pancreatic cell (Islet cell)",
            "Human intestinal cell (Enterocyte)",
            "Human bone cell (Osteocyte)",
            "Human sperm cell (Spermatozoon)",
            "Human egg cell (Oocyte)",
            "Human blood platelet precursor cell (Megakaryocyte)",
            "Human endothelial cell (Endothelium)",
            "Human fibroblast cell (Fibroblast)",
            "Human adipocyte (Fat cell)",
            "Human cardiac muscle cell (Cardiomyocyte)",
            "Human epithelial cell (Epithelium)",
            "Human astrocyte (Astrocyte)",
            "Human microglia (Microglia)",
            "Human Schwann cell (Schwann cell)",
            "Human oligodendrocyte (Oligodendrocyte)",
            "Human chondrocyte (Chondrocyte)",
            "Human smooth muscle cell (Smooth muscle cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Human nerve cell (Neuron)",
                "Human red blood cell (Erythrocyte)",
                "Human white blood cell (Leukocyte)",
                "Human skin cell (Keratinocyte)",
                "Human liver cell (Hepatocyte)",
                "Human intestinal cell (Enterocyte)",
                "Human bone cell (Osteocyte)",
                "Human egg cell (Oocyte)",
                "Human blood platelet precursor cell (Megakaryocyte)",
                "Human fibroblast cell (Fibroblast)",
                "Human adipocyte (Fat cell)",
                "Human cardiac muscle cell (Cardiomyocyte)",
                "Human astrocyte (Astrocyte)",
                "Human microglia (Microglia)",
                "Human Schwann cell (Schwann cell)",
                "Human chondrocyte (Chondrocyte)"
            ],
            "mismatches": [
                "Human muscle cell (Myocyte)",
                "Human kidney cell (Nephron)",
                "Human pancreatic cell (Islet cell)",
                "Human sperm cell (Spermatozoon)",
                "Human endothelial cell (Endothelium)",
                "Human epithelial cell (Epithelium)",
                "Human oligodendrocyte (Oligodendrocyte)",
                "Human smooth muscle cell (Smooth muscle cell)"
            ],
            "true_referents": [
                "Adipocytes",
                "Astrocytes",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Endothelial Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Keratinocytes",
                "Leukocytes",
                "Madin Darby Canine Kidney Cells",
                "Megakaryocyte Progenitor Cells",
                "Megakaryocytes",
                "Mesangial Cells",
                "Microglia",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Neurites",
                "Neuroepithelial Cells",
                "Neuroglia",
                "Neurons",
                "Neutrophils",
                "Oligodendrocyte Precursor Cells",
                "Oligodendroglia",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Schwann Cells",
                "Skeletal Muscle Satellite Cells",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Sperm Head",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Erythrocyte (Red Blood Cell)",
            "Leukocyte (White Blood Cell)",
            "Thrombocyte (Platelet)",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Lymphocyte",
            "Monocyte",
            "Macrophage",
            "Mast Cell",
            "Dendritic Cell",
            "Keratocyte",
            "Osteocyte",
            "Chondrocyte",
            "Adipocyte",
            "Myocyte",
            "Neurocyte",
            "Hepatocyte",
            "Renal Cell",
            "Pancreatic Cell",
            "Insulinoma Cell",
            "Sperm Cell",
            "Oocyte",
            "Ovum"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Lymphocyte",
                "Monocyte",
                "Macrophage",
                "Mast Cell",
                "Dendritic Cell",
                "Osteocyte",
                "Chondrocyte",
                "Adipocyte",
                "Hepatocyte",
                "Oocyte",
                "Ovum"
            ],
            "mismatches": [
                "Erythrocyte (Red Blood Cell)",
                "Leukocyte (White Blood Cell)",
                "Thrombocyte (Platelet)",
                "Keratocyte",
                "Myocyte",
                "Neurocyte",
                "Renal Cell",
                "Pancreatic Cell",
                "Insulinoma Cell",
                "Sperm Cell"
            ],
            "true_referents": [
                "Adipocytes",
                "Antigen-Presenting Cells",
                "Astrocytes",
                "B-Lymphocytes",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Brown Adipocytes",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Dendritic Cells",
                "Endocrine Cells",
                "Endothelial Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Madin Darby Canine Kidney Cells",
                "Mast Cells",
                "Mesangial Cells",
                "Monocytes",
                "Muscle Cells",
                "Myoblasts",
                "Neuroepithelial Cells",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Sperm Head",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "T-Lymphocytes",
                "Th1 Cells",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Human Neuron (Neuron)",
            "Human Hepatocyte (Hepatocyte)",
            "Human Erythrocyte (RBC)",
            "Human Myocyte (Myocyte)",
            "Human Osteocyte (Osteocyte)",
            "Human Chondrocyte (Chondrocyte)",
            "Human Adipocyte (Adipocyte)",
            "Human Fibroblast (Fibroblast)",
            "Human Keratinocyte (Keratinocyte)",
            "Human Melanocyte (Melanocyte)",
            "Human Lymphocyte (Lymphocyte)",
            "Human Neutrophil (Neutrophil)",
            "Human Macrophage (Macrophage)",
            "Human Mast Cell (Mast Cell)",
            "Human Epithelial Cell (Epithelial Cell)",
            "Human Endothelial Cell (Endothelial Cell)",
            "Human Cardiac Myocyte (Cardiac Myocyte)",
            "Human Smooth Muscle Cell (SMC)",
            "Human Skeletal Muscle Fiber (Muscle Fiber)",
            "Human Pancreatic Beta Cell (Beta Cell)",
            "Human Renal Tubular Cell (RTC)",
            "Human Germ Cell (Germ Cell)",
            "Human Oocyte (Oocyte)",
            "Human Sperm Cell (Sperm)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Hepatocyte",
                "Erythrocyte",
                "Myocyte",
                "Osteocyte",
                "Chondrocyte",
                "Adipocyte",
                "Fibroblast",
                "Keratinocyte",
                "Melanocyte",
                "Lymphocyte",
                "Neutrophil",
                "Macrophage",
                "Mast Cell",
                "Epithelial Cell",
                "Endothelial Cell",
                "Cardiac Myocyte",
                "Germ Cell",
                "Oocyte"
            ],
            "mismatches": [
                "Smooth Muscle Cell",
                "Skeletal Muscle Fiber",
                "Pancreatic Beta Cell",
                "Renal Tubular Cell",
                "Sperm Cell"
            ],
            "true_referents": [
                "Adipocytes",
                "B-Lymphocytes",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Embryonic Germ Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Germ Cells",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Lymphocytes",
                "Macrophages",
                "Madin Darby Canine Kidney Cells",
                "Mast Cells",
                "Melanocytes",
                "Motor Neurons",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neurons",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "RAW 264.7 Cells",
                "Skeletal Muscle Fibers",
                "Skeletal Muscle Satellite Cells",
                "Slow-Twitch Muscle Fibers",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Sperm Head",
                "Spermatocytes",
                "Spermatozoa",
                "T-Lymphocytes",
                "Telocytes",
                "Th1 Cells",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron",
            "Hepatocyte",
            "Cardiomyocyte",
            "Erythrocyte",
            "Osteocyte",
            "Chondrocyte",
            "Adipocyte",
            "Fibroblast",
            "Keratinocyte",
            "Melanocyte",
            "Lymphocyte",
            "Macrophage",
            "Monocyte",
            "Epithelial cell",
            "Endothelial cell",
            "Smooth muscle cell",
            "Skeletal muscle cell",
            "Astrocyte",
            "Oligodendrocyte",
            "Schwann cell",
            "Microglia",
            "Basophil",
            "Eosinophil",
            "Neutrophil"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Hepatocyte",
                "Erythrocyte",
                "Osteocyte",
                "Chondrocyte",
                "Adipocyte",
                "Fibroblast",
                "Keratinocyte",
                "Melanocyte",
                "Lymphocyte",
                "Macrophage",
                "Monocyte",
                "Astrocyte",
                "Schwann cell",
                "Microglia",
                "Basophil",
                "Eosinophil",
                "Neutrophil"
            ],
            "mismatches": [
                "Cardiomyocyte",
                "Epithelial cell",
                "Endothelial cell",
                "Smooth muscle cell",
                "Skeletal muscle cell",
                "Oligodendrocyte"
            ],
            "true_referents": [
                "Adipocytes",
                "Astrocytes",
                "Axons",
                "B-Lymphocytes",
                "Basophils",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Interneurons",
                "Keratinocytes",
                "Lymphocytes",
                "Macrophages",
                "Mast Cells",
                "Melanocytes",
                "Melanophores",
                "Microglia",
                "Monocytes",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Neutrophils",
                "Oligodendrocyte Precursor Cells",
                "Oligodendroglia",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Schwann Cells",
                "Skeletal Muscle Fibers",
                "Skeletal Muscle Satellite Cells",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Red Blood Cell (RBC)",
            "Neuron (N)",
            "Muscle Cell (Myocyte)",
            "Epithelial Cell (EC)",
            "Adipocyte (Fat Cell)",
            "Osteocyte (Bone Cell)",
            "Hepatocyte (Liver Cell)",
            "Chondrocyte (Cartilage Cell)",
            "Cardiomyocyte (Heart Muscle Cell)",
            "Lymphocyte (Immune Cell)",
            "Spermatocyte (Sperm Cell)",
            "Oocyte (Egg Cell)",
            "Pancreatic Beta Cell (Insulin-producing Cell)",
            "Goblet Cell (Mucus-secreting Cell)",
            "Keratinocyte (Skin Cell)",
            "Endothelial Cell (Blood Vessel Lining Cell)",
            "Fibroblast (Connective Tissue Cell)",
            "Neuroglia (Glial Cell)",
            "Myofibril (Muscle Fiber Cell)",
            "Mast Cell (Immune Response Cell)",
            "Macrophage (Phagocytic Cell)",
            "B Cell (Antibody-producing Cell)",
            "T Cell (Cytotoxic Cell)",
            "Dendritic Cell (Antigen-presenting Cell)",
            "Retinal Cell (Photoreceptor Cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron (N)",
                "Muscle Cell (Myocyte)",
                "Epithelial Cell (EC)",
                "Adipocyte (Fat Cell)",
                "Osteocyte (Bone Cell)",
                "Hepatocyte (Liver Cell)",
                "Chondrocyte (Cartilage Cell)",
                "Lymphocyte (Immune Cell)",
                "Spermatocyte (Sperm Cell)",
                "Oocyte (Egg Cell)",
                "Goblet Cell (Mucus-secreting Cell)",
                "Keratinocyte (Skin Cell)",
                "Endothelial Cell (Blood Vessel Lining Cell)",
                "Fibroblast (Connective Tissue Cell)",
                "Neuroglia (Glial Cell)",
                "Mast Cell (Immune Response Cell)",
                "Macrophage (Phagocytic Cell)",
                "Dendritic Cell (Antigen-presenting Cell)"
            ],
            "mismatches": [
                "Red Blood Cell (RBC)",
                "Cardiomyocyte (Heart Muscle Cell)",
                "Pancreatic Beta Cell (Insulin-producing Cell)",
                "Myofibril (Muscle Fiber Cell)",
                "B Cell (Antibody-producing Cell)",
                "T Cell (Cytotoxic Cell)",
                "Retinal Cell (Photoreceptor Cell)"
            ],
            "true_referents": [
                "Adipocytes",
                "Antibody-Producing Cells",
                "Antigen-Presenting Cells",
                "Astrocytes",
                "B-Lymphocytes",
                "Blood Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Cytotoxic T-Lymphocytes",
                "Dendritic Cells",
                "Endothelial Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Fibroblasts",
                "Gastrin-Secreting Cells",
                "Glucagon-Secreting Cells",
                "Goblet Cells",
                "Hemangioblasts",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Lymphocytes",
                "Macrophages",
                "Mast Cells",
                "Microglia",
                "Motor Neurons",
                "Muscle Cells",
                "Myoblasts",
                "Myofibrils",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Sertoli Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "T-Lymphocytes",
                "Th1 Cells",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 18,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Human Neuron Cell (HNC)",
            "Human Red Blood Cell (HRBC)",
            "Human White Blood Cell (HWBC)",
            "Human Skin Cell (HSC)",
            "Human Muscle Cell (HMC)",
            "Human Liver Cell (Hepatocyte)",
            "Human Pancreatic Cell (HPC)",
            "Human Lung Cell (HLC)",
            "Human Kidney Cell (HKC)",
            "Human Cardiac Cell (HCC)",
            "Human Stomach Cell (HSC)",
            "Human Intestinal Cell (HIC)",
            "Human Epithelial Cell (HEC)",
            "Human Endothelial Cell (HEC)",
            "Human Sperm Cell (HSC)",
            "Human Ovum Cell (HOC)",
            "Human Bone Cell (HBC)",
            "Human Fat Cell (Adipocyte)",
            "Human Nerve Cell (Neuron)",
            "Human Hair Cell (HHC)",
            "Human Retinal Cell (HRC)",
            "Human T Cell (HTC)",
            "Human B Cell (HBC)",
            "Human Stem Cell (HSC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Erythrocytes",
                "Hepatocytes",
                "Epithelial Cells",
                "Endothelial Cells",
                "Spermatozoa",
                "Ovum",
                "Adipocytes",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Stem Cells"
            ],
            "mismatches": [
                "Human White Blood Cell (HWBC)",
                "Human Skin Cell (HSC)",
                "Human Muscle Cell (HMC)",
                "Human Pancreatic Cell (HPC)",
                "Human Lung Cell (HLC)",
                "Human Kidney Cell (HKC)",
                "Human Cardiac Cell (HCC)",
                "Human Stomach Cell (HSC)",
                "Human Intestinal Cell (HIC)",
                "Human Nerve Cell (Neuron)",
                "Human Hair Cell (HHC)",
                "Human Retinal Cell (HRC)",
                "Human Fat Cell (Adipocyte)"
            ],
            "true_referents": [
                "Adipocytes",
                "Alveolar Epithelial Cells",
                "Auditory Hair Cells",
                "B-Lymphocyte Subsets",
                "B-Lymphocytes",
                "Blood Cells",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Gastric Chief Cells",
                "Gastric Parietal Cells",
                "Gastrin-Secreting Cells",
                "HaCaT Cells",
                "Hemocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Embryonic Stem Cells",
                "Human Umbilical Vein Endothelial Cells",
                "Inner Auditory Hair Cells",
                "K562 Cells",
                "Keratinocytes",
                "Madin Darby Canine Kidney Cells",
                "Muscle Cells",
                "Myoblasts",
                "Neural Stem Cells",
                "Neurites",
                "Neuroepithelial Cells",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Pancreatic Polypeptide-Secreting Cells",
                "Pancreatic Stellate Cells",
                "Pluripotent Stem Cells",
                "RAW 264.7 Cells",
                "Retinal Horizontal Cells",
                "Retinal Rod Photoreceptor Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Spherocytes",
                "Stem Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Red blood cell (RBC)",
            "Neuron",
            "Muscle cell",
            "Skin cell",
            "Liver cell",
            "Kidney cell",
            "Heart cell",
            "Lung cell",
            "Pancreatic cell",
            "Intestinal cell",
            "Bone cell",
            "Fat cell",
            "Nerve cell",
            "Sperm cell",
            "Egg cell",
            "White blood cell (WBC)",
            "Platelet",
            "Epithelial cell",
            "Connective tissue cell",
            "Smooth muscle cell",
            "Cardiac muscle cell",
            "Skeletal muscle cell",
            "Glandular cell",
            "Endothelial cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Muscle cell",
                "Nerve cell",
                "Sperm cell",
                "Egg cell",
                "White blood cell (WBC)",
                "Platelet",
                "Epithelial cell",
                "Connective tissue cell",
                "Smooth muscle cell",
                "Cardiac muscle cell",
                "Skeletal muscle cell",
                "Endothelial cell"
            ],
            "mismatches": [
                "Red blood cell (RBC)",
                "Skin cell",
                "Liver cell",
                "Kidney cell",
                "Heart cell",
                "Lung cell",
                "Pancreatic cell",
                "Intestinal cell",
                "Bone cell",
                "Fat cell",
                "Glandular cell"
            ],
            "true_referents": [
                "Adipocytes",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "Axons",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Connective Tissue Cells",
                "Endocrine Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Foam Cells",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Madin Darby Canine Kidney Cells",
                "Mesangial Cells",
                "Muscle Cells",
                "Myoblasts",
                "Nerve Fibers",
                "Neurites",
                "Neuroendocrine Cells",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Skeletal Muscle Fibers",
                "Skeletal Muscle Satellite Cells",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Sperm Head",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "White Adipocytes"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Erythrocyte (Red blood cell)",
            "Leukocyte (White blood cell)",
            "Neuron",
            "Hepatocyte",
            "Myocyte (Muscle cell)",
            "Adipocyte",
            "Osteocyte",
            "Chondrocyte",
            "Epithelial cell",
            "Fibroblast",
            "Keratinocyte",
            "Pancreatic beta cell",
            "Endothelial cell",
            "Microglia",
            "Astrocyte",
            "Melanocyte",
            "Macrophage",
            "Stem cell",
            "Platelet",
            "Schwann cell",
            "Basophil",
            "Eosinophil",
            "Neutrophil",
            "T-lymphocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythrocyte (Red blood cell)",
                "Leukocyte (White blood cell)",
                "Neuron",
                "Hepatocyte",
                "Adipocyte",
                "Osteocyte",
                "Chondrocyte",
                "Epithelial cell",
                "Fibroblast",
                "Keratinocyte",
                "Endothelial cell",
                "Microglia",
                "Astrocyte",
                "Melanocyte",
                "Macrophage",
                "Stem cell",
                "Schwann cell",
                "Basophil",
                "Eosinophil",
                "Neutrophil",
                "T-lymphocyte"
            ],
            "mismatches": [
                "Myocyte (Muscle cell)",
                "Pancreatic beta cell",
                "Platelet"
            ],
            "true_referents": [
                "Adipocytes",
                "Adult Stem Cells",
                "Astrocytes",
                "Axons",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Brown Adipocytes",
                "Chondrocytes",
                "Cytotoxic T-Lymphocytes",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Mast Cells",
                "Melanocytes",
                "Melanophores",
                "Microglia",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Neutrophils",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Schwann Cells",
                "Skeletal Muscle Satellite Cells",
                "Stem Cells",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron (nerve cell)",
            "Hepatocyte (liver cell)",
            "Cardiomyocyte (heart muscle cell)",
            "Osteocyte (bone cell)",
            "Erythrocyte (red blood cell)",
            "Leukocyte (white blood cell)",
            "Adipocyte (fat cell)",
            "Myocyte (skeletal muscle cell)",
            "Chondrocyte (cartilage cell)",
            "Fibroblast (connective tissue cell)",
            "Keratinocyte (skin cell)",
            "Enterocyte (intestinal epithelial cell)",
            "Pneumocyte (lung cell)",
            "Podocyte (kidney glomerular cell)",
            "Melanocyte (pigment-producing cell)",
            "Oocyte (egg cell)",
            "Spermatozoon (sperm cell)",
            "Lymphocyte (immune system cell)",
            "Macrophage (immune system cell)",
            "Astrocyte (glial cell)",
            "Beta cell (pancreatic cell)",
            "Endothelial cell (blood vessel lining cell)",
            "Schwann cell (peripheral nervous system cell)",
            "Goblet cell (mucus-secreting cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neurons",
                "Hepatocytes",
                "Osteocytes",
                "Erythrocytes",
                "Leukocytes",
                "Adipocytes",
                "Chondrocytes",
                "Fibroblasts",
                "Keratinocytes",
                "Enterocytes",
                "Podocytes",
                "Melanocytes",
                "Oocytes",
                "Lymphocytes",
                "Macrophages",
                "Astrocytes",
                "Endothelial Cells",
                "Schwann Cells",
                "Goblet Cells"
            ],
            "mismatches": [
                "Cardiomyocyte (heart muscle cell)",
                "Myocyte (skeletal muscle cell)",
                "Pneumocyte (lung cell)",
                "Spermatozoon (sperm cell)",
                "Beta cell (pancreatic cell)"
            ],
            "true_referents": [
                "Acrosome",
                "Adipocytes",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "Astrocytes",
                "B-Lymphocytes",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Endothelial Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Gastrin-Secreting Cells",
                "Glucagon-Secreting Cells",
                "Goblet Cells",
                "Granulocytes",
                "Hemangioblasts",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Melanocytes",
                "Mesangial Cells",
                "Microglia",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Neurites",
                "Neuroglia",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Podocytes",
                "Podosomes",
                "Schwann Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Skin cell (keratinocyte)",
            "Muscle cell (myocyte)",
            "Bone cell (osteocyte)",
            "Nerve cell (neuron)",
            "Brain cell (neuron)",
            "Blood cell (erythrocyte)",
            "Immune system cell (lymphocyte)",
            "Fat cell (adipocyte)",
            "Cartilage cell (chondrocyte)",
            "Liver cell (hepatocyte)",
            "Pancreas cell (pancreatic acinar cell)",
            "Kidney cell (nephron cell)",
            "Intestinal cell (enterocyte)",
            "Lung cell (pneumocyte)",
            "Heart muscle cell (cardiomyocyte)",
            "Smooth muscle cell (leiomyocyte)",
            "Skeletal muscle cell (myocyte)",
            "Gland cell (secretory cell)",
            "Hair follicle cell (trichocyte)",
            "Nail cell (onychocyte)",
            "Sweat gland cell (sudoriferous cell)",
            "Thyroid gland cell (thyrocyte)",
            "Adrenal gland cell (adrenocortical cell)",
            "Pituitary gland cell (adenohypophyseal cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocytes",
                "Muscle Cells",
                "Osteocytes",
                "Neurons",
                "Blood Cells",
                "Lymphocytes",
                "Adipocytes",
                "Chondrocytes",
                "Hepatocytes",
                "Enterocytes"
            ],
            "mismatches": [
                "Pancreas cell (pancreatic acinar cell)",
                "Kidney cell (nephron cell)",
                "Lung cell (pneumocyte)",
                "Heart muscle cell (cardiomyocyte)",
                "Smooth muscle cell (leiomyocyte)",
                "Skeletal muscle cell (myocyte)",
                "Gland cell (secretory cell)",
                "Hair follicle cell (trichocyte)",
                "Nail cell (onychocyte)",
                "Sweat gland cell (sudoriferous cell)",
                "Thyroid gland cell (thyrocyte)",
                "Adrenal gland cell (adrenocortical cell)",
                "Pituitary gland cell (adenohypophyseal cell)"
            ],
            "true_referents": [
                "Adipocytes",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "Astrocytes",
                "B-Lymphocytes",
                "Blood Cells",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Chromaffin Cells",
                "Connective Tissue Cells",
                "Corticotrophs",
                "Endocrine Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Lymphocytes",
                "Mesangial Cells",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neurites",
                "Neuroendocrine Cells",
                "Neurons",
                "Osteoblasts",
                "Osteocytes",
                "Skeletal Muscle Satellite Cells",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Somatostatin-Secreting Cells",
                "Stromal Cells",
                "T-Lymphocytes",
                "Thyroid Epithelial Cells",
                "Thyrotrophs",
                "White Adipocytes"
            ],
            "TP": 10,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "red blood cell (erythrocyte)",
            "white blood cell (leukocyte)",
            "platelet (thrombocyte)",
            "muscle cell (myocyte)",
            "nerve cell (neuron)",
            "bone cell (osteocyte)",
            "fat cell (adipocyte)",
            "liver cell (hepatocyte)",
            "skin cell (keratinocyte)",
            "kidney cell (nephrocyte)",
            "pancreatic cell (islet cell)",
            "lung cell (pneumocyte)",
            "intestinal cell (enterocyte)",
            "ovarian cell (oocyte)",
            "sperm cell (spermatocyte)",
            "stem cell",
            "fibroblast",
            "endothelial cell",
            "epithelial cell",
            "lymphocyte",
            "macrophage",
            "monocyte",
            "neutrophil",
            "eosinophil"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythrocytes",
                "Leukocytes",
                "Blood Platelets",
                "Muscle Cells",
                "Neurons",
                "Osteocytes",
                "Adipocytes",
                "Hepatocytes",
                "Keratinocytes",
                "Enterocytes",
                "Oocytes",
                "Spermatocytes",
                "Stem Cells",
                "Fibroblasts",
                "Endothelial Cells",
                "Epithelial Cells",
                "Lymphocytes",
                "Macrophages",
                "Monocytes",
                "Neutrophils",
                "Eosinophils"
            ],
            "mismatches": [
                "kidney cell (nephrocyte)",
                "pancreatic cell (islet cell)",
                "lung cell (pneumocyte)"
            ],
            "true_referents": [
                "Adipocytes",
                "Adult Stem Cells",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "B-Lymphocytes",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Granulosa Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Mesangial Cells",
                "Monocytes",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neurites",
                "Neurons",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Sertoli Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stem Cells",
                "T-Lymphocytes",
                "White Adipocytes"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Skin Cell (SC)",
            "Muscle Cell (MC)",
            "Nerve Cell (NC)",
            "Red Blood Cell (RBC)",
            "White Blood Cell (WBC)",
            "Bone Cell (BC)",
            "Liver Cell (LC)",
            "Kidney Cell (KC)",
            "Lung Cell (LuC)",
            "Heart Cell (HC)",
            "Brain Cell (BrC)",
            "Pancreas Cell (PC)",
            "Intestinal Cell (IC)",
            "Stomach Cell (SC2)",
            "Thyroid Cell (TC)",
            "Adrenal Cell (AC)",
            "Ovarian Cell (OC)",
            "Testicular Cell (TsC)",
            "Retinal Cell (RC)",
            "Cartilage Cell (CaC)",
            "Tendon Cell (TC2)",
            "Ligament Cell (LC2)",
            "Adipose Cell (AC2)",
            "Connective Tissue Cell (CTC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Muscle Cell (MC)",
                "Red Blood Cell (RBC)",
                "White Blood Cell (WBC)",
                "Connective Tissue Cell (CTC)"
            ],
            "mismatches": [
                "Skin Cell (SC)",
                "Nerve Cell (NC)",
                "Bone Cell (BC)",
                "Liver Cell (LC)",
                "Kidney Cell (KC)",
                "Lung Cell (LuC)",
                "Heart Cell (HC)",
                "Brain Cell (BrC)",
                "Pancreas Cell (PC)",
                "Intestinal Cell (IC)",
                "Stomach Cell (SC2)",
                "Thyroid Cell (TC)",
                "Adrenal Cell (AC)",
                "Ovarian Cell (OC)",
                "Testicular Cell (TsC)",
                "Retinal Cell (RC)",
                "Cartilage Cell (CaC)",
                "Tendon Cell (TC2)",
                "Ligament Cell (LC2)",
                "Adipose Cell (AC2)"
            ],
            "true_referents": [
                "Adipocytes",
                "Alveolar Epithelial Cells",
                "Astrocytes",
                "Blood Cells",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Chromaffin Cells",
                "Connective Tissue Cells",
                "Corneal Keratocytes",
                "Endocrine Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Gastric Chief Cells",
                "Gastric Parietal Cells",
                "Gastrin-Secreting Cells",
                "Granulocytes",
                "Granulosa Cells",
                "Hemocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "K562 Cells",
                "Keratinocytes",
                "Leukocytes",
                "Leydig Cells",
                "Madin Darby Canine Kidney Cells",
                "Muscle Cells",
                "Myoblasts",
                "Neuroendocrine Cells",
                "Neuroepithelial Cells",
                "Neuroglia",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Pancreatic Polypeptide-Secreting Cells",
                "RAW 264.7 Cells",
                "Retinal Neurons",
                "Retinal Rod Photoreceptor Cells",
                "Sertoli Cells",
                "Skeletal Muscle Satellite Cells",
                "Stromal Cells",
                "Tenocytes",
                "Thyroid Epithelial Cells",
                "Thyrotrophs",
                "White Adipocytes"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Eukaryotic cell (Eukaryote)",
            "Animal cell (Animal cell)",
            "Plant cell (Plant cell)",
            "Human cell (Human cell)",
            "Mammalian cell (Mammalian cell)",
            "Fungal cell (Fungal cell)",
            "Bacterial cell (Bacterial cell)",
            "Prokaryotic cell (Prokaryote)",
            "Neuron (Neuron)",
            "Muscle cell (Muscle cell)",
            "Red blood cell (Red blood cell)",
            "White blood cell (White blood cell)",
            "Platelet (Platelet)",
            "Hepatocyte (Hepatocyte)",
            "Kidney cell (Kidney cell)",
            "Epithelial cell (Epithelial cell)",
            "Connective tissue cell (Connective tissue cell)",
            "Endothelial cell (Endothelial cell)",
            "Stem cell (Stem cell)",
            "Immune cell (Immune cell)",
            "Cancer cell (Cancer cell)",
            "Tumor cell (Tumor cell)",
            "Leukocyte (Leukocyte)",
            "Macrophage (Macrophage)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic cell (Eukaryote)",
                "Neuron (Neuron)",
                "Muscle cell (Muscle cell)",
                "Hepatocyte (Hepatocyte)",
                "Epithelial cell (Epithelial cell)",
                "Connective tissue cell (Connective tissue cell)",
                "Endothelial cell (Endothelial cell)",
                "Stem cell (Stem cell)",
                "Leukocyte (Leukocyte)",
                "Macrophage (Macrophage)"
            ],
            "mismatches": [
                "Animal cell (Animal cell)",
                "Plant cell (Plant cell)",
                "Human cell (Human cell)",
                "Mammalian cell (Mammalian cell)",
                "Fungal cell (Fungal cell)",
                "Bacterial cell (Bacterial cell)",
                "Prokaryotic cell (Prokaryote)",
                "Red blood cell (Red blood cell)",
                "White blood cell (White blood cell)",
                "Platelet (Platelet)",
                "Kidney cell (Kidney cell)",
                "Immune cell (Immune cell)",
                "Cancer cell (Cancer cell)",
                "Tumor cell (Tumor cell)"
            ],
            "true_referents": [
                "Adult Stem Cells",
                "Antibody-Producing Cells",
                "Blood Cells",
                "Blood Platelets",
                "Connective Tissue Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Giant Cells",
                "Granulocytes",
                "Hemocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Mesangial Cells",
                "Muscle Cells",
                "Myoblasts",
                "Natural Killer Cells",
                "Neoplastic Stem Cells",
                "Neurons",
                "Phagocytes",
                "Pyramidal Cells",
                "RAW 264.7 Cells",
                "Skeletal Muscle Satellite Cells",
                "Stem Cells",
                "Stromal Cells"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron (NER)",
            "Muscle cell (MC)",
            "Epithelial cell (EC)",
            "Stem cell (SC)",
            "Red blood cell (RBC)",
            "White blood cell (WBC)",
            "Platelet (PLT)",
            "Adipocyte (AD)",
            "Chondrocyte (CHD)",
            "Osteocyte (OCY)",
            "Fibroblast (FB)",
            "Osteoblast (OB)",
            "Chondroblast (CHB)",
            "Adrenal cell (AC)",
            "Pancreatic cell (PC)",
            "Hepatocyte (Hep)",
            "Neuroglial cell (NGC)",
            "Mesenchymal stem cell (MSC)",
            "Hematopoietic stem cell (HSC)",
            "Endothelial cell (EC)",
            "Keratinocyte (KC)",
            "Lymphocyte (LC)",
            "Macrophage (MP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron (NER)",
                "Muscle cell (MC)",
                "Epithelial cell (EC)",
                "Stem cell (SC)",
                "Adipocyte (AD)",
                "Chondrocyte (CHD)",
                "Osteocyte (OCY)",
                "Fibroblast (FB)",
                "Osteoblast (OB)",
                "Hepatocyte (Hep)",
                "Neuroglial cell (NGC)",
                "Mesenchymal stem cell (MSC)",
                "Hematopoietic stem cell (HSC)",
                "Endothelial cell (EC)",
                "Keratinocyte (KC)",
                "Lymphocyte (LC)",
                "Macrophage (MP)"
            ],
            "mismatches": [
                "Red blood cell (RBC)",
                "White blood cell (WBC)",
                "Platelet (PLT)",
                "Chondroblast (CHB)",
                "Adrenal cell (AC)",
                "Pancreatic cell (PC)"
            ],
            "true_referents": [
                "Acanthocytes",
                "Adipocytes",
                "Adult Stem Cells",
                "Astrocytes",
                "B-Lymphocytes",
                "Beige Adipocytes",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Chondrocytes",
                "Chromaffin Cells",
                "Embryonic Stem Cells",
                "Endocrine Cells",
                "Endothelial Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Fibroblasts",
                "Granulocytes",
                "Hemangioblasts",
                "Hematopoietic Stem Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Mesenchymal Stem Cells",
                "Microglia",
                "Motor Neurons",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroendocrine Cells",
                "Neuroglia",
                "Neurons",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Pancreatic Polypeptide-Secreting Cells",
                "Skeletal Muscle Satellite Cells",
                "Stem Cells",
                "T-Lymphocytes",
                "White Adipocytes"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Cell",
                "Canonical Name": "Cell"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cell"
            ],
            "true_referents": [
                "Eukaryotic Cells",
                "Place Cells",
                "RAW 264.7 Cells"
            ],
            "TP": 0,
            "FP": 1,
            "FN": 0
        }
    }
]