[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Red blood cell (RBC)",
            "White blood cell (WBC)",
            "Neuron",
            "Muscle cell (Myocyte)",
            "Fat cell (Adipocyte)",
            "Liver cell (Hepatocyte)",
            "Kidney cell (Renal tubular cell)",
            "Heart muscle cell (Cardiomyocyte)",
            "Skin cell (Keratinocyte)",
            "Bone cell (Osteocyte)",
            "Cartilage cell (Chondrocyte)",
            "Pancreatic cell (Pancreatic beta cell)",
            "Epithelial cell",
            "Sperm cell (Spermatocyte)",
            "Oocyte (Egg cell)",
            "Endothelial cell",
            "Stem cell",
            "Connective tissue cell",
            "Blood platelet",
            "T lymphocyte (T cell)",
            "B lymphocyte (B cell)",
            "Macrophage",
            "Dendritic cell",
            "Natural killer cell (NK cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythrocytes",
                "Leukocytes",
                "Neurons",
                "Muscle Cells",
                "Adipocytes",
                "Hepatocytes",
                "Cardiac Myocytes",
                "Keratinocytes",
                "Osteocytes",
                "Chondrocytes",
                "Epithelial Cells",
                "Spermatocytes",
                "Oocytes",
                "Endothelial Cells",
                "Stem Cells",
                "Connective Tissue Cells",
                "Blood Platelets",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Macrophages",
                "Dendritic Cells",
                "Natural Killer Cells"
            ],
            "mismatches": [
                "Kidney cell (Renal tubular cell)",
                "Pancreatic cell (Pancreatic beta cell)"
            ],
            "true_referents": [
                "Adipocytes",
                "Adult Stem Cells",
                "Antigen-Presenting Cells",
                "Axons",
                "B-Lymphocytes",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Cytotoxic T-Lymphocytes",
                "Dendritic Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hemocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "Macrophages",
                "Mesangial Cells",
                "Muscle Cells",
                "Myoblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Sertoli Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stem Cells",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Adipocyte (fat cell)",
            "Neuron (nerve cell)",
            "Osteocyte (bone cell)",
            "Chondrocyte (cartilage cell)",
            "Fibroblast (connective tissue cell)",
            "Hepatocyte (liver cell)",
            "Keratinocyte (skin cell)",
            "Erythrocyte (red blood cell)",
            "Leukocyte (white blood cell)",
            "Lymphocyte (immune cell)",
            "Monocyte (immune cell)",
            "Neutrophil (immune cell)",
            "Eosinophil (immune cell)",
            "Basophil (immune cell)",
            "Platelet (thrombocyte)",
            "Muscle cell (myocyte)",
            "Cardiomyocyte (heart muscle cell)",
            "Skeletal myocyte (muscle cell)",
            "Smooth muscle cell",
            "Endothelial cell (vascular cell)",
            "Epithelial cell",
            "Goblet cell (mucous cell)",
            "Sertoli cell (testicular cell)",
            "Oocyte (egg cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocytes",
                "Neurons",
                "Osteocytes",
                "Chondrocytes",
                "Fibroblasts",
                "Hepatocytes",
                "Keratinocytes",
                "Erythrocytes",
                "Leukocytes",
                "Lymphocytes",
                "Monocytes",
                "Neutrophils",
                "Eosinophils",
                "Basophils",
                "Blood Platelets",
                "Muscle Cells",
                "Endothelial Cells",
                "Epithelial Cells",
                "Goblet Cells",
                "Sertoli Cells",
                "Oocytes"
            ],
            "mismatches": [
                "Cardiomyocyte (heart muscle cell)",
                "Skeletal myocyte (muscle cell)",
                "Smooth muscle cell"
            ],
            "true_referents": [
                "Adipocytes",
                "B-Lymphocytes",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Enterocytes",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Goblet Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Mast Cells",
                "Monocytes",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neurites",
                "Neurons",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Phagocytes",
                "Sertoli Cells",
                "Skeletal Muscle Satellite Cells",
                "Skeletal Myoblasts",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Spermatocytes",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Erythrocyte (Red Blood Cell)",
            "Leukocyte (White Blood Cell)",
            "Thrombocyte (Platelet)",
            "Hepatocyte (Liver Cell)",
            "Nephron (Kidney Cell)",
            "Myocyte (Muscle Cell)",
            "Neuron",
            "Glial Cell",
            "Osteocyte (Bone Cell)",
            "Chondrocyte (Cartilage Cell)",
            "Adipocyte (Fat Cell)",
            "Fibroblast",
            "Endothelial Cell",
            "Epithelial Cell",
            "Keratocyte (Corneal Cell)",
            "Melanocyte",
            "Langerhans Cell",
            "Dendritic Cell",
            "Mast Cell",
            "Basophil",
            "Eosinophil",
            "Neutrophil",
            "B Lymphocyte",
            "T Lymphocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Chondrocyte (Cartilage Cell)",
                "Adipocyte (Fat Cell)",
                "Fibroblast",
                "Endothelial Cell",
                "Epithelial Cell",
                "Melanocyte",
                "Langerhans Cell",
                "Dendritic Cell",
                "Mast Cell",
                "Basophil",
                "Eosinophil",
                "Neutrophil"
            ],
            "mismatches": [
                "Erythrocyte (Red Blood Cell)",
                "Leukocyte (White Blood Cell)",
                "Thrombocyte (Platelet)",
                "Hepatocyte (Liver Cell)",
                "Nephron (Kidney Cell)",
                "Myocyte (Muscle Cell)",
                "Glial Cell",
                "Osteocyte (Bone Cell)",
                "Keratocyte (Corneal Cell)",
                "B Lymphocyte",
                "T Lymphocyte"
            ],
            "true_referents": [
                "Adipocytes",
                "Antigen-Presenting Cells",
                "Astrocytes",
                "Axons",
                "B-Lymphocyte Subsets",
                "B-Lymphocytes",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Brown Adipocytes",
                "CD4-Positive T-Lymphocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Corneal Keratocytes",
                "Dendritic Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Interneurons",
                "Keratinocytes",
                "Langerhans Cells",
                "Leukocytes",
                "Lymphocytes",
                "Mast Cells",
                "Melanocytes",
                "Melanophores",
                "Mesangial Cells",
                "Microglia",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Neutrophils",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Skeletal Muscle Satellite Cells",
                "Stromal Cells",
                "T-Lymphocytes",
                "Th1 Cells",
                "White Adipocytes"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Erythrocyte (RBC)",
            "Neutrophil (Neu)",
            "Hepatocyte (Hep)",
            "Neuron (N)",
            "Myocyte (Myo)",
            "Osteoblast (OB)",
            "Fibroblast (Fib)",
            "Adipocyte (Ad)",
            "Melanocyte (Mel)",
            "Keratinocyte (Ker)",
            "B Lymphocyte (B cell)",
            "T Lymphocyte (T cell)",
            "Natural Killer Cell (NK cell)",
            "Monocyte (Mon)",
            "Eosinophil (Eos)",
            "Basophil (Bas)",
            "Pancreatic Beta Cell (\u03b2-cell)",
            "Renal Tubular Epithelial Cell (RTEC)",
            "Pulmonary Alveolar Type II Cell (AT2)",
            "Enterocyte (Ent)",
            "Skeletal Muscle Fiber (SMF)",
            "Cardiac Myocyte (CM)",
            "Schwann Cell (SC)",
            "Oocyte (Ooc)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythrocyte (RBC)",
                "Neutrophil (Neu)",
                "Hepatocyte (Hep)",
                "Neuron (N)",
                "Fibroblast (Fib)",
                "Adipocyte (Ad)",
                "Melanocyte (Mel)",
                "Keratinocyte (Ker)",
                "B Lymphocyte (B cell)",
                "T Lymphocyte (T cell)",
                "Natural Killer Cell (NK cell)",
                "Monocyte (Mon)",
                "Eosinophil (Eos)",
                "Basophil (Bas)",
                "Enterocyte (Ent)",
                "Skeletal Muscle Fiber (SMF)",
                "Cardiac Myocyte (CM)",
                "Schwann Cell (SC)",
                "Oocyte (Ooc)"
            ],
            "mismatches": [
                "Myocyte (Myo)",
                "Pancreatic Beta Cell (\u03b2-cell)",
                "Renal Tubular Epithelial Cell (RTEC)",
                "Pulmonary Alveolar Type II Cell (AT2)"
            ],
            "true_referents": [
                "Adipocytes",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "B-Lymphocytes",
                "Basophils",
                "Beige Adipocytes",
                "Bone Marrow Cells",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Cytotoxic T-Lymphocytes",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "Madin Darby Canine Kidney Cells",
                "Mast Cells",
                "Melanocytes",
                "Melanosomes",
                "Mesangial Cells",
                "Monocytes",
                "Motor Neurons",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neuroglia",
                "Neurons",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Schwann Cells",
                "Skeletal Muscle Fibers",
                "Skeletal Muscle Satellite Cells",
                "Slow-Twitch Muscle Fibers",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 19,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron (N)",
            "Erythrocyte (RBC)",
            "Hepatocyte (HC)",
            "Cardiomyocyte (CMC)",
            "Osteoblast (OB)",
            "Chondrocyte (CC)",
            "Adipocyte (AC)",
            "Lymphocyte (LC)",
            "Macrophage (M\u03a6)",
            "Keratinocyte (KC)",
            "Fibroblast (FB)",
            "Endothelial Cell (EC)",
            "Pancreatic Beta Cell (\u03b2-cell)",
            "Spermatocyte (SC)",
            "Oocyte (OC)",
            "Melanocyte (MC)",
            "Astrocyte (AstC)",
            "Microglia (MG)",
            "Schwann Cell (SC)",
            "Thrombocyte (Platelet)",
            "Monocyte (MC)",
            "Basophil (BC)",
            "Eosinophil (Eo)",
            "Neutrophil (Neu)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neurons",
                "Erythrocytes",
                "Hepatocytes",
                "Cardiac Myocytes",
                "Osteoblasts",
                "Chondrocytes",
                "Adipocytes",
                "Lymphocytes",
                "Macrophages",
                "Keratinocytes",
                "Fibroblasts",
                "Endothelial Cells",
                "Spermatocytes",
                "Oocytes",
                "Melanocytes",
                "Astrocytes",
                "Microglia",
                "Schwann Cells",
                "Monocytes",
                "Basophils",
                "Eosinophils",
                "Neutrophils"
            ],
            "mismatches": [
                "Pancreatic Beta Cell (\u03b2-cell)",
                "Thrombocyte (Platelet)"
            ],
            "true_referents": [
                "Adipocytes",
                "Astrocytes",
                "B-Lymphocytes",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Endothelial Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Lymphocytes",
                "Macrophages",
                "Mast Cells",
                "Melanocytes",
                "Melanophores",
                "Microglia",
                "Monocytes",
                "Motor Neurons",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Neutrophils",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Schwann Cells",
                "Sertoli Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Erythrocyte (RBC)",
            "Leukocyte (WBC)",
            "Neutrophil (NEUT)",
            "Lymphocyte (LYMPH)",
            "Monocyte (MONO)",
            "Platelet (PLT)",
            "Epithelial cell (EPIT)",
            "Muscle cell (MYOCYTE)",
            "Adipocyte (ADIPO)",
            "Neuron (NEURON)",
            "Osteocyte (OSTEOCYTE)",
            "Chondrocyte (CHONDROCYTE)",
            "Hepatocyte (HEPATO)",
            "Fibroblast (FIBRO)",
            "Endothelial cell (ENDO)",
            "Stem cell (SC)",
            "Keratinocyte (KERATIN)",
            "Goblet cell (GOBLET)",
            "Pancreatic beta cell (BETA)",
            "Cardiac myocyte (CARDIAC)",
            "Skeletal muscle fiber (SKELETAL)",
            "Immature B cell (BIMMATURE)",
            "T cell (TCELL)",
            "Natural killer cell (NK CELL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythrocyte (RBC)",
                "Leukocyte (WBC)",
                "Neutrophil (NEUT)",
                "Lymphocyte (LYMPH)",
                "Monocyte (MONO)",
                "Epithelial cell (EPIT)",
                "Muscle cell (MYOCYTE)",
                "Adipocyte (ADIPO)",
                "Neuron (NEURON)",
                "Osteocyte (OSTEOCYTE)",
                "Chondrocyte (CHONDROCYTE)",
                "Hepatocyte (HEPATO)",
                "Fibroblast (FIBRO)",
                "Endothelial cell (ENDO)",
                "Stem cell (SC)",
                "Keratinocyte (KERATIN)",
                "Goblet cell (GOBLET)",
                "Cardiac myocyte (CARDIAC)",
                "Skeletal muscle fiber (SKELETAL)",
                "Natural killer cell (NK CELL)"
            ],
            "mismatches": [
                "Platelet (PLT)",
                "Pancreatic beta cell (BETA)",
                "Immature B cell (BIMMATURE)",
                "T cell (TCELL)"
            ],
            "true_referents": [
                "Adipocytes",
                "Adult Stem Cells",
                "B-Lymphoid Precursor Cells",
                "Beige Adipocytes",
                "Blood Cells",
                "Blood Platelets",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Goblet Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "Monocytes",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neurons",
                "Neutrophils",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Pyramidal Cells",
                "Skeletal Muscle Fibers",
                "Skeletal Muscle Satellite Cells",
                "Stem Cells",
                "T-Lymphocytes",
                "T-Lymphoid Precursor Cells",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Skin Cell (Keratinocyte)",
            "Neuron (Nerve Cell)",
            "Red Blood Cell (Erythrocyte)",
            "White Blood Cell (Leukocyte)",
            "Platelet (Thrombocyte)",
            "Sperm Cell (Spermatozoon)",
            "Egg Cell (Oocyte)",
            "Muscle Cell (Myocyte)",
            "Fat Cell (Adipocyte)",
            "Bone Cell (Osteocyte)",
            "Cartilage Cell (Chondrocyte)",
            "Liver Cell (Hepatocyte)",
            "Pancreatic Cell (Pancreatic Islet Cells)",
            "Stem Cell (Hematopoietic Stem Cell)",
            "Intestinal Cell (Enterocyte)",
            "Retinal Cell (Photoreceptor Cell)",
            "Kidney Cell (Nephron Cell)",
            "Macrophage (Immune Cell)",
            "T Cell (Lymphocyte)",
            "B Cell (Lymphocyte)",
            "Endothelial Cell (Vascular Endothelium)",
            "Epithelial Cell (Epithelium)",
            "Cancer Cell (Carcinoma Cell)",
            "Cardiac Cell (Cardiomyocyte)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocytes",
                "Neurons",
                "Erythrocytes",
                "Leukocytes",
                "Macrophages",
                "Oocytes",
                "Muscle Cells",
                "Adipocytes",
                "Osteocytes",
                "Chondrocytes",
                "Hepatocytes",
                "Hematopoietic Stem Cells",
                "Enterocytes",
                "Photoreceptor Cells",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Endothelial Cells",
                "Epithelial Cells"
            ],
            "mismatches": [
                "Platelet (Thrombocyte)",
                "Sperm Cell (Spermatozoon)",
                "Pancreatic Cell (Pancreatic Islet Cells)",
                "Kidney Cell (Nephron Cell)",
                "Cancer Cell (Carcinoma Cell)",
                "Cardiac Cell (Cardiomyocyte)"
            ],
            "true_referents": [
                "Acrosome",
                "Adipocytes",
                "B-Lymphocytes",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Brown Adipocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Endothelial Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hematopoietic Stem Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Mesangial Cells",
                "Muscle Cells",
                "Myoblasts",
                "Neoplastic Stem Cells",
                "Neurites",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteocytes",
                "Ovum",
                "Pericytes",
                "Photoreceptor Cells",
                "RAW 264.7 Cells",
                "Retinal Cone Photoreceptor Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stem Cells",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Red blood cell (RBC)",
            "Neuron",
            "Muscle cell",
            "Skin cell",
            "Fat cell",
            "Bone cell",
            "Liver cell",
            "Heart cell",
            "Lung cell",
            "Kidney cell",
            "Pancreatic cell",
            "Intestinal cell",
            "Sperm cell",
            "Egg cell",
            "White blood cell (WBC)",
            "Platelet",
            "Stem cell",
            "Cancer cell",
            "Immune cell",
            "Nerve cell",
            "Epithelial cell",
            "Endothelial cell",
            "Osteocyte",
            "Hepatocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuron",
                "Muscle cell",
                "Fat cell",
                "Osteocyte",
                "Hepatocyte",
                "Stem cell",
                "White blood cell (WBC)",
                "Platelet",
                "Epithelial cell",
                "Endothelial cell"
            ],
            "mismatches": [
                "Red blood cell (RBC)",
                "Skin cell",
                "Bone cell",
                "Liver cell",
                "Heart cell",
                "Lung cell",
                "Kidney cell",
                "Pancreatic cell",
                "Intestinal cell",
                "Sperm cell",
                "Egg cell",
                "Cancer cell",
                "Immune cell",
                "Nerve cell"
            ],
            "true_referents": [
                "Adipocytes",
                "Adult Stem Cells",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "Axons",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Cancer-Associated Fibroblasts",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Dendritic Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Foam Cells",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Madin Darby Canine Kidney Cells",
                "Mesangial Cells",
                "Muscle Cells",
                "Myoblasts",
                "Neoplastic Stem Cells",
                "Nerve Fibers",
                "Neurites",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Phagocytes",
                "Skeletal Muscle Satellite Cells",
                "Sperm Head",
                "Spermatocytes",
                "Spermatozoa",
                "Stem Cells",
                "White Adipocytes"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron (N)",
            "Erythrocyte (RBC)",
            "T Lymphocyte (T cell)",
            "B Lymphocyte (B cell)",
            "Hepatocyte",
            "Osteoblast",
            "Myocyte",
            "Adipocyte",
            "Keratinocyte",
            "Melanocyte",
            "Platelet",
            "Fibroblast",
            "Astrocyte",
            "Microglia",
            "Endothelial Cell",
            "Chondrocyte",
            "Pancreatic \u03b2 Cell",
            "Sertoli Cell",
            "Germ Cell",
            "Stem Cell",
            "Macrophage",
            "Dendritic Cell",
            "Epithelial Cell",
            "Schwann Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neurons",
                "Erythrocytes",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Hepatocytes",
                "Osteoblasts",
                "Adipocytes",
                "Keratinocytes",
                "Melanocytes",
                "Blood Platelets",
                "Fibroblasts",
                "Astrocytes",
                "Microglia",
                "Endothelial Cells",
                "Chondrocytes",
                "Sertoli Cells",
                "Germ Cells",
                "Stem Cells",
                "Macrophages",
                "Dendritic Cells",
                "Epithelial Cells",
                "Schwann Cells"
            ],
            "mismatches": [
                "Myocyte",
                "Pancreatic \u03b2 Cell"
            ],
            "true_referents": [
                "Adipocytes",
                "Adult Stem Cells",
                "Antigen-Presenting Cells",
                "Astrocytes",
                "B-Lymphocytes",
                "Blood Cells",
                "Blood Platelets",
                "Brown Adipocytes",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Cytotoxic T-Lymphocytes",
                "Dendritic Cells",
                "Embryonic Germ Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Germ Cells",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Melanocytes",
                "Melanophores",
                "Microglia",
                "Motor Neurons",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Schwann Cells",
                "Sertoli Cells",
                "Spermatocytes",
                "Stem Cells",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron (nerve cell)",
            "Erythrocyte (red blood cell)",
            "Leukocyte (white blood cell)",
            "Hepatocyte (liver cell)",
            "Cardiomyocyte (heart muscle cell)",
            "Osteocyte (bone cell)",
            "Adipocyte (fat cell)",
            "Chondrocyte (cartilage cell)",
            "Keratinocyte (skin cell)",
            "Fibroblast (connective tissue cell)",
            "Myocyte (skeletal muscle cell)",
            "Epithelial cell",
            "Endothelial cell",
            "Pancreatic beta cell",
            "Astrocyte (glial cell)",
            "Oocyte (egg cell)",
            "Spermatozoon (sperm cell)",
            "Macrophage",
            "T lymphocyte",
            "B lymphocyte",
            "Natural killer cell (NK cell)",
            "Melanocyte (pigment-producing cell)",
            "Schwann cell",
            "Podocyte (kidney glomerular cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neurons",
                "Erythrocytes",
                "Leukocytes",
                "Hepatocytes",
                "Osteocytes",
                "Adipocytes",
                "Chondrocytes",
                "Keratinocytes",
                "Fibroblasts",
                "Epithelial Cells",
                "Endothelial Cells",
                "Astrocytes",
                "Oocytes",
                "Spermatozoa",
                "Macrophages",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Natural Killer Cells",
                "Melanocytes",
                "Schwann Cells",
                "Podocytes"
            ],
            "mismatches": [
                "Cardiomyocyte (heart muscle cell)",
                "Myocyte (skeletal muscle cell)",
                "Pancreatic beta cell",
                "Natural killer cell (NK cell)"
            ],
            "true_referents": [
                "Acrosome",
                "Adipocytes",
                "Astrocytes",
                "B-Lymphocyte Subsets",
                "B-Lymphocytes",
                "Brown Adipocytes",
                "CD4-Positive T-Lymphocytes",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "Macrophages",
                "Melanocytes",
                "Mesangial Cells",
                "Microglia",
                "Muscle Cells",
                "Myelin Sheath",
                "Myoblasts",
                "Myofibroblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neurites",
                "Neuroglia",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Ovum",
                "Podocytes",
                "Podosomes",
                "Schwann Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Spermatozoa",
                "Stromal Cells",
                "T-Lymphocytes",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 21,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Stem cell",
            "Red blood cell (RBC)",
            "White blood cell (WBC)",
            "Platelet",
            "Neuron",
            "Astrocyte",
            "Fibroblast",
            "Keratinocyte",
            "Melanocyte",
            "Osteoblast",
            "Osteoclast",
            "Chondrocyte",
            "Myocyte (muscle cell)",
            "Hepatocyte",
            "Pancreatic beta cell",
            "Thyroid follicular cell",
            "Adrenal cortical cell",
            "Sertoli cell",
            "Leydig cell",
            "Ovarian follicle cell",
            "Mammary gland epithelial cell",
            "Intestinal epithelial cell",
            "Alveolar cell (pneumocyte)",
            "Endothelial cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Stem Cells",
                "Neurons",
                "Astrocytes",
                "Fibroblasts",
                "Keratinocytes",
                "Melanocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Chondrocytes",
                "Muscle Cells",
                "Hepatocytes",
                "Sertoli Cells",
                "Leydig Cells",
                "Endothelial Cells"
            ],
            "mismatches": [
                "Red blood cell (RBC)",
                "White blood cell (WBC)",
                "Platelet",
                "Myocyte (muscle cell)",
                "Pancreatic beta cell",
                "Thyroid follicular cell",
                "Adrenal cortical cell",
                "Ovarian follicle cell",
                "Mammary gland epithelial cell",
                "Intestinal epithelial cell",
                "Alveolar cell (pneumocyte)"
            ],
            "true_referents": [
                "Adult Stem Cells",
                "Alveolar Epithelial Cells",
                "Alveolar Macrophages",
                "Astrocytes",
                "Axons",
                "Blood Cells",
                "Blood Platelets",
                "Chondrocytes",
                "Chromaffin Cells",
                "Corticotrophs",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Enterocytes",
                "Enteroendocrine Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Granulocytes",
                "Granulosa Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Leydig Cells",
                "Melanocytes",
                "Melanophores",
                "Microglia",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Oocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Sertoli Cells",
                "Skeletal Muscle Satellite Cells",
                "Spermatocytes",
                "Stem Cells",
                "Stromal Cells",
                "T Follicular Helper Cells",
                "Thyroid Epithelial Cells"
            ],
            "TP": 14,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Red blood cell (RBC)",
            "Lymphocyte (T cell, B cell)",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Monocyte",
            "Platelet",
            "Epithelial cell",
            "Endothelial cell",
            "Muscle cell (skeletal, cardiac, smooth)",
            "Nerve cell (neuron)",
            "Adipocyte (fat cell)",
            "Osteoblast",
            "Osteoclast",
            "Chondrocyte",
            "Hepatocyte (liver cell)",
            "Nephron (kidney cell)",
            "Melanocyte",
            "Fibroblast",
            "Stem cell (embryonic, adult)",
            "Goblet cell",
            "Ciliated cell",
            "Parietal cell",
            "Pancreatic islet cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lymphocyte (T cell, B cell)",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Monocyte",
                "Epithelial cell",
                "Endothelial cell",
                "Muscle cell (skeletal, cardiac, smooth)",
                "Nerve cell (neuron)",
                "Adipocyte (fat cell)",
                "Osteoblast",
                "Osteoclast",
                "Chondrocyte",
                "Hepatocyte (liver cell)",
                "Melanocyte",
                "Fibroblast",
                "Stem cell (embryonic, adult)",
                "Goblet cell",
                "Parietal cell"
            ],
            "mismatches": [
                "Red blood cell (RBC)",
                "Platelet",
                "Nephron (kidney cell)",
                "Ciliated cell",
                "Pancreatic islet cell"
            ],
            "true_referents": [
                "Acinar Cells",
                "Adipocytes",
                "Adult Stem Cells",
                "B-Lymphocytes",
                "Basophils",
                "Blood Cells",
                "Blood Platelets",
                "Brown Adipocytes",
                "Chondrocytes",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Endothelial Progenitor Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocytes",
                "Eukaryotic Cells",
                "Fibroblasts",
                "Gastric Parietal Cells",
                "Glucagon-Secreting Cells",
                "Goblet Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Mast Cells",
                "Melanocytes",
                "Melanophores",
                "Mesangial Cells",
                "Monocytes",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neurites",
                "Neurons",
                "Neutrophils",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Smooth Muscle Myocytes",
                "Stem Cells",
                "Stromal Cells",
                "Tuft Cells",
                "White Adipocytes",
                "Zygote"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Adipocyte (ADIP)",
            "Astrocyte (ASTR)",
            "B Lymphocyte (B_CELL)",
            "Cardiomyocyte (CARM)",
            "Chondrocyte (CHON)",
            "Dendritic Cell (DC)",
            "Endothelial Cell (EC)",
            "Erythrocyte (RBC)",
            "Fibroblast (FIBR)",
            "Hepatocyte (HEPC)",
            "Keratinocyte (KERA)",
            "Lymphatic Endothelial Cell (LEC)",
            "Macrophage (MACRO)",
            "Melanocyte (MELA)",
            "Microglia (MICR)",
            "Monocyte (MONO)",
            "Myoblast (MYOB)",
            "Neuron (NEUR)",
            "Osteoblast (OSTB)",
            "Osteoclast (OSTC)",
            "Pancreatic Islet Cell (PIC)",
            "Platelet (PLT)",
            "T Lymphocyte (T_CELL)",
            "Urothelial Cell (UC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (ADIP)",
                "Astrocyte (ASTR)",
                "B Lymphocyte (B_CELL)",
                "Chondrocyte (CHON)",
                "Dendritic Cell (DC)",
                "Endothelial Cell (EC)",
                "Erythrocyte (RBC)",
                "Fibroblast (FIBR)",
                "Hepatocyte (HEPC)",
                "Keratinocyte (KERA)",
                "Macrophage (MACRO)",
                "Melanocyte (MELA)",
                "Microglia (MICR)",
                "Monocyte (MONO)",
                "Myoblast (MYOB)",
                "Neuron (NEUR)",
                "Osteoblast (OSTB)",
                "Osteoclast (OSTC)",
                "T Lymphocyte (T_CELL)"
            ],
            "mismatches": [
                "Cardiomyocyte (CARM)",
                "Lymphatic Endothelial Cell (LEC)",
                "Pancreatic Islet Cell (PIC)",
                "Platelet (PLT)",
                "Urothelial Cell (UC)"
            ],
            "true_referents": [
                "Acanthocytes",
                "Adipocytes",
                "Antigen-Presenting Cells",
                "Astrocytes",
                "B-Lymphocytes",
                "Beige Adipocytes",
                "Blood Cells",
                "Blood Platelets",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Dendritic Cells",
                "Endothelial Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Macrophages",
                "Melanocytes",
                "Melanophores",
                "Microglia",
                "Monocytes",
                "Motor Neurons",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Neuroglia",
                "Neurons",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Skeletal Myoblasts",
                "T-Lymphocytes",
                "T-Lymphoid Precursor Cells",
                "White Adipocytes"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Human Keratinocyte (HK)",
            "Neuron (NE)",
            "Epithelial Cell (EC)",
            "Macrophage (M\u03a6)",
            "T-Lymphocyte (T cell)",
            "B-Lymphocyte (B cell)",
            "Dendritic Cell (DC)",
            "Natural Killer Cell (NK cell)",
            "Monocyte (M)",
            "Platelet (PLT)",
            "Erythrocyte (RBC)",
            "Lymphocyte (LY)",
            "Myeloid Progenitor Cell (MPC)",
            "Stem Cell (SC)",
            "Hepatocyte (H)",
            "Pancreatic \u03b2-Cell (P\u03b2C)",
            "Osteoblast (OB)",
            "Osteoclast (OC)",
            "Chondrocyte (Ch)",
            "Fibroblast (FB)",
            "Endothelial Cell (EC)",
            "Smooth Muscle Cell (SMC)",
            "Cardiac Myocyte (CM)",
            "Skeletal Muscle Cell (SMC)",
            "Adipocyte (AD)",
            "Mast Cell (MC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocytes",
                "Neurons",
                "Epithelial Cells",
                "Macrophages",
                "T-Lymphocytes",
                "B-Lymphocytes",
                "Dendritic Cells",
                "Natural Killer Cells",
                "Monocytes",
                "Erythrocytes",
                "Lymphocytes",
                "Myeloid Progenitor Cells",
                "Stem Cells",
                "Hepatocytes",
                "Osteoblasts",
                "Osteoclasts",
                "Chondrocytes",
                "Fibroblasts",
                "Endothelial Cells",
                "Cardiac Myocytes"
            ],
            "mismatches": [
                "Platelet (PLT)",
                "Pancreatic \u03b2-Cell (P\u03b2C)",
                "Smooth Muscle Cell (SMC)",
                "Skeletal Muscle Cell (SMC)",
                "Adipocyte (AD)",
                "Mast Cell (MC)"
            ],
            "true_referents": [
                "Acanthocytes",
                "Adult Stem Cells",
                "Antigen-Presenting Cells",
                "B-Lymphocytes",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Cardiac Myoblasts",
                "Cardiac Myocytes",
                "Chondrocytes",
                "Connective Tissue Cells",
                "Cytotoxic T-Lymphocytes",
                "Dendritic Cells",
                "Embryonic Stem Cells",
                "Endothelial Cells",
                "Epidermal Cells",
                "Epithelial Cells",
                "Erythrocyte Membrane",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Human Umbilical Vein Endothelial Cells",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "Macrophages",
                "Monocytes",
                "Muscle Cells",
                "Myeloid Progenitor Cells",
                "Myofibroblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neurons",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Pyramidal Cells",
                "Skeletal Muscle Satellite Cells",
                "Skeletal Myoblasts",
                "Smooth Muscle Myoblasts",
                "Smooth Muscle Myocytes",
                "Stem Cells",
                "T-Lymphocytes"
            ],
            "TP": 20,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "human cell",
        "domain": "medicine",
        "response": [
            "Neuron (NER)",
            "Adipocyte (ADP)",
            "Muscle cell (MUS)",
            "Epithelial cell (EPI)",
            "Stem cell (SC)",
            "Red blood cell (RBC)",
            "Platelet (PLT)",
            "Natural killer cell (NK)",
            "T cell (T)",
            "B cell (B)",
            "Dendritic cell (DC)",
            "Macrophage (M\u03a6)",
            "Fibroblast (FB)",
            "Osteoblast (OB)",
            "Chondrocyte (CH)",
            "Osteoclast (OC)",
            "Adrenal cell (AC)",
            "Pancreatic beta cell (PBC)",
            "Hepatocyte (HEP)",
            "Keratinocyte (KC)",
            "Melanocyte (MC)",
            "Lymphocyte (LYM)",
            "Monocyte (MON)",
            "Eosinophil (EOS)",
            "Basophil (BAS)",
            "Neutrophil (NEU)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocytes",
                "Chondrocytes",
                "Dendritic Cells",
                "Eosinophils",
                "Epithelial Cells",
                "Fibroblasts",
                "Hepatocytes",
                "Keratinocytes",
                "Lymphocytes",
                "Macrophages",
                "Melanocytes",
                "Monocytes",
                "Muscle Cells",
                "Natural Killer Cells",
                "Neurons",
                "Neutrophils",
                "Osteoblasts",
                "Osteoclasts",
                "Platelets",
                "Stem Cells"
            ],
            "mismatches": [
                "Neuron (NER)",
                "Muscle cell (MUS)",
                "Epithelial cell (EPI)",
                "Red blood cell (RBC)",
                "Platelet (PLT)",
                "Natural killer cell (NK)",
                "T cell (T)",
                "B cell (B)",
                "Macrophage (M\u03a6)",
                "Fibroblast (FB)",
                "Osteoblast (OB)",
                "Chondrocyte (CH)",
                "Osteoclast (OC)",
                "Adrenal cell (AC)",
                "Pancreatic beta cell (PBC)",
                "Hepatocyte (HEP)",
                "Keratinocyte (KC)",
                "Melanocyte (MC)",
                "Lymphocyte (LYM)",
                "Monocyte (MON)",
                "Eosinophil (EOS)",
                "Basophil (BAS)",
                "Neutrophil (NEU)"
            ],
            "true_referents": [
                "Acanthocytes",
                "Adipocytes",
                "Adult Stem Cells",
                "Antigen-Presenting Cells",
                "B-Lymphocyte Subsets",
                "B-Lymphocytes",
                "Beige Adipocytes",
                "Blood Cells",
                "Blood Platelets",
                "Bone Marrow Cells",
                "Chondrocytes",
                "Chromaffin Cells",
                "Connective Tissue Cells",
                "Dendritic Cells",
                "Embryonic Stem Cells",
                "Endocrine Cells",
                "Eosinophils",
                "Epidermal Cells",
                "Epithelial Cells",
                "Epithelioid Cells",
                "Erythrocytes",
                "Fibroblasts",
                "Glucagon-Secreting Cells",
                "Hep G2 Cells",
                "Hepatic Stellate Cells",
                "Hepatocytes",
                "Insulin-Secreting Cells",
                "Interneurons",
                "Keratinocytes",
                "Leukocytes",
                "Lymphocytes",
                "Lymphokine-Activated Killer Cells",
                "Macrophages",
                "Melanocytes",
                "Melanophores",
                "Monocytes",
                "Motor Neurons",
                "Muscle Cells",
                "Myoblasts",
                "Myofibroblasts",
                "Natural Killer Cells",
                "Natural Killer T-Cells",
                "Neuroendocrine Cells",
                "Neurons",
                "Neutrophils",
                "Osteoblasts",
                "Osteoclasts",
                "Osteocytes",
                "Skeletal Muscle Satellite Cells",
                "Stem Cells",
                "T-Lymphocytes",
                "T-Lymphoid Precursor Cells",
                "White Adipocytes"
            ],
            "TP": 20,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "human cell",
        "domain": "medicine",
        "response": "[\n        {\n            \"Canonical Name\": \"Adenosine Triphosphate\" (ATP)\n        },\n        {\n            \"Canonical Name\": \"Adenosine Diphosphate\" (ADP)\n        },\n        {\n            \"Canonical Name\": \"Adenosine Monophosphate\" (AMP)\n        },\n        {\n            \"Canonical Name\": \"Adenosine\"\n        },\n        {\n            \"Canonical Name\": \"Adenine\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 1\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 2\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 3\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 4\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 5\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 6\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 7\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 8\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 9\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 10\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 11\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 12\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 13\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 14\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 15\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 16\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 17\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 18\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 19\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 20\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 21\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 22\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 23\"\n        },\n        {\n            \"Canonical Name\": \"Adenosine Deaminase 24\"\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]