[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Macrophage",
            "Mast Cell",
            "Plasma Cell",
            "Leukocyte",
            "Adipocyte",
            "Eosinophil",
            "Basophil",
            "Dendritic Cell",
            "Mesenchymal Stem Cell",
            "Lymphocyte",
            "Monocyte",
            "Neutrophil",
            "Tissue-resident Memory T Cell",
            "Langerhans Cell",
            "Smooth Muscle Cell",
            "Pericyte",
            "Fibrocyte",
            "Tenocyte",
            "Osteoblast",
            "Chondrocyte",
            "Myofibroblast",
            "Lipocyte",
            "Erythrocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Macrophage",
                "Mast Cell",
                "Plasma Cell",
                "Leukocyte",
                "Adipocyte",
                "Eosinophil",
                "Basophil",
                "Dendritic Cell",
                "Mesenchymal Stem Cell",
                "Lymphocyte",
                "Monocyte",
                "Neutrophil",
                "Tissue-resident Memory T Cell",
                "Langerhans Cell",
                "Smooth Muscle Cell",
                "Pericyte",
                "Fibrocyte",
                "Tenocyte",
                "Osteoblast",
                "Chondrocyte",
                "Myofibroblast",
                "Lipocyte",
                "Erythrocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Basophil",
                "Chondrocyte",
                "Dendritic Cell",
                "Eosinophil",
                "Erythrocyte",
                "Fibroblast (FB)",
                "Fibrocyte",
                "Langerhans Cell",
                "Leukocyte",
                "Lipocyte",
                "Lymphocyte",
                "Macrophage",
                "Mast Cell",
                "Mesenchymal Stem Cell",
                "Monocyte",
                "Myofibroblast",
                "Neutrophil",
                "Osteoblast",
                "Pericyte",
                "Plasma Cell",
                "Smooth Muscle Cell",
                "Tenocyte",
                "Tissue-resident Memory T Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Macrophage (M\u03a6)",
            "Mast cell (MC)",
            "Adipocyte (AD)",
            "Plasma cell (PC)",
            "Mesenchymal stem cell (MSC)",
            "Dendritic cell (DC)",
            "Histiocyte (Hist)",
            "Endothelial cell (EC)",
            "Lymphocyte (Lymph)",
            "Neutrophil (Neu)",
            "Eosinophil (Eos)",
            "Basophil (Baso)",
            "Chondroblast (CB)",
            "Osteoblast (OB)",
            "Reticular cell (RC)",
            "Hyaline cartilage cell (HCC)",
            "Myofibroblast (MyoF)",
            "Goblet cell (GC)",
            "Keratinocyte (KC)",
            "Langerhans cell (LC)",
            "Pericyte (Peri)",
            "Chondrocyte (ChC)",
            "Osteoclast (OCL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Adipocyte (AD)",
                "Plasma cell (PC)",
                "Mesenchymal stem cell (MSC)",
                "Dendritic cell (DC)",
                "Histiocyte (Hist)",
                "Endothelial cell (EC)",
                "Lymphocyte (Lymph)",
                "Neutrophil (Neu)",
                "Eosinophil (Eos)",
                "Basophil (Baso)",
                "Chondroblast (CB)",
                "Osteoblast (OB)",
                "Reticular cell (RC)",
                "Hyaline cartilage cell (HCC)",
                "Myofibroblast (MyoF)",
                "Goblet cell (GC)",
                "Keratinocyte (KC)",
                "Langerhans cell (LC)",
                "Pericyte (Peri)",
                "Chondrocyte (ChC)",
                "Osteoclast (OCL)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AD)",
                "Basophil (Baso)",
                "Chondroblast (CB)",
                "Chondrocyte (ChC)",
                "Dendritic cell (DC)",
                "Endothelial cell (EC)",
                "Eosinophil (Eos)",
                "Fibroblast (FB)",
                "Goblet cell (GC)",
                "Histiocyte (Hist)",
                "Hyaline cartilage cell (HCC)",
                "Keratinocyte (KC)",
                "Langerhans cell (LC)",
                "Lymphocyte (Lymph)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Mesenchymal stem cell (MSC)",
                "Myofibroblast (MyoF)",
                "Neutrophil (Neu)",
                "Osteoblast (OB)",
                "Osteoclast (OCL)",
                "Pericyte (Peri)",
                "Plasma cell (PC)",
                "Reticular cell (RC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Macrophage (M\u03a6)",
            "Mast Cell (MC)",
            "Adipocyte",
            "Lymphocyte",
            "Monocyte",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Plasma Cell",
            "Dendritic Cell",
            "Lymphoid Stem Cell",
            "Myeloid Stem Cell",
            "Endothelial Cell",
            "Schwann Cell",
            "Pericyte",
            "Smooth Muscle Cell",
            "Mesenchymal Stem Cell",
            "Chondrocyte",
            "Osteoblast",
            "Osteoclast",
            "Tendon Cell",
            "Ligament Cell",
            "Fibrocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Macrophage (M\u03a6)",
                "Mast Cell (MC)",
                "Adipocyte",
                "Lymphocyte",
                "Monocyte",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Plasma Cell",
                "Dendritic Cell",
                "Lymphoid Stem Cell",
                "Myeloid Stem Cell",
                "Endothelial Cell",
                "Schwann Cell",
                "Pericyte",
                "Smooth Muscle Cell",
                "Mesenchymal Stem Cell",
                "Chondrocyte",
                "Osteoblast",
                "Osteoclast",
                "Tendon Cell",
                "Ligament Cell",
                "Fibrocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Basophil",
                "Chondrocyte",
                "Dendritic Cell",
                "Endothelial Cell",
                "Eosinophil",
                "Fibroblast (FB)",
                "Fibrocyte",
                "Ligament Cell",
                "Lymphocyte",
                "Lymphoid Stem Cell",
                "Macrophage (M\u03a6)",
                "Mast Cell (MC)",
                "Mesenchymal Stem Cell",
                "Monocyte",
                "Myeloid Stem Cell",
                "Neutrophil",
                "Osteoblast",
                "Osteoclast",
                "Pericyte",
                "Plasma Cell",
                "Schwann Cell",
                "Smooth Muscle Cell",
                "Tendon Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Adipocyte (AD)",
            "Mast Cell (MC)",
            "Macrophage (M\u03a6)",
            "Plasma Cell (PC)",
            "Endothelial Cell (EC)",
            "Pericyte (PR)",
            "Myofibroblast (MF)",
            "Histiocyte (HI)",
            "Collagen-producing cell (CPC)",
            "Reticular cell (RC)",
            "Loose connective tissue macrophage (LCTM)",
            "Adipose-derived stem cell (ADSC)",
            "Connective tissue mast cell (CTMC)",
            "Immune cell in loose connective tissue (ICT)",
            "Interstitial cell (IC)",
            "Dermal fibroblast (DF)",
            "Subcutaneous adipocyte (SAD)",
            "Perivascular cell (PVC)",
            "Loose connective tissue progenitor cell (LCTPC)",
            "Collagen-secreting fibroblast (CSF)",
            "Loose connective tissue histiocyte (LCTH)",
            "Peritoneum-derived cell (PDC)",
            "Visceral adipose tissue cell (VATC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Adipocyte (AD)",
                "Mast Cell (MC)",
                "Macrophage (M\u03a6)",
                "Plasma Cell (PC)",
                "Endothelial Cell (EC)",
                "Pericyte (PR)",
                "Myofibroblast (MF)",
                "Histiocyte (HI)",
                "Collagen-producing cell (CPC)",
                "Reticular cell (RC)",
                "Loose connective tissue macrophage (LCTM)",
                "Adipose-derived stem cell (ADSC)",
                "Connective tissue mast cell (CTMC)",
                "Immune cell in loose connective tissue (ICT)",
                "Interstitial cell (IC)",
                "Dermal fibroblast (DF)",
                "Subcutaneous adipocyte (SAD)",
                "Perivascular cell (PVC)",
                "Loose connective tissue progenitor cell (LCTPC)",
                "Collagen-secreting fibroblast (CSF)",
                "Loose connective tissue histiocyte (LCTH)",
                "Peritoneum-derived cell (PDC)",
                "Visceral adipose tissue cell (VATC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AD)",
                "Adipose-derived stem cell (ADSC)",
                "Collagen-producing cell (CPC)",
                "Collagen-secreting fibroblast (CSF)",
                "Connective tissue mast cell (CTMC)",
                "Dermal fibroblast (DF)",
                "Endothelial Cell (EC)",
                "Fibroblast (FB)",
                "Histiocyte (HI)",
                "Immune cell in loose connective tissue (ICT)",
                "Interstitial cell (IC)",
                "Loose connective tissue histiocyte (LCTH)",
                "Loose connective tissue macrophage (LCTM)",
                "Loose connective tissue progenitor cell (LCTPC)",
                "Macrophage (M\u03a6)",
                "Mast Cell (MC)",
                "Myofibroblast (MF)",
                "Pericyte (PR)",
                "Peritoneum-derived cell (PDC)",
                "Perivascular cell (PVC)",
                "Plasma Cell (PC)",
                "Reticular cell (RC)",
                "Subcutaneous adipocyte (SAD)",
                "Visceral adipose tissue cell (VATC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Adipocyte (AC)",
            "Mast cell (MC)",
            "Macrophage (MP)",
            "Lymphocyte (LC)",
            "Plasma cell (PC)",
            "Mesenchymal stem cell (MSC)",
            "Endothelial cell (EC)",
            "Pericyte (PC)",
            "Dendritic cell (DC)",
            "Myofibroblast (MF)",
            "Eosinophil (EoC)",
            "Neutrophil (NC)",
            "Basophil (BC)",
            "Reticular cell (RC)",
            "Schwann cell (SC)",
            "Chondrocyte (CC)",
            "Osteoblast (OB)",
            "Osteoclast (OC)",
            "Smooth muscle cell (SMC)",
            "Satellite cell (SatC)",
            "Melanocyte (MC)",
            "T cell (TC)",
            "B cell (BC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Adipocyte (AC)",
                "Mast cell (MC)",
                "Macrophage (MP)",
                "Lymphocyte (LC)",
                "Plasma cell (PC)",
                "Mesenchymal stem cell (MSC)",
                "Endothelial cell (EC)",
                "Pericyte (PC)",
                "Dendritic cell (DC)",
                "Myofibroblast (MF)",
                "Eosinophil (EoC)",
                "Neutrophil (NC)",
                "Basophil (BC)",
                "Reticular cell (RC)",
                "Schwann cell (SC)",
                "Chondrocyte (CC)",
                "Osteoblast (OB)",
                "Osteoclast (OC)",
                "Smooth muscle cell (SMC)",
                "Satellite cell (SatC)",
                "Melanocyte (MC)",
                "T cell (TC)",
                "B cell (BC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AC)",
                "B cell (BC)",
                "Basophil (BC)",
                "Chondrocyte (CC)",
                "Dendritic cell (DC)",
                "Endothelial cell (EC)",
                "Eosinophil (EoC)",
                "Fibroblast (FB)",
                "Lymphocyte (LC)",
                "Macrophage (MP)",
                "Mast cell (MC)",
                "Melanocyte (MC)",
                "Mesenchymal stem cell (MSC)",
                "Myofibroblast (MF)",
                "Neutrophil (NC)",
                "Osteoblast (OB)",
                "Osteoclast (OC)",
                "Pericyte (PC)",
                "Plasma cell (PC)",
                "Reticular cell (RC)",
                "Satellite cell (SatC)",
                "Schwann cell (SC)",
                "Smooth muscle cell (SMC)",
                "T cell (TC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Adipocyte (AD)",
            "Macrophage (M\u03a6)",
            "Mast cell (MC)",
            "Plasma cell (PC)",
            "Mesenchymal stem cell (MSC)",
            "Lymphocyte (LY)",
            "Eosinophil (EOS)",
            "Neutrophil (NEU)",
            "Basophil (BAS)",
            "Myofibroblast (MFB)",
            "Reticular cell (RC)",
            "Chondrocyte (CC)",
            "Osteoblast (OB)",
            "Osteocyte (OC)",
            "Endothelial cell (EC)",
            "Pericyte (PCy)",
            "Fibrocyte (FC)",
            "Adipose-derived stem cell (ADSC)",
            "Tenocyte (TC)",
            "Skeletal muscle satellite cell (SMSC)",
            "Dermal papilla cell (DPC)",
            "Synovial fibroblast (SF)",
            "Interstitial cell (IC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Adipocyte (AD)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Plasma cell (PC)",
                "Mesenchymal stem cell (MSC)",
                "Lymphocyte (LY)",
                "Eosinophil (EOS)",
                "Neutrophil (NEU)",
                "Basophil (BAS)",
                "Myofibroblast (MFB)",
                "Reticular cell (RC)",
                "Chondrocyte (CC)",
                "Osteoblast (OB)",
                "Osteocyte (OC)",
                "Endothelial cell (EC)",
                "Pericyte (PCy)",
                "Fibrocyte (FC)",
                "Adipose-derived stem cell (ADSC)",
                "Tenocyte (TC)",
                "Skeletal muscle satellite cell (SMSC)",
                "Dermal papilla cell (DPC)",
                "Synovial fibroblast (SF)",
                "Interstitial cell (IC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AD)",
                "Adipose-derived stem cell (ADSC)",
                "Basophil (BAS)",
                "Chondrocyte (CC)",
                "Dermal papilla cell (DPC)",
                "Endothelial cell (EC)",
                "Eosinophil (EOS)",
                "Fibroblast (FB)",
                "Fibrocyte (FC)",
                "Interstitial cell (IC)",
                "Lymphocyte (LY)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Mesenchymal stem cell (MSC)",
                "Myofibroblast (MFB)",
                "Neutrophil (NEU)",
                "Osteoblast (OB)",
                "Osteocyte (OC)",
                "Pericyte (PCy)",
                "Plasma cell (PC)",
                "Reticular cell (RC)",
                "Skeletal muscle satellite cell (SMSC)",
                "Synovial fibroblast (SF)",
                "Tenocyte (TC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast",
            "Adipocyte",
            "Mast Cell",
            "Macrophage",
            "Plasma Cell",
            "Mesenchymal Cell",
            "Eosinophil",
            "Neutrophil",
            "Basophil",
            "Lymphocyte",
            "Monocyte",
            "Endothelial Cell",
            "Pericyte",
            "Melanocyte",
            "Schwann Cell",
            "Microglia",
            "Kupffer Cell",
            "Fat Cell",
            "White Blood Cell",
            "Red Blood Cell",
            "Platelet",
            "Stem Cell",
            "Dendritic Cell",
            "T Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast",
                "Adipocyte",
                "Mast Cell",
                "Macrophage",
                "Plasma Cell",
                "Mesenchymal Cell",
                "Eosinophil",
                "Neutrophil",
                "Basophil",
                "Lymphocyte",
                "Monocyte",
                "Endothelial Cell",
                "Pericyte",
                "Melanocyte",
                "Schwann Cell",
                "Microglia",
                "Kupffer Cell",
                "Fat Cell",
                "White Blood Cell",
                "Red Blood Cell",
                "Platelet",
                "Stem Cell",
                "Dendritic Cell",
                "T Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Basophil",
                "Dendritic Cell",
                "Endothelial Cell",
                "Eosinophil",
                "Fat Cell",
                "Fibroblast",
                "Kupffer Cell",
                "Lymphocyte",
                "Macrophage",
                "Mast Cell",
                "Melanocyte",
                "Mesenchymal Cell",
                "Microglia",
                "Monocyte",
                "Neutrophil",
                "Pericyte",
                "Plasma Cell",
                "Platelet",
                "Red Blood Cell",
                "Schwann Cell",
                "Stem Cell",
                "T Cell",
                "White Blood Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast",
            "Adipocyte",
            "Mast cell",
            "Macrophage",
            "Plasma cell",
            "Mesenchymal stem cell",
            "Chondrocyte",
            "Osteoblast",
            "Osteoclast",
            "White blood cell",
            "Fibrocyte",
            "Myofibroblast",
            "Pericyte",
            "Endothelial cell",
            "Smooth muscle cell",
            "Eosinophil",
            "Neutrophil",
            "Basophil",
            "Lymphocyte",
            "Monocyte",
            "Natural killer cell",
            "Dendritic cell",
            "Macrophage precursor",
            "Mast cell precursor"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast",
                "Adipocyte",
                "Mast cell",
                "Macrophage",
                "Plasma cell",
                "Mesenchymal stem cell",
                "Chondrocyte",
                "Osteoblast",
                "Osteoclast",
                "White blood cell",
                "Fibrocyte",
                "Myofibroblast",
                "Pericyte",
                "Endothelial cell",
                "Smooth muscle cell",
                "Eosinophil",
                "Neutrophil",
                "Basophil",
                "Lymphocyte",
                "Monocyte",
                "Natural killer cell",
                "Dendritic cell",
                "Macrophage precursor",
                "Mast cell precursor"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Basophil",
                "Chondrocyte",
                "Dendritic cell",
                "Endothelial cell",
                "Eosinophil",
                "Fibroblast",
                "Fibrocyte",
                "Lymphocyte",
                "Macrophage",
                "Macrophage precursor",
                "Mast cell",
                "Mast cell precursor",
                "Mesenchymal stem cell",
                "Monocyte",
                "Myofibroblast",
                "Natural killer cell",
                "Neutrophil",
                "Osteoblast",
                "Osteoclast",
                "Pericyte",
                "Plasma cell",
                "Smooth muscle cell",
                "White blood cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblasts (Fb)",
            "Adipocytes (Ad)",
            "Mast Cells (MC)",
            "Macrophages (M\u03c6)",
            "Plasma Cells (PC)",
            "T Lymphocytes (T cells)",
            "B Lymphocytes (B cells)",
            "Natural Killer Cells (NK cells)",
            "Neutrophils (Neut)",
            "Eosinophils (Eos)",
            "Basophils (Bas)",
            "Fibrocytes",
            "Dendritic Cells (DC)",
            "Pericytes (PCy)",
            "Mesenchymal Stem Cells (MSC)",
            "Myofibroblasts",
            "Fibroblast-like Cells",
            "Stromal Cells",
            "Resident Immune Cells",
            "Telocytes",
            "Schwann Cells",
            "Endothelial Cells",
            "Smooth Muscle Cells",
            "Satellite Cells"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblasts (Fb)",
                "Adipocytes (Ad)",
                "Mast Cells (MC)",
                "Macrophages (M\u03c6)",
                "Plasma Cells (PC)",
                "T Lymphocytes (T cells)",
                "B Lymphocytes (B cells)",
                "Natural Killer Cells (NK cells)",
                "Neutrophils (Neut)",
                "Eosinophils (Eos)",
                "Basophils (Bas)",
                "Fibrocytes",
                "Dendritic Cells (DC)",
                "Pericytes (PCy)",
                "Mesenchymal Stem Cells (MSC)",
                "Myofibroblasts",
                "Fibroblast-like Cells",
                "Stromal Cells",
                "Resident Immune Cells",
                "Telocytes",
                "Schwann Cells",
                "Endothelial Cells",
                "Smooth Muscle Cells",
                "Satellite Cells"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocytes (Ad)",
                "B Lymphocytes (B cells)",
                "Basophils (Bas)",
                "Dendritic Cells (DC)",
                "Endothelial Cells",
                "Eosinophils (Eos)",
                "Fibroblast-like Cells",
                "Fibroblasts (Fb)",
                "Fibrocytes",
                "Macrophages (M\u03c6)",
                "Mast Cells (MC)",
                "Mesenchymal Stem Cells (MSC)",
                "Myofibroblasts",
                "Natural Killer Cells (NK cells)",
                "Neutrophils (Neut)",
                "Pericytes (PCy)",
                "Plasma Cells (PC)",
                "Resident Immune Cells",
                "Satellite Cells",
                "Schwann Cells",
                "Smooth Muscle Cells",
                "Stromal Cells",
                "T Lymphocytes (T cells)",
                "Telocytes"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast",
            "Macrophage",
            "Mast cell",
            "Plasma cell",
            "Adipocyte",
            "Mesenchymal stem cell",
            "Lymphocyte",
            "Eosinophil",
            "Neutrophil",
            "Dendritic cell",
            "Pericyte",
            "Telocyte",
            "Histiocyte",
            "Myofibroblast",
            "Reticular cell",
            "Melanocyte",
            "Schwann cell",
            "Satellite cell",
            "Interstitial cell of Cajal",
            "Synovial cell",
            "Osteoblast",
            "Chondroblast",
            "Odontoblast",
            "Cementoblast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast",
                "Macrophage",
                "Mast cell",
                "Plasma cell",
                "Adipocyte",
                "Mesenchymal stem cell",
                "Lymphocyte",
                "Eosinophil",
                "Neutrophil",
                "Dendritic cell",
                "Pericyte",
                "Telocyte",
                "Histiocyte",
                "Myofibroblast",
                "Reticular cell",
                "Melanocyte",
                "Schwann cell",
                "Satellite cell",
                "Interstitial cell of Cajal",
                "Synovial cell",
                "Osteoblast",
                "Chondroblast",
                "Odontoblast",
                "Cementoblast"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Cementoblast",
                "Chondroblast",
                "Dendritic cell",
                "Eosinophil",
                "Fibroblast",
                "Histiocyte",
                "Interstitial cell of Cajal",
                "Lymphocyte",
                "Macrophage",
                "Mast cell",
                "Melanocyte",
                "Mesenchymal stem cell",
                "Myofibroblast",
                "Neutrophil",
                "Odontoblast",
                "Osteoblast",
                "Pericyte",
                "Plasma cell",
                "Reticular cell",
                "Satellite cell",
                "Schwann cell",
                "Synovial cell",
                "Telocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast",
            "Mesenchymal stem cell (MSC)",
            "Adipocyte",
            "Macrophage",
            "Mast cell",
            "Plasma cell",
            "Reticular cell",
            "Melanocyte",
            "Pericyte",
            "Adventitial cell",
            "Interstitial cell of Cajal (ICC)",
            "Telocyte",
            "Myofibroblast",
            "Fibrocyte",
            "Stromal cell",
            "Stellate cell",
            "Dermal dendrocyte",
            "Histiocyte",
            "Langerhans cell",
            "Dendritic cell (DC)",
            "Endothelial progenitor cell (EPC)",
            "Mesenchymal progenitor cell (MPC)",
            "Smooth muscle progenitor cell (SmPC)",
            "Lymphatic endothelial cell (LEC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast",
                "Mesenchymal stem cell (MSC)",
                "Adipocyte",
                "Macrophage",
                "Mast cell",
                "Plasma cell",
                "Reticular cell",
                "Melanocyte",
                "Pericyte",
                "Adventitial cell",
                "Interstitial cell of Cajal (ICC)",
                "Telocyte",
                "Myofibroblast",
                "Fibrocyte",
                "Stromal cell",
                "Stellate cell",
                "Dermal dendrocyte",
                "Histiocyte",
                "Langerhans cell",
                "Dendritic cell (DC)",
                "Endothelial progenitor cell (EPC)",
                "Mesenchymal progenitor cell (MPC)",
                "Smooth muscle progenitor cell (SmPC)",
                "Lymphatic endothelial cell (LEC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Adventitial cell",
                "Dendritic cell (DC)",
                "Dermal dendrocyte",
                "Endothelial progenitor cell (EPC)",
                "Fibroblast",
                "Fibrocyte",
                "Histiocyte",
                "Interstitial cell of Cajal (ICC)",
                "Langerhans cell",
                "Lymphatic endothelial cell (LEC)",
                "Macrophage",
                "Mast cell",
                "Melanocyte",
                "Mesenchymal progenitor cell (MPC)",
                "Mesenchymal stem cell (MSC)",
                "Myofibroblast",
                "Pericyte",
                "Plasma cell",
                "Reticular cell",
                "Smooth muscle progenitor cell (SmPC)",
                "Stellate cell",
                "Stromal cell",
                "Telocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (Fb)",
            "Adipocyte (Ad)",
            "Macrophage (M\u03d5)",
            "Mast cell (MC)",
            "Plasma cell (PC)",
            "Melanocyte (Mel)",
            "Leukocyte (WBC)",
            "Lymphocyte (Ly)",
            "Monocyte (Mo)",
            "Neutrophil (Neu)",
            "Eosinophil (Eo)",
            "Basophil (Ba)",
            "Reticular cell (RC)",
            "Stem cell (SC)",
            "Pericyte (Per)",
            "Myofibroblast (MFb)",
            "Mesenchymal stem cell (MSC)",
            "Fibrocyte (FC)",
            "Histiocyte (HC)",
            "Myoepithelial cell (MEC)",
            "Interstitial cell (IC)",
            "Areolar cell (AC)",
            "Mucosal cell (MuC)",
            "Adventitial cell (AdC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (Fb)",
                "Adipocyte (Ad)",
                "Macrophage (M\u03d5)",
                "Mast cell (MC)",
                "Plasma cell (PC)",
                "Melanocyte (Mel)",
                "Leukocyte (WBC)",
                "Lymphocyte (Ly)",
                "Monocyte (Mo)",
                "Neutrophil (Neu)",
                "Eosinophil (Eo)",
                "Basophil (Ba)",
                "Reticular cell (RC)",
                "Stem cell (SC)",
                "Pericyte (Per)",
                "Myofibroblast (MFb)",
                "Mesenchymal stem cell (MSC)",
                "Fibrocyte (FC)",
                "Histiocyte (HC)",
                "Myoepithelial cell (MEC)",
                "Interstitial cell (IC)",
                "Areolar cell (AC)",
                "Mucosal cell (MuC)",
                "Adventitial cell (AdC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (Ad)",
                "Adventitial cell (AdC)",
                "Areolar cell (AC)",
                "Basophil (Ba)",
                "Eosinophil (Eo)",
                "Fibroblast (Fb)",
                "Fibrocyte (FC)",
                "Histiocyte (HC)",
                "Interstitial cell (IC)",
                "Leukocyte (WBC)",
                "Lymphocyte (Ly)",
                "Macrophage (M\u03d5)",
                "Mast cell (MC)",
                "Melanocyte (Mel)",
                "Mesenchymal stem cell (MSC)",
                "Monocyte (Mo)",
                "Mucosal cell (MuC)",
                "Myoepithelial cell (MEC)",
                "Myofibroblast (MFb)",
                "Neutrophil (Neu)",
                "Pericyte (Per)",
                "Plasma cell (PC)",
                "Reticular cell (RC)",
                "Stem cell (SC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Adipocyte (AD)",
            "Mast cell (MC)",
            "Macrophage (MP)",
            "Lymphocyte (LC)",
            "Plasma cell (PC)",
            "Neutrophil (NE)",
            "Eosinophil (EO)",
            "Basophil (BA)",
            "Monocyte (MO)",
            "Mesenchymal stem cell (MSC)",
            "Chondrocyte (CH)",
            "Osteoblast (OB)",
            "Osteoclast (OC)",
            "Tenocyte (TC)",
            "Pericyte (PC)",
            "Endothelial cell (EC)",
            "Smooth muscle cell (SMC)",
            "Preadipocyte (PA)",
            "Reticular cell (RC)",
            "Myofibroblast (MFB)",
            "Histiocyte (HC)",
            "Interstitial cell (IC)",
            "Adventitial cell (AC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Adipocyte (AD)",
                "Mast cell (MC)",
                "Macrophage (MP)",
                "Lymphocyte (LC)",
                "Plasma cell (PC)",
                "Neutrophil (NE)",
                "Eosinophil (EO)",
                "Basophil (BA)",
                "Monocyte (MO)",
                "Mesenchymal stem cell (MSC)",
                "Chondrocyte (CH)",
                "Osteoblast (OB)",
                "Osteoclast (OC)",
                "Tenocyte (TC)",
                "Pericyte (PC)",
                "Endothelial cell (EC)",
                "Smooth muscle cell (SMC)",
                "Preadipocyte (PA)",
                "Reticular cell (RC)",
                "Myofibroblast (MFB)",
                "Histiocyte (HC)",
                "Interstitial cell (IC)",
                "Adventitial cell (AC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AD)",
                "Adventitial cell (AC)",
                "Basophil (BA)",
                "Chondrocyte (CH)",
                "Endothelial cell (EC)",
                "Eosinophil (EO)",
                "Fibroblast (FB)",
                "Histiocyte (HC)",
                "Interstitial cell (IC)",
                "Lymphocyte (LC)",
                "Macrophage (MP)",
                "Mast cell (MC)",
                "Mesenchymal stem cell (MSC)",
                "Monocyte (MO)",
                "Myofibroblast (MFB)",
                "Neutrophil (NE)",
                "Osteoblast (OB)",
                "Osteoclast (OC)",
                "Pericyte (PC)",
                "Plasma cell (PC)",
                "Preadipocyte (PA)",
                "Reticular cell (RC)",
                "Smooth muscle cell (SMC)",
                "Tenocyte (TC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Fibrocyte",
            "Histiocyte",
            "Dermal fibroblast",
            "Endothelial cell",
            "Pericyte",
            "Mesangial cell",
            "Perivascular cell",
            "Myofibroblast",
            "Fibroblast-like synoviocyte",
            "Synoviocyte",
            "Tenocyte",
            "Chondrocyte",
            "Osteocyte",
            "Adipocyte",
            "Macrophage",
            "Dendritic cell",
            "Lymphatic endothelial cell",
            "Endothelial progenitor cell",
            "Vascular smooth muscle cell",
            "Smooth muscle cell",
            "Myoblast",
            "Satellite cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Fibrocyte",
                "Histiocyte",
                "Dermal fibroblast",
                "Endothelial cell",
                "Pericyte",
                "Mesangial cell",
                "Perivascular cell",
                "Myofibroblast",
                "Fibroblast-like synoviocyte",
                "Synoviocyte",
                "Tenocyte",
                "Chondrocyte",
                "Osteocyte",
                "Adipocyte",
                "Macrophage",
                "Dendritic cell",
                "Lymphatic endothelial cell",
                "Endothelial progenitor cell",
                "Vascular smooth muscle cell",
                "Smooth muscle cell",
                "Myoblast",
                "Satellite cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Chondrocyte",
                "Dendritic cell",
                "Dermal fibroblast",
                "Endothelial cell",
                "Endothelial progenitor cell",
                "Fibroblast (FB)",
                "Fibroblast-like synoviocyte",
                "Fibrocyte",
                "Histiocyte",
                "Lymphatic endothelial cell",
                "Macrophage",
                "Mesangial cell",
                "Myoblast",
                "Myofibroblast",
                "Osteocyte",
                "Pericyte",
                "Perivascular cell",
                "Satellite cell",
                "Smooth muscle cell",
                "Synoviocyte",
                "Tenocyte",
                "Vascular smooth muscle cell"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            "Fibroblast (FB)",
            "Chondrocyte (CHD)",
            "Adipocyte (ADP)",
            "Mast cell (MC)",
            "Chondroblast (CHBL)",
            "Osteocyte (OCY)",
            "Osteoblast (OBL)",
            "Osteoclast (OCL)",
            "Adventitial cell (ADV)",
            "Telocyte (TEL)",
            "Cementocyte (CEM)",
            "Pericyte (PER)",
            "Mesenchymal stem cell (MSC)",
            "Stromal cell (STC)",
            "Pancreatic stellate cell (PSC)",
            "Hepatic stellate cell (HSC)",
            "Renal fibroblast (RFB)",
            "Dermal fibroblast (DFB)",
            "Tendon fibroblast (TFB)",
            "Ligament fibroblast (LFB)",
            "Synovial fibroblast (SFB)",
            "Corneal fibroblast (CFB)",
            "Cardiac fibroblast (CFb)",
            "Pulmonary fibroblast (PFb)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fibroblast (FB)",
                "Chondrocyte (CHD)",
                "Adipocyte (ADP)",
                "Mast cell (MC)",
                "Chondroblast (CHBL)",
                "Osteocyte (OCY)",
                "Osteoblast (OBL)",
                "Osteoclast (OCL)",
                "Adventitial cell (ADV)",
                "Telocyte (TEL)",
                "Cementocyte (CEM)",
                "Pericyte (PER)",
                "Mesenchymal stem cell (MSC)",
                "Stromal cell (STC)",
                "Pancreatic stellate cell (PSC)",
                "Hepatic stellate cell (HSC)",
                "Renal fibroblast (RFB)",
                "Dermal fibroblast (DFB)",
                "Tendon fibroblast (TFB)",
                "Ligament fibroblast (LFB)",
                "Synovial fibroblast (SFB)",
                "Corneal fibroblast (CFB)",
                "Cardiac fibroblast (CFb)",
                "Pulmonary fibroblast (PFb)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (ADP)",
                "Adventitial cell (ADV)",
                "Cardiac fibroblast (CFb)",
                "Cementocyte (CEM)",
                "Chondroblast (CHBL)",
                "Chondrocyte (CHD)",
                "Corneal fibroblast (CFB)",
                "Dermal fibroblast (DFB)",
                "Fibroblast (FB)",
                "Hepatic stellate cell (HSC)",
                "Ligament fibroblast (LFB)",
                "Mast cell (MC)",
                "Mesenchymal stem cell (MSC)",
                "Osteoblast (OBL)",
                "Osteoclast (OCL)",
                "Osteocyte (OCY)",
                "Pancreatic stellate cell (PSC)",
                "Pericyte (PER)",
                "Pulmonary fibroblast (PFb)",
                "Renal fibroblast (RFB)",
                "Stromal cell (STC)",
                "Synovial fibroblast (SFB)",
                "Telocyte (TEL)",
                "Tendon fibroblast (TFB)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "stromal cell",
        "domain": "biology",
        "response": [
            {
                "referent": "areolar connective tissue"
            },
            {
                "referent": "adipose tissue"
            },
            {
                "referent": "bone marrow"
            },
            {
                "referent": "cartilage"
            },
            {
                "referent": "dura mater"
            },
            {
                "referent": "loose connective tissue"
            },
            {
                "referent": "meniscus"
            },
            {
                "referent": "synovial membrane"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "areolar connective tissue",
                "adipose tissue",
                "bone marrow",
                "cartilage",
                "dura mater",
                "loose connective tissue",
                "meniscus",
                "synovial membrane"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"referent\": \"adipose tissue\"}",
                "{\"referent\": \"areolar connective tissue\"}",
                "{\"referent\": \"bone marrow\"}",
                "{\"referent\": \"cartilage\"}",
                "{\"referent\": \"dura mater\"}",
                "{\"referent\": \"loose connective tissue\"}",
                "{\"referent\": \"meniscus\"}",
                "{\"referent\": \"synovial membrane\"}"
            ],
            "TP": 8,
            "FP": 0,
            "FN": 0
        }
    }
]