[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (fat cell)",
            "Lipid droplet",
            "Oocyte",
            "Spermatocyte",
            "Mammary gland cell",
            "Chondrocyte",
            "Myocyte",
            "Hepatocyte",
            "Neuron",
            "Retinal pigment epithelial cell",
            "Kupffer cell",
            "Macrophage",
            "Melanocyte",
            "Pancreatic beta cell",
            "Platelet",
            "T lymphocyte",
            "B lymphocyte",
            "Erythrocyte",
            "Epithelial cell",
            "Fibroblast",
            "Osteoblast",
            "Osteoclast",
            "Osteocyte",
            "Smooth muscle cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (fat cell)",
                "Lipid droplet",
                "Oocyte",
                "Spermatocyte",
                "Mammary gland cell",
                "Chondrocyte",
                "Myocyte",
                "Hepatocyte",
                "Neuron",
                "Retinal pigment epithelial cell",
                "Kupffer cell",
                "Macrophage",
                "Melanocyte",
                "Pancreatic beta cell",
                "Platelet",
                "T lymphocyte",
                "B lymphocyte",
                "Erythrocyte",
                "Epithelial cell",
                "Fibroblast",
                "Osteoblast",
                "Osteoclast",
                "Osteocyte",
                "Smooth muscle cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (fat cell)",
                "B lymphocyte",
                "Chondrocyte",
                "Epithelial cell",
                "Erythrocyte",
                "Fibroblast",
                "Hepatocyte",
                "Kupffer cell",
                "Lipid droplet",
                "Macrophage",
                "Mammary gland cell",
                "Melanocyte",
                "Myocyte",
                "Neuron",
                "Oocyte",
                "Osteoblast",
                "Osteoclast",
                "Osteocyte",
                "Pancreatic beta cell",
                "Platelet",
                "Retinal pigment epithelial cell",
                "Smooth muscle cell",
                "Spermatocyte",
                "T lymphocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (Adipose cell)",
            "Brown adipocyte (Brown fat cell)",
            "White adipocyte (White fat cell)",
            "Unilocular adipocyte",
            "Multilocular adipocyte",
            "Brown fat cell",
            "White fat cell",
            "Beige adipocyte",
            "Subcutaneous adipocyte",
            "Visceral adipocyte",
            "Interscapular brown fat cell",
            "Brown adipose tissue cell",
            "White adipose tissue cell",
            "Adipocyte precursor cell",
            "Adipogenic cell",
            "Pre-adipocyte",
            "Mesenchymal stem cell-derived adipocyte",
            "Adipocyte-derived stem cell",
            "Adipose-derived stem cell",
            "Brown pre-adipocyte",
            "White pre-adipocyte",
            "Adipocyte-like cell",
            "Brown adipocyte progenitor cell",
            "White adipocyte progenitor cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (Adipose cell)",
                "Brown adipocyte (Brown fat cell)",
                "White adipocyte (White fat cell)",
                "Unilocular adipocyte",
                "Multilocular adipocyte",
                "Brown fat cell",
                "White fat cell",
                "Beige adipocyte",
                "Subcutaneous adipocyte",
                "Visceral adipocyte",
                "Interscapular brown fat cell",
                "Brown adipose tissue cell",
                "White adipose tissue cell",
                "Adipocyte precursor cell",
                "Adipogenic cell",
                "Pre-adipocyte",
                "Mesenchymal stem cell-derived adipocyte",
                "Adipocyte-derived stem cell",
                "Adipose-derived stem cell",
                "Brown pre-adipocyte",
                "White pre-adipocyte",
                "Adipocyte-like cell",
                "Brown adipocyte progenitor cell",
                "White adipocyte progenitor cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (Adipose cell)",
                "Adipocyte precursor cell",
                "Adipocyte-derived stem cell",
                "Adipocyte-like cell",
                "Adipogenic cell",
                "Adipose-derived stem cell",
                "Beige adipocyte",
                "Brown adipocyte (Brown fat cell)",
                "Brown adipocyte progenitor cell",
                "Brown adipose tissue cell",
                "Brown fat cell",
                "Brown pre-adipocyte",
                "Interscapular brown fat cell",
                "Mesenchymal stem cell-derived adipocyte",
                "Multilocular adipocyte",
                "Pre-adipocyte",
                "Subcutaneous adipocyte",
                "Unilocular adipocyte",
                "Visceral adipocyte",
                "White adipocyte (White fat cell)",
                "White adipocyte progenitor cell",
                "White adipose tissue cell",
                "White fat cell",
                "White pre-adipocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (Fat Cell)",
            "White Adipocyte",
            "Brown Adipocyte",
            "Beige Adipocyte",
            "Lipocyte",
            "Adipose Cell",
            "Preadipocyte",
            "Mammary Gland Cell",
            "Ovarian Theca Cell",
            "Ovarian Granulosa Cell",
            "Mesenchymal Stem Cell (MSC)",
            "Osteoblast",
            "Chondrocyte",
            "Hepatocyte",
            "Enterocyte",
            "Pancreatic Beta Cell",
            "Pancreatic Alpha Cell",
            "Pancreatic Delta Cell",
            "Pancreatic PP Cell",
            "Pancreatic Epsilon Cell",
            "Pancreatic Acinar Cell",
            "Pancreatic Ductal Cell",
            "Smooth Muscle Cell",
            "Cardiomyocyte",
            "Endothelial Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (Fat Cell)",
                "White Adipocyte",
                "Brown Adipocyte",
                "Beige Adipocyte",
                "Lipocyte",
                "Adipose Cell",
                "Preadipocyte",
                "Mammary Gland Cell",
                "Ovarian Theca Cell",
                "Ovarian Granulosa Cell",
                "Mesenchymal Stem Cell (MSC)",
                "Osteoblast",
                "Chondrocyte",
                "Hepatocyte",
                "Enterocyte",
                "Pancreatic Beta Cell",
                "Pancreatic Alpha Cell",
                "Pancreatic Delta Cell",
                "Pancreatic PP Cell",
                "Pancreatic Epsilon Cell",
                "Pancreatic Acinar Cell",
                "Pancreatic Ductal Cell",
                "Smooth Muscle Cell",
                "Cardiomyocyte"
            ],
            "mismatches": [
                "Endothelial Cell"
            ],
            "true_referents": [
                "Adipocyte (Fat Cell)",
                "Adipose Cell",
                "Beige Adipocyte",
                "Brown Adipocyte",
                "Cardiomyocyte",
                "Chondrocyte",
                "Enterocyte",
                "Hepatocyte",
                "Lipocyte",
                "Mammary Gland Cell",
                "Mesenchymal Stem Cell (MSC)",
                "Osteoblast",
                "Ovarian Granulosa Cell",
                "Ovarian Theca Cell",
                "Pancreatic Acinar Cell",
                "Pancreatic Alpha Cell",
                "Pancreatic Beta Cell",
                "Pancreatic Delta Cell",
                "Pancreatic Ductal Cell",
                "Pancreatic Epsilon Cell",
                "Pancreatic PP Cell",
                "Preadipocyte",
                "Smooth Muscle Cell",
                "White Adipocyte"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (AD)",
            "Steatoblast",
            "Perilipin-coated lipid droplet",
            "White adipose tissue cell",
            "Brown adipose tissue cell",
            "Hibernating bear adipose cell",
            "Blubber cell (seal)",
            "Subcutaneous adipocyte",
            "Visceral adipocyte",
            "Intramuscular fat cell",
            "Bone marrow adipocyte",
            "Cardiac adipocyte",
            "Periovarian adipocyte",
            "Epididymal adipocyte",
            "Mesenteric adipocyte",
            "Retrop\u0435ritoneal adipocyte",
            "Omental adipocyte",
            "Adipocyte precursor cell",
            "Pre-adipocyte",
            "Mature adipocyte",
            "Multilocular adipocyte",
            "Unilocular adipocyte",
            "Lipoma cell",
            "Sebocyte (skin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (AD)",
                "Steatoblast",
                "Perilipin-coated lipid droplet",
                "White adipose tissue cell",
                "Brown adipose tissue cell",
                "Hibernating bear adipose cell",
                "Blubber cell (seal)",
                "Subcutaneous adipocyte",
                "Visceral adipocyte",
                "Intramuscular fat cell",
                "Bone marrow adipocyte",
                "Cardiac adipocyte",
                "Periovarian adipocyte",
                "Epididymal adipocyte",
                "Mesenteric adipocyte",
                "Retrop\u0435ritoneal adipocyte",
                "Omental adipocyte",
                "Adipocyte precursor cell",
                "Pre-adipocyte",
                "Mature adipocyte",
                "Multilocular adipocyte",
                "Unilocular adipocyte",
                "Lipoma cell",
                "Sebocyte (skin)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AD)",
                "Adipocyte precursor cell",
                "Blubber cell (seal)",
                "Bone marrow adipocyte",
                "Brown adipose tissue cell",
                "Cardiac adipocyte",
                "Epididymal adipocyte",
                "Hibernating bear adipose cell",
                "Intramuscular fat cell",
                "Lipoma cell",
                "Mature adipocyte",
                "Mesenteric adipocyte",
                "Multilocular adipocyte",
                "Omental adipocyte",
                "Perilipin-coated lipid droplet",
                "Periovarian adipocyte",
                "Pre-adipocyte",
                "Retrop\u0435ritoneal adipocyte",
                "Sebocyte (skin)",
                "Steatoblast",
                "Subcutaneous adipocyte",
                "Unilocular adipocyte",
                "Visceral adipocyte",
                "White adipose tissue cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte",
            "Lipid Droplet Cell",
            "Brown Adipocyte",
            "White Adipocyte",
            "Beige Adipocyte",
            "Multilocular Adipocyte",
            "Unilocular Adipocyte",
            "Subcutaneous Fat Cell",
            "Visceral Fat Cell",
            "Intramuscular Adipocyte",
            "Perivascular Adipocyte",
            "Perirenal Adipocyte",
            "Epicardial Adipocyte",
            "Pericardial Adipocyte",
            "Mammary Gland Adipocyte",
            "Bone Marrow Adipocyte",
            "Omental Fat Cell",
            "Mesenteric Fat Cell",
            "Retroperitoneal Adipocyte",
            "Gonadal Fat Cell",
            "Dermal White Adipocyte",
            "Periosteal Adipocyte",
            "Orbital Adipocyte",
            "Buccal Fat Pad Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte",
                "Lipid Droplet Cell",
                "Brown Adipocyte",
                "White Adipocyte",
                "Beige Adipocyte",
                "Multilocular Adipocyte",
                "Unilocular Adipocyte",
                "Subcutaneous Fat Cell",
                "Visceral Fat Cell",
                "Intramuscular Adipocyte",
                "Perivascular Adipocyte",
                "Perirenal Adipocyte",
                "Epicardial Adipocyte",
                "Pericardial Adipocyte",
                "Mammary Gland Adipocyte",
                "Bone Marrow Adipocyte",
                "Omental Fat Cell",
                "Mesenteric Fat Cell",
                "Retroperitoneal Adipocyte",
                "Gonadal Fat Cell",
                "Dermal White Adipocyte",
                "Periosteal Adipocyte",
                "Orbital Adipocyte",
                "Buccal Fat Pad Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Beige Adipocyte",
                "Bone Marrow Adipocyte",
                "Brown Adipocyte",
                "Buccal Fat Pad Cell",
                "Dermal White Adipocyte",
                "Epicardial Adipocyte",
                "Gonadal Fat Cell",
                "Intramuscular Adipocyte",
                "Lipid Droplet Cell",
                "Mammary Gland Adipocyte",
                "Mesenteric Fat Cell",
                "Multilocular Adipocyte",
                "Omental Fat Cell",
                "Orbital Adipocyte",
                "Pericardial Adipocyte",
                "Periosteal Adipocyte",
                "Perirenal Adipocyte",
                "Perivascular Adipocyte",
                "Retroperitoneal Adipocyte",
                "Subcutaneous Fat Cell",
                "Unilocular Adipocyte",
                "Visceral Fat Cell",
                "White Adipocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (ADP)",
            "White adipose tissue cell (WAT)",
            "Brown adipose tissue cell (BAT)",
            "Lipid droplet-containing cell (LDC)",
            "Subcutaneous fat cell (SFC)",
            "Visceral fat cell (VFC)",
            "Hepatic stellate cell (HSC)",
            "Bone marrow adipocyte (BMA)",
            "Pancreatic adipocyte (PAC)",
            "Omental adipocyte (OAC)",
            "Perivascular adipocyte (PVAC)",
            "Epicardial adipocyte (EAC)",
            "Dermal adipocyte (DAC)",
            "Intradermal adipocyte (IDAC)",
            "Renal adipocyte (RAC)",
            "Thyroid adipocyte (TAC)",
            "Muscle adipocyte (MAC)",
            "Chondrocyte-derived adipocyte (CDA)",
            "Neonatal adipocyte (NADP)",
            "Adult adipocyte (AADP)",
            "Pregnant adipocyte (PADP)",
            "Obese adipocyte (OADP)",
            "Diabetic adipocyte (DADP)",
            "Caloric restriction-induced adipocyte (CRADP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (ADP)",
                "White adipose tissue cell (WAT)",
                "Brown adipose tissue cell (BAT)",
                "Lipid droplet-containing cell (LDC)",
                "Subcutaneous fat cell (SFC)",
                "Visceral fat cell (VFC)",
                "Hepatic stellate cell (HSC)",
                "Bone marrow adipocyte (BMA)",
                "Pancreatic adipocyte (PAC)",
                "Omental adipocyte (OAC)",
                "Perivascular adipocyte (PVAC)",
                "Epicardial adipocyte (EAC)",
                "Dermal adipocyte (DAC)",
                "Intradermal adipocyte (IDAC)",
                "Renal adipocyte (RAC)",
                "Thyroid adipocyte (TAC)",
                "Muscle adipocyte (MAC)",
                "Chondrocyte-derived adipocyte (CDA)",
                "Neonatal adipocyte (NADP)",
                "Adult adipocyte (AADP)",
                "Pregnant adipocyte (PADP)",
                "Obese adipocyte (OADP)",
                "Diabetic adipocyte (DADP)",
                "Caloric restriction-induced adipocyte (CRADP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (ADP)",
                "Adult adipocyte (AADP)",
                "Bone marrow adipocyte (BMA)",
                "Brown adipose tissue cell (BAT)",
                "Caloric restriction-induced adipocyte (CRADP)",
                "Chondrocyte-derived adipocyte (CDA)",
                "Dermal adipocyte (DAC)",
                "Diabetic adipocyte (DADP)",
                "Epicardial adipocyte (EAC)",
                "Hepatic stellate cell (HSC)",
                "Intradermal adipocyte (IDAC)",
                "Lipid droplet-containing cell (LDC)",
                "Muscle adipocyte (MAC)",
                "Neonatal adipocyte (NADP)",
                "Obese adipocyte (OADP)",
                "Omental adipocyte (OAC)",
                "Pancreatic adipocyte (PAC)",
                "Perivascular adipocyte (PVAC)",
                "Pregnant adipocyte (PADP)",
                "Renal adipocyte (RAC)",
                "Subcutaneous fat cell (SFC)",
                "Thyroid adipocyte (TAC)",
                "Visceral fat cell (VFC)",
                "White adipose tissue cell (WAT)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (ADI)",
            "White Fat Cell (WFC)",
            "Brown Fat Cell (BFC)",
            "Beige Fat Cell (BFC)",
            "Unilocular Fat Cell (UFC)",
            "Multilocular Fat Cell (MFC)",
            "Visceral Fat Cell (VFC)",
            "Subcutaneous Fat Cell (SFC)",
            "Mesenchymal Stem Cell-derived Adipocyte (MSCA)",
            "Bone Marrow Adipocyte (BMA)",
            "Perivascular Adipocyte (PVA)",
            "Retroperitoneal Fat Cell (RFC)",
            "Omental Fat Cell (OFC)",
            "Intramuscular Adipocyte (IMA)",
            "Interscapular Brown Adipocyte (IBA)",
            "Epididymal White Adipocyte (EWA)",
            "Inguinal White Adipocyte (IWA)",
            "Perirenal Brown Adipocyte (PBA)",
            "Adipose-derived Stem Cell-differentiated Adipocyte (ASCDA)",
            "3T3-L1 Cell Line Adipocyte (3T3-L1)",
            "BAT-derived Beige Adipocyte (BATBA)",
            "Human Preadipocyte-derived Mature Adipocyte (HPDMA)",
            "Mature Murine Adipocyte (MMA)",
            "Human Adipose Tissue-derived Mesenchymal Stem Cell-differentiated Adipocyte (hATMSCDA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (ADI)",
                "White Fat Cell (WFC)",
                "Brown Fat Cell (BFC)",
                "Beige Fat Cell (BFC)",
                "Unilocular Fat Cell (UFC)",
                "Multilocular Fat Cell (MFC)",
                "Visceral Fat Cell (VFC)",
                "Subcutaneous Fat Cell (SFC)",
                "Mesenchymal Stem Cell-derived Adipocyte (MSCA)",
                "Bone Marrow Adipocyte (BMA)",
                "Perivascular Adipocyte (PVA)",
                "Retroperitoneal Fat Cell (RFC)",
                "Omental Fat Cell (OFC)",
                "Intramuscular Adipocyte (IMA)",
                "Interscapular Brown Adipocyte (IBA)",
                "Epididymal White Adipocyte (EWA)",
                "Inguinal White Adipocyte (IWA)",
                "Perirenal Brown Adipocyte (PBA)",
                "Adipose-derived Stem Cell-differentiated Adipocyte (ASCDA)",
                "3T3-L1 Cell Line Adipocyte (3T3-L1)",
                "BAT-derived Beige Adipocyte (BATBA)",
                "Human Preadipocyte-derived Mature Adipocyte (HPDMA)",
                "Mature Murine Adipocyte (MMA)",
                "Human Adipose Tissue-derived Mesenchymal Stem Cell-differentiated Adipocyte (hATMSCDA)"
            ],
            "mismatches": [],
            "true_referents": [
                "3T3-L1 Cell Line Adipocyte (3T3-L1)",
                "Adipocyte (ADI)",
                "Adipose-derived Stem Cell-differentiated Adipocyte (ASCDA)",
                "BAT-derived Beige Adipocyte (BATBA)",
                "Beige Fat Cell (BFC)",
                "Bone Marrow Adipocyte (BMA)",
                "Brown Fat Cell (BFC)",
                "Epididymal White Adipocyte (EWA)",
                "Human Adipose Tissue-derived Mesenchymal Stem Cell-differentiated Adipocyte (hATMSCDA)",
                "Human Preadipocyte-derived Mature Adipocyte (HPDMA)",
                "Inguinal White Adipocyte (IWA)",
                "Interscapular Brown Adipocyte (IBA)",
                "Intramuscular Adipocyte (IMA)",
                "Mature Murine Adipocyte (MMA)",
                "Mesenchymal Stem Cell-derived Adipocyte (MSCA)",
                "Multilocular Fat Cell (MFC)",
                "Omental Fat Cell (OFC)",
                "Perirenal Brown Adipocyte (PBA)",
                "Perivascular Adipocyte (PVA)",
                "Retroperitoneal Fat Cell (RFC)",
                "Subcutaneous Fat Cell (SFC)",
                "Unilocular Fat Cell (UFC)",
                "Visceral Fat Cell (VFC)",
                "White Fat Cell (WFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (A)",
            "Hepatocyte (H)",
            "Myocyte (M)",
            "Osteoblast (O)",
            "Chondrocyte (C)",
            "Kupffer cell (K)",
            "Macrophage (M)",
            "Neutrophil (N)",
            "Lipid droplet (L)",
            "Epidermal cell (E)",
            "Fibroblast (F)",
            "Lung cell (L)",
            "Pancreatic acinar cell (P)",
            "Sertoli cell (S)",
            "Spermatocyte (S)",
            "Intestinal epithelial cell (I)",
            "Adrenal cortical cell (A)",
            "Sebocyte (S)",
            "Mammary epithelial cell (M)",
            "Satellite cell (S)",
            "Renal tubular cell (R)",
            "Cardiomyocyte (C)",
            "Lipoblast (L)",
            "Pericyte (P)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (A)",
                "Hepatocyte (H)",
                "Myocyte (M)",
                "Osteoblast (O)",
                "Chondrocyte (C)",
                "Kupffer cell (K)",
                "Macrophage (M)",
                "Neutrophil (N)",
                "Lipid droplet (L)",
                "Epidermal cell (E)",
                "Fibroblast (F)",
                "Lung cell (L)",
                "Pancreatic acinar cell (P)",
                "Sertoli cell (S)",
                "Spermatocyte (S)",
                "Intestinal epithelial cell (I)",
                "Adrenal cortical cell (A)",
                "Sebocyte (S)",
                "Mammary epithelial cell (M)",
                "Satellite cell (S)",
                "Renal tubular cell (R)",
                "Cardiomyocyte (C)",
                "Lipoblast (L)",
                "Pericyte (P)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (A)",
                "Adrenal cortical cell (A)",
                "Cardiomyocyte (C)",
                "Chondrocyte (C)",
                "Epidermal cell (E)",
                "Fibroblast (F)",
                "Hepatocyte (H)",
                "Intestinal epithelial cell (I)",
                "Kupffer cell (K)",
                "Lipid droplet (L)",
                "Lipoblast (L)",
                "Lung cell (L)",
                "Macrophage (M)",
                "Mammary epithelial cell (M)",
                "Myocyte (M)",
                "Neutrophil (N)",
                "Osteoblast (O)",
                "Pancreatic acinar cell (P)",
                "Pericyte (P)",
                "Renal tubular cell (R)",
                "Satellite cell (S)",
                "Sebocyte (S)",
                "Sertoli cell (S)",
                "Spermatocyte (S)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "White adipocyte (WAC)",
            "Brown adipocyte (BAC)",
            "Beige adipocyte",
            "Macrophage foam cell",
            "Hepatocyte",
            "Astrocyte",
            "Enterocyte",
            "Adipose-derived stem cell (ADSC)",
            "Omental adipocyte",
            "Subcutaneous adipocyte",
            "Visceral adipocyte",
            "Intramuscular adipocyte",
            "Perirenal adipocyte",
            "Epicardial adipocyte",
            "Bone marrow adipocyte",
            "Retinal pigment epithelial cell",
            "Cholesterol ester storage cell",
            "Lipid-laden microglia",
            "Neuronal lipid storage cell",
            "Cholesterol-laden macrophage",
            "Adipocyte-like hepatocyte",
            "Depot-specific adipocyte",
            "Shivering brown fat cell",
            "Non-shivering brown fat cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "White adipocyte (WAC)",
                "Brown adipocyte (BAC)",
                "Beige adipocyte",
                "Macrophage foam cell",
                "Hepatocyte",
                "Astrocyte",
                "Enterocyte",
                "Adipose-derived stem cell (ADSC)",
                "Omental adipocyte",
                "Subcutaneous adipocyte",
                "Visceral adipocyte",
                "Intramuscular adipocyte",
                "Perirenal adipocyte",
                "Epicardial adipocyte",
                "Bone marrow adipocyte",
                "Retinal pigment epithelial cell",
                "Cholesterol ester storage cell",
                "Lipid-laden microglia",
                "Neuronal lipid storage cell",
                "Cholesterol-laden macrophage",
                "Adipocyte-like hepatocyte",
                "Depot-specific adipocyte",
                "Shivering brown fat cell",
                "Non-shivering brown fat cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte-like hepatocyte",
                "Adipose-derived stem cell (ADSC)",
                "Astrocyte",
                "Beige adipocyte",
                "Bone marrow adipocyte",
                "Brown adipocyte (BAC)",
                "Cholesterol ester storage cell",
                "Cholesterol-laden macrophage",
                "Depot-specific adipocyte",
                "Enterocyte",
                "Epicardial adipocyte",
                "Hepatocyte",
                "Intramuscular adipocyte",
                "Lipid-laden microglia",
                "Macrophage foam cell",
                "Neuronal lipid storage cell",
                "Non-shivering brown fat cell",
                "Omental adipocyte",
                "Perirenal adipocyte",
                "Retinal pigment epithelial cell",
                "Shivering brown fat cell",
                "Subcutaneous adipocyte",
                "Visceral adipocyte",
                "White adipocyte (WAC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (fat cell)",
            "White adipocyte",
            "Brown adipocyte",
            "Beige adipocyte",
            "Hepatocyte (liver cell)",
            "Sebocyte",
            "Mammary epithelial cell",
            "Lipocyte",
            "Steatocyte",
            "Foam cell",
            "Ito cell (hepatic stellate cell)",
            "Kupffer cell",
            "Myocyte (muscle cell)",
            "Cardiomyocyte",
            "Osteoblast",
            "Adrenocortical cell",
            "Luteal cell",
            "Theca cell",
            "Sertoli cell",
            "Leydig cell",
            "Neuron",
            "Glial cell",
            "Mast cell",
            "Macrophage"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (fat cell)",
                "White adipocyte",
                "Brown adipocyte",
                "Beige adipocyte",
                "Hepatocyte (liver cell)",
                "Sebocyte",
                "Mammary epithelial cell",
                "Lipocyte",
                "Steatocyte",
                "Foam cell",
                "Ito cell (hepatic stellate cell)",
                "Kupffer cell",
                "Myocyte (muscle cell)",
                "Cardiomyocyte",
                "Osteoblast",
                "Adrenocortical cell",
                "Luteal cell",
                "Theca cell",
                "Sertoli cell",
                "Leydig cell",
                "Neuron",
                "Glial cell",
                "Mast cell",
                "Macrophage"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (fat cell)",
                "Adrenocortical cell",
                "Beige adipocyte",
                "Brown adipocyte",
                "Cardiomyocyte",
                "Foam cell",
                "Glial cell",
                "Hepatocyte (liver cell)",
                "Ito cell (hepatic stellate cell)",
                "Kupffer cell",
                "Leydig cell",
                "Lipocyte",
                "Luteal cell",
                "Macrophage",
                "Mammary epithelial cell",
                "Mast cell",
                "Myocyte (muscle cell)",
                "Neuron",
                "Osteoblast",
                "Sebocyte",
                "Sertoli cell",
                "Steatocyte",
                "Theca cell",
                "White adipocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte",
            "White fat cell",
            "Brown fat cell",
            "Beige fat cell",
            "Lipocyte",
            "Fat-storing cell",
            "Unilocular adipocyte",
            "Multilocular adipocyte",
            "Visceral fat cell",
            "Subcutaneous fat cell",
            "Perirenal fat cell",
            "Epicardial fat cell",
            "Bone marrow adipocyte",
            "Breast adipocyte",
            "Orbital fat cell",
            "Periarticular fat cell",
            "Mesenteric fat cell",
            "Omental fat cell",
            "Retroperitoneal fat cell",
            "Pericardial fat cell",
            "Intramuscular fat cell",
            "Dermal fat cell",
            "Ectopic fat cell",
            "Lipid-laden macrophage"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte",
                "White fat cell",
                "Brown fat cell",
                "Beige fat cell",
                "Lipocyte",
                "Fat-storing cell",
                "Unilocular adipocyte",
                "Multilocular adipocyte",
                "Visceral fat cell",
                "Subcutaneous fat cell",
                "Perirenal fat cell",
                "Epicardial fat cell",
                "Bone marrow adipocyte",
                "Breast adipocyte",
                "Orbital fat cell",
                "Periarticular fat cell",
                "Mesenteric fat cell",
                "Omental fat cell",
                "Retroperitoneal fat cell",
                "Pericardial fat cell",
                "Intramuscular fat cell",
                "Dermal fat cell",
                "Ectopic fat cell",
                "Lipid-laden macrophage"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Beige fat cell",
                "Bone marrow adipocyte",
                "Breast adipocyte",
                "Brown fat cell",
                "Dermal fat cell",
                "Ectopic fat cell",
                "Epicardial fat cell",
                "Fat-storing cell",
                "Intramuscular fat cell",
                "Lipid-laden macrophage",
                "Lipocyte",
                "Mesenteric fat cell",
                "Multilocular adipocyte",
                "Omental fat cell",
                "Orbital fat cell",
                "Periarticular fat cell",
                "Pericardial fat cell",
                "Perirenal fat cell",
                "Retroperitoneal fat cell",
                "Subcutaneous fat cell",
                "Unilocular adipocyte",
                "Visceral fat cell",
                "White fat cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "adipocyte (fat cell)",
            "lipocyte",
            "fat body cell (insect)",
            "elaioplast (plant fat storage organelle)",
            "adipose tissue",
            "white adipose tissue",
            "brown adipose tissue",
            "lipid droplet",
            "oil body (plant cell)",
            "milk fat globule",
            "yolk",
            "egg yolk",
            "vitellus",
            "lipoprotein particle",
            "chylomicron",
            "very low-density lipoprotein (VLDL)",
            "low-density lipoprotein (LDL)",
            "high-density lipoprotein (HDL)",
            "lipid bilayer (cell membrane)",
            "myelin sheath",
            "sebaceous gland",
            "mammary gland",
            "adipocyte precursor cell",
            "preadipocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "adipocyte (fat cell)",
                "lipocyte",
                "fat body cell (insect)",
                "elaioplast (plant fat storage organelle)",
                "adipose tissue",
                "white adipose tissue",
                "brown adipose tissue",
                "lipid droplet",
                "oil body (plant cell)",
                "milk fat globule",
                "yolk",
                "egg yolk",
                "vitellus",
                "lipoprotein particle",
                "chylomicron",
                "very low-density lipoprotein (VLDL)",
                "low-density lipoprotein (LDL)",
                "high-density lipoprotein (HDL)",
                "lipid bilayer (cell membrane)",
                "myelin sheath",
                "sebaceous gland",
                "mammary gland",
                "adipocyte precursor cell",
                "preadipocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "adipocyte (fat cell)",
                "adipocyte precursor cell",
                "adipose tissue",
                "brown adipose tissue",
                "chylomicron",
                "egg yolk",
                "elaioplast (plant fat storage organelle)",
                "fat body cell (insect)",
                "high-density lipoprotein (HDL)",
                "lipid bilayer (cell membrane)",
                "lipid droplet",
                "lipocyte",
                "lipoprotein particle",
                "low-density lipoprotein (LDL)",
                "mammary gland",
                "milk fat globule",
                "myelin sheath",
                "oil body (plant cell)",
                "preadipocyte",
                "sebaceous gland",
                "very low-density lipoprotein (VLDL)",
                "vitellus",
                "white adipose tissue",
                "yolk"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (AD)",
            "Lipocyte (LC)",
            "Lipoblast (LB)",
            "Preadipocyte (PA)",
            "Adipose stem cell (ASC)",
            "Beige adipocyte (BA)",
            "Brown adipocyte (BrA)",
            "White adipocyte (WA)",
            "Perivascular adipocyte (PVA)",
            "Epicardial adipocyte (EA)",
            "Mesenteric adipocyte (MA)",
            "Omental adipocyte (OA)",
            "Subcutaneous adipocyte (SA)",
            "Visceral adipocyte (VA)",
            "Bone marrow adipocyte (BMA)",
            "Hepatic adipocyte (HA)",
            "Renal adipocyte (RA)",
            "Skeletal muscle adipocyte (SMA)",
            "Cardiac adipocyte (CA)",
            "Pancreatic adipocyte (PA)",
            "Thyroid adipocyte (TA)",
            "Adrenal adipocyte (AA)",
            "Ovarian adipocyte (OvA)",
            "Testicular adipocyte (TA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (AD)",
                "Lipocyte (LC)",
                "Lipoblast (LB)",
                "Preadipocyte (PA)",
                "Adipose stem cell (ASC)",
                "Beige adipocyte (BA)",
                "Brown adipocyte (BrA)",
                "White adipocyte (WA)",
                "Perivascular adipocyte (PVA)",
                "Epicardial adipocyte (EA)",
                "Mesenteric adipocyte (MA)",
                "Omental adipocyte (OA)",
                "Subcutaneous adipocyte (SA)",
                "Visceral adipocyte (VA)",
                "Bone marrow adipocyte (BMA)",
                "Hepatic adipocyte (HA)",
                "Renal adipocyte (RA)",
                "Skeletal muscle adipocyte (SMA)",
                "Cardiac adipocyte (CA)",
                "Pancreatic adipocyte (PA)",
                "Thyroid adipocyte (TA)",
                "Adrenal adipocyte (AA)",
                "Ovarian adipocyte (OvA)",
                "Testicular adipocyte (TA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AD)",
                "Adipose stem cell (ASC)",
                "Adrenal adipocyte (AA)",
                "Beige adipocyte (BA)",
                "Bone marrow adipocyte (BMA)",
                "Brown adipocyte (BrA)",
                "Cardiac adipocyte (CA)",
                "Epicardial adipocyte (EA)",
                "Hepatic adipocyte (HA)",
                "Lipoblast (LB)",
                "Lipocyte (LC)",
                "Mesenteric adipocyte (MA)",
                "Omental adipocyte (OA)",
                "Ovarian adipocyte (OvA)",
                "Pancreatic adipocyte (PA)",
                "Perivascular adipocyte (PVA)",
                "Preadipocyte (PA)",
                "Renal adipocyte (RA)",
                "Skeletal muscle adipocyte (SMA)",
                "Subcutaneous adipocyte (SA)",
                "Testicular adipocyte (TA)",
                "Thyroid adipocyte (TA)",
                "Visceral adipocyte (VA)",
                "White adipocyte (WA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (Adipo)",
            "Adipose Stem Cell",
            "Adipose-Derived Stem Cell",
            "Brown Adipocyte",
            "Brown Fat Cell",
            "Fat Cell",
            "Fat-Storing Cell",
            "Hepatocyte",
            "Lipoblast",
            "Lipocyte",
            "Lipogenic Cell",
            "Lipogenic Stem Cell",
            "Lipomuscle Cell",
            "Liposarcoma Cell",
            "Mesenchymal Stem Cell",
            "Myeloid Stem Cell",
            "Omental Fat Cell",
            "Pancreatic Islet Cell",
            "Pre-Adipocyte",
            "Stem Cell",
            "Stromal Vascular Cell",
            "White Adipocyte",
            "White Fat Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (Adipo)",
                "Adipose Stem Cell",
                "Adipose-Derived Stem Cell",
                "Brown Adipocyte",
                "Brown Fat Cell",
                "Fat Cell",
                "Fat-Storing Cell",
                "Hepatocyte",
                "Lipoblast",
                "Lipocyte",
                "Lipogenic Cell",
                "Lipogenic Stem Cell",
                "Lipomuscle Cell",
                "Liposarcoma Cell",
                "Mesenchymal Stem Cell",
                "Myeloid Stem Cell",
                "Omental Fat Cell",
                "Pancreatic Islet Cell",
                "Pre-Adipocyte",
                "Stem Cell",
                "Stromal Vascular Cell",
                "White Adipocyte",
                "White Fat Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (Adipo)",
                "Adipose Stem Cell",
                "Adipose-Derived Stem Cell",
                "Brown Adipocyte",
                "Brown Fat Cell",
                "Fat Cell",
                "Fat-Storing Cell",
                "Hepatocyte",
                "Lipoblast",
                "Lipocyte",
                "Lipogenic Cell",
                "Lipogenic Stem Cell",
                "Lipomuscle Cell",
                "Liposarcoma Cell",
                "Mesenchymal Stem Cell",
                "Myeloid Stem Cell",
                "Omental Fat Cell",
                "Pancreatic Islet Cell",
                "Pre-Adipocyte",
                "Stem Cell",
                "Stromal Vascular Cell",
                "White Adipocyte",
                "White Fat Cell"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            "Adipocyte (Ad)",
            "Brown Adipocyte (BA)",
            "White Adipocyte (WA)",
            "Unilocular Adipocyte (UA)",
            "Multilocular Adipocyte (MA)",
            "Cardiac Adipocyte (CA)",
            "Mesenteric Adipocyte (MeA)",
            "Epididymal Adipocyte (EpA)",
            "Perirenal Adipocyte (PRA)",
            "Subcutaneous Adipocyte (SbA)",
            "Visceral Adipocyte (VA)",
            "Intramuscular Adipocyte (IMA)",
            "Intermuscular Adipocyte (IntMA)",
            "Perimuscular Adipocyte (PmMA)",
            "Lipocyte (L)",
            "Lipid Storing Cell (LSC)",
            "Fat Cell (FC)",
            "Lipoblast (Lb)",
            "Preadipocyte (PdA)",
            "Adipoblast (Ab)",
            "Lipogenic Cell (LgC)",
            "Adipocytic Cell (AdC)",
            "Fat Storing Cell (FSC)",
            "Lipid Accumulating Cell (LAC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adipocyte (Ad)",
                "Brown Adipocyte (BA)",
                "White Adipocyte (WA)",
                "Unilocular Adipocyte (UA)",
                "Multilocular Adipocyte (MA)",
                "Cardiac Adipocyte (CA)",
                "Mesenteric Adipocyte (MeA)",
                "Epididymal Adipocyte (EpA)",
                "Perirenal Adipocyte (PRA)",
                "Subcutaneous Adipocyte (SbA)",
                "Visceral Adipocyte (VA)",
                "Intramuscular Adipocyte (IMA)",
                "Intermuscular Adipocyte (IntMA)",
                "Perimuscular Adipocyte (PmMA)",
                "Lipocyte (L)",
                "Lipid Storing Cell (LSC)",
                "Fat Cell (FC)",
                "Lipoblast (Lb)",
                "Preadipocyte (PdA)",
                "Adipoblast (Ab)",
                "Lipogenic Cell (LgC)",
                "Adipocytic Cell (AdC)",
                "Fat Storing Cell (FSC)",
                "Lipid Accumulating Cell (LAC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipoblast (Ab)",
                "Adipocyte (Ad)",
                "Adipocytic Cell (AdC)",
                "Brown Adipocyte (BA)",
                "Cardiac Adipocyte (CA)",
                "Epididymal Adipocyte (EpA)",
                "Fat Cell (FC)",
                "Fat Storing Cell (FSC)",
                "Intermuscular Adipocyte (IntMA)",
                "Intramuscular Adipocyte (IMA)",
                "Lipid Accumulating Cell (LAC)",
                "Lipid Storing Cell (LSC)",
                "Lipoblast (Lb)",
                "Lipocyte (L)",
                "Lipogenic Cell (LgC)",
                "Mesenteric Adipocyte (MeA)",
                "Multilocular Adipocyte (MA)",
                "Perimuscular Adipocyte (PmMA)",
                "Perirenal Adipocyte (PRA)",
                "Preadipocyte (PdA)",
                "Subcutaneous Adipocyte (SbA)",
                "Unilocular Adipocyte (UA)",
                "Visceral Adipocyte (VA)",
                "White Adipocyte (WA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "adipocyte",
        "domain": "biology",
        "response": [
            {
                "Referent": "adipocyte",
                "Canonical name": "adipocyte"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "adipocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"adipocyte\", \"Canonical name\": \"adipocyte\"}"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]