[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-17 (IL-17)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor necrosis factor-alpha (TNF-\u03b1)",
            "Transforming growth factor-beta (TGF-\u03b2)",
            "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
            "Granulocyte colony-stimulating factor (G-CSF)",
            "Macrophage colony-stimulating factor (M-CSF)",
            "Epidermal growth factor (EGF)",
            "Fibroblast growth factor (FGF)",
            "Vascular endothelial growth factor (VEGF)",
            "Platelet-derived growth factor (PDGF)",
            "Leukemia inhibitory factor (LIF)",
            "Hepatocyte growth factor (HGF)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Chemokine (C-X-C motif) ligand 1 (CXCL1)",
            "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
            "Chemokine (C-C motif) ligand 11 (CCL11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interferon-gamma (IFN-\u03b3)",
                "Tumor necrosis factor-alpha (TNF-\u03b1)",
                "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
                "Granulocyte colony-stimulating factor (G-CSF)",
                "Macrophage colony-stimulating factor (M-CSF)",
                "Leukemia inhibitory factor (LIF)",
                "Hepatocyte growth factor (HGF)",
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Chemokine (C-C motif) ligand 11 (CCL11)",
                "Chemokine (C-X-C motif) ligand 1 (CXCL1)"
            ],
            "mismatches": [
                "Transforming growth factor-beta (TGF-\u03b2)",
                "Epidermal growth factor (EGF)",
                "Fibroblast growth factor (FGF)",
                "Vascular endothelial growth factor (VEGF)",
                "Platelet-derived growth factor (PDGF)",
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)"
            ],
            "true_referents": [
                "Chemokine CCL11",
                "Chemokine CCL2",
                "Chemokine CCL21",
                "Chemokine CCL8",
                "Chemokine CX3CL1",
                "Chemokine CXCL1",
                "Chemokine CXCL11",
                "Chemokine CXCL2",
                "Chemokine CXCL9",
                "Colony-Stimulating Factors",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Hematopoietic Cell Growth Factors",
                "Hepatocyte Growth Factor",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Leukemia Inhibitory Factor",
                "Leukocyte Migration-Inhibitory Factors",
                "Macrophage Colony-Stimulating Factor",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Interferon-gamma (IFN-\u03b3)",
            "Interleukin-4 (IL-4)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Interleukin-23 (IL-23)",
            "Interleukin-27 (IL-27)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Fibroblast Growth Factor (FGF)",
            "Epidermal Growth Factor (EGF)",
            "Platelet-Derived Growth Factor (PDGF)",
            "B-cell Activating Factor (BAFF)",
            "A Proliferation Inducing Ligand (APRIL)",
            "Chemokine (C-C motif) Ligand 2 (CCL2)",
            "Chemokine (C-X-C motif) Ligand 8 (CXCL8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-10 (IL-10)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "B-cell Activating Factor (BAFF)",
                "Chemokine (C-C motif) Ligand 2 (CCL2)"
            ],
            "mismatches": [
                "Vascular Endothelial Growth Factor (VEGF)",
                "Fibroblast Growth Factor (FGF)",
                "Epidermal Growth Factor (EGF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "A Proliferation Inducing Ligand (APRIL)",
                "Chemokine (C-X-C motif) Ligand 8 (CXCL8)"
            ],
            "true_referents": [
                "4-1BB Ligand",
                "B-Cell Activating Factor",
                "Chemokine CCL2",
                "Chemokine CXCL2",
                "Colony-Stimulating Factors",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-27",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Macrophage Colony-Stimulating Factor",
                "Macrophage-Activating Factors",
                "RANK Ligand",
                "TNF-Related Apoptosis-Inducing Ligand",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 19,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Cytokine (e.g., Interleukin-1)",
            "Chemokine (e.g., CXCL8)",
            "Interleukin-6",
            "Interleukin-10",
            "Interleukin-12",
            "Interferon-gamma",
            "Tumor Necrosis Factor-alpha",
            "Transforming Growth Factor-beta",
            "Interleukin-2",
            "Interleukin-4",
            "Interleukin-5",
            "Interleukin-7",
            "Interleukin-8",
            "Interleukin-9",
            "Interleukin-13",
            "Interleukin-15",
            "Interleukin-17",
            "Interleukin-18",
            "Interleukin-21",
            "Interleukin-22",
            "Interleukin-23",
            "Interleukin-27",
            "Interleukin-31",
            "Interleukin-33",
            "Interleukin-35"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-6",
                "Interleukin-10",
                "Interleukin-12",
                "Interferon-gamma",
                "Tumor Necrosis Factor-alpha",
                "Interleukin-2",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-17",
                "Interleukin-18",
                "Interleukin-22",
                "Interleukin-23",
                "Interleukin-27",
                "Interleukin-33"
            ],
            "mismatches": [
                "Cytokine (e.g., Interleukin-1)",
                "Chemokine (e.g., CXCL8)",
                "Transforming Growth Factor-beta",
                "Interleukin-21",
                "Interleukin-31",
                "Interleukin-35"
            ],
            "true_referents": [
                "Chemokine CCL8",
                "Chemokine CXCL1",
                "Chemokine CXCL2",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-18",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-22",
                "Interleukin-23",
                "Interleukin-27",
                "Interleukin-3",
                "Interleukin-33",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 19,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Interferon-gamma (IFN-\u03b3)",
            "Interferon-alpha (IFN-\u03b1)",
            "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Platelet-Activating Factor (PAF)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Epidermal Growth Factor (EGF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Fibroblast Growth Factor 2 (FGF2)",
            "Nerve Growth Factor (NGF)",
            "Brain-Derived Neurotrophic Factor (BDNF)",
            "Glial Cell Line-Derived Neurotrophic Factor (GDNF)",
            "Cystine-rich secretory protein (CRISP)",
            "Lymphotactin (Lymphotactin)",
            "B Lymphocyte Attractant (BlyS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interferon-alpha (IFN-\u03b1)",
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)"
            ],
            "mismatches": [
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
                "Platelet-Activating Factor (PAF)",
                "Epidermal Growth Factor (EGF)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Fibroblast Growth Factor 2 (FGF2)",
                "Nerve Growth Factor (NGF)",
                "Brain-Derived Neurotrophic Factor (BDNF)",
                "Glial Cell Line-Derived Neurotrophic Factor (GDNF)",
                "Cystine-rich secretory protein (CRISP)",
                "Lymphotactin (Lymphotactin)",
                "B Lymphocyte Attractant (BlyS)"
            ],
            "true_referents": [
                "B-Cell Activating Factor",
                "Chemokine CCL2",
                "Chemokine CCL24",
                "Chemokine CCL26",
                "Chemokine CCL8",
                "Chemokine CXCL1",
                "Chemokine CXCL2",
                "Chemokine CXCL6",
                "Chemokine CXCL9",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Growth Differentiation Factor 15",
                "Interferon alpha-2",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-5",
                "Interleukin-6",
                "Lymphokines",
                "Lymphotoxin-alpha",
                "Lymphotoxin-beta",
                "Macrophage Colony-Stimulating Factor",
                "Platelet Factor 4",
                "Stem Cell Factor",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Tumor Necrosis Factor-alpha (TNF-alpha)",
            "Interferon-gamma (IFN-gamma)",
            "Interferon-alpha (IFN-alpha)",
            "Interferon-beta (IFN-beta)",
            "Transforming Growth Factor-beta (TGF-beta)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-8 (IL-8)",
            "Interleukin-13 (IL-13)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Interleukin-23 (IL-23)",
            "Interleukin-22 (IL-22)",
            "Interleukin-21 (IL-21)",
            "Interleukin-9 (IL-9)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Inflammatory Protein-1 alpha (MIP-1 alpha)",
            "Monocyte Chemoattractant Protein-1 (MCP-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Tumor Necrosis Factor-alpha (TNF-alpha)",
                "Interferon-gamma (IFN-gamma)",
                "Interferon-alpha (IFN-alpha)",
                "Interferon-beta (IFN-beta)",
                "Transforming Growth Factor-beta (TGF-beta)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-8 (IL-8)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Interleukin-23 (IL-23)",
                "Interleukin-22 (IL-22)",
                "Interleukin-9 (IL-9)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)"
            ],
            "mismatches": [
                "Interleukin-21 (IL-21)",
                "Macrophage Inflammatory Protein-1 alpha (MIP-1 alpha)",
                "Monocyte Chemoattractant Protein-1 (MCP-1)"
            ],
            "true_referents": [
                "Chemokine CCL1",
                "Chemokine CXCL1",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-18",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-22",
                "Interleukin-23",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Macrophage Colony-Stimulating Factor",
                "Macrophage Inflammatory Proteins",
                "Monocyte Chemoattractant Proteins",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Tumor Necrosis Factor-alpha (TNF-alpha)",
            "Transforming Growth Factor-beta (TGF-beta)",
            "Interferon-gamma (IFN-gamma)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
            "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
            "Platelet-derived growth factor (PDGF)",
            "Vascular endothelial growth factor (VEGF)",
            "Macrophage inflammatory protein 1-alpha (MIP-1\u03b1)",
            "RANTES (Regulated on Activation, Normal T Expressed and Secreted)",
            "Eotaxin (CCL11)",
            "Leptin",
            "Resistin",
            "Adiponectin",
            "Insulin-like growth factor 1 (IGF-1)",
            "Myostatin",
            "Hepcidin",
            "Ghrelin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1",
                "Interleukin-2",
                "Interleukin-6",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-17",
                "Tumor Necrosis Factor-alpha",
                "Transforming Growth Factor beta",
                "Interferon-gamma",
                "Chemokine CCL2",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Macrophage Inflammatory Proteins",
                "Chemokine CCL11"
            ],
            "mismatches": [
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
                "Platelet-derived growth factor (PDGF)",
                "Vascular endothelial growth factor (VEGF)",
                "RANTES (Regulated on Activation, Normal T Expressed and Secreted)",
                "Leptin",
                "Resistin",
                "Adiponectin",
                "Insulin-like growth factor 1 (IGF-1)",
                "Myostatin",
                "Hepcidin",
                "Ghrelin"
            ],
            "true_referents": [
                "Chemokine CCL1",
                "Chemokine CCL11",
                "Chemokine CCL2",
                "Chemokine CCL8",
                "Chemokine CXCL1",
                "Chemokine CXCL11",
                "Chemokine CXCL2",
                "Chemokine CXCL9",
                "Chemokines",
                "Erythropoietin",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Growth Differentiation Factor 15",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interleukin 1 Receptor Antagonist Protein",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-5",
                "Interleukin-6",
                "Macrophage Colony-Stimulating Factor",
                "Macrophage Inflammatory Proteins",
                "Monokines",
                "Osteopontin",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Transforming Growth Factor beta3",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin 1 (IL-1)",
            "Interleukin 2 (IL-2)",
            "Interleukin 3 (IL-3)",
            "Interleukin 4 (IL-4)",
            "Interleukin 5 (IL-5)",
            "Interleukin 6 (IL-6)",
            "Interleukin 7 (IL-7)",
            "Interleukin 8 (IL-8)",
            "Interleukin 9 (IL-9)",
            "Interleukin 10 (IL-10)",
            "Interleukin 11 (IL-11)",
            "Interleukin 12 (IL-12)",
            "Interleukin 13 (IL-13)",
            "Interleukin 14 (IL-14)",
            "Interleukin 15 (IL-15)",
            "Interleukin 16 (IL-16)",
            "Interleukin 17 (IL-17)",
            "Interferon gamma (IFN-\u03b3)",
            "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
            "Transforming Growth Factor Beta (TGF-\u03b2)",
            "Colony Stimulating Factor 1 (CSF-1)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1",
                "Interleukin-2",
                "Interleukin-3",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interferon-gamma",
                "Tumor Necrosis Factor-alpha",
                "Transforming Growth Factor beta",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Macrophage Colony-Stimulating Factor",
                "Granulocyte Colony-Stimulating Factor"
            ],
            "mismatches": [
                "Interleukin 14 (IL-14)",
                "Colony Stimulating Factor 1 (CSF-1)"
            ],
            "true_referents": [
                "Colony-Stimulating Factors",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-3",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Macrophage Colony-Stimulating Factor",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Tumor necrosis factor-alpha (TNF-alpha)",
            "Tumor necrosis factor-beta (TNF-beta)",
            "Interferon-gamma (IFN-gamma)",
            "Interferon-alpha (IFN-alpha)",
            "Interferon-beta (IFN-beta)",
            "Interferon-lambda (IFN-lambda)",
            "Transforming growth factor-beta (TGF-beta)",
            "Epidermal growth factor (EGF)",
            "Fibroblast growth factor (FGF)",
            "Platelet-derived growth factor (PDGF)",
            "Vascular endothelial growth factor (VEGF)",
            "Insulin-like growth factor (IGF)",
            "Nerve growth factor (NGF)",
            "Hepatocyte growth factor (HGF)",
            "Erythropoietin (EPO)",
            "Thrombopoietin (TPO)",
            "Granulocyte colony-stimulating factor (G-CSF)",
            "Macrophage colony-stimulating factor (M-CSF)",
            "Interleukin-4 (IL-4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Tumor necrosis factor-alpha (TNF-alpha)",
                "Interferon-gamma (IFN-gamma)",
                "Interferon-alpha (IFN-alpha)",
                "Interferon-beta (IFN-beta)",
                "Transforming growth factor-beta (TGF-beta)",
                "Hepatocyte growth factor (HGF)",
                "Erythropoietin (EPO)",
                "Thrombopoietin (TPO)",
                "Granulocyte colony-stimulating factor (G-CSF)",
                "Macrophage colony-stimulating factor (M-CSF)",
                "Interleukin-4 (IL-4)"
            ],
            "mismatches": [
                "Tumor necrosis factor-beta (TNF-beta)",
                "Interferon-lambda (IFN-lambda)",
                "Epidermal growth factor (EGF)",
                "Fibroblast growth factor (FGF)",
                "Platelet-derived growth factor (PDGF)",
                "Vascular endothelial growth factor (VEGF)",
                "Insulin-like growth factor (IGF)",
                "Nerve growth factor (NGF)"
            ],
            "true_referents": [
                "Colony-Stimulating Factors",
                "Epoetin Alfa",
                "Erythropoietin",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Hematopoietic Cell Growth Factors",
                "Hepatocyte Growth Factor",
                "Interferon Lambda",
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Macrophage Colony-Stimulating Factor",
                "Platelet Factor 4",
                "Thrombopoietin",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors",
                "beta-Thromboglobulin"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-6 (IL-6)",
            "Interleukin-10 (IL-10)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Interleukin-23 (IL-23)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Erythropoietin (EPO)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Colony Stimulating Factor 1 (CSF-1)",
            "Macrophage Inflammatory Protein-1 alpha (MIP-1\u03b1)",
            "Monocyte Chemoattractant Protein-1 (MCP-1)",
            "C-X-C motif ligand 8 (CXCL8)",
            "C-C motif ligand 2 (CCL2)",
            "C-X-C motif ligand 10 (CXCL10)",
            "C-C motif ligand 5 (CCL5)",
            "Fibroblast Growth Factor (FGF)",
            "Vascular Endothelial Growth Factor (VEGF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-10 (IL-10)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Interleukin-23 (IL-23)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Erythropoietin (EPO)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Inflammatory Protein-1 alpha (MIP-1\u03b1)",
                "Monocyte Chemoattractant Protein-1 (MCP-1)",
                "C-C motif ligand 2 (CCL2)",
                "C-X-C motif ligand 10 (CXCL10)",
                "C-C motif ligand 5 (CCL5)"
            ],
            "mismatches": [
                "Colony Stimulating Factor 1 (CSF-1)",
                "C-X-C motif ligand 8 (CXCL8)",
                "Fibroblast Growth Factor (FGF)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "true_referents": [
                "CC Chemokines",
                "Chemokine CCL1",
                "Chemokine CCL2",
                "Chemokine CCL5",
                "Chemokine CCL8",
                "Chemokine CXCL1",
                "Chemokine CXCL10",
                "Chemokine CXCL2",
                "Chemokine CXCL5",
                "Chemokine CXCL9",
                "Colony-Stimulating Factors",
                "Epoetin Alfa",
                "Erythropoietin",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Macrophage Colony-Stimulating Factor",
                "Macrophage Inflammatory Proteins",
                "Monocyte Chemoattractant Proteins",
                "Thrombopoietin",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 21,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Interleukin-10 (IL-10)",
            "Interleukin-4 (IL-4)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Interleukin-8 (IL-8)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Macrophage Inflammatory Protein-1alpha (MIP-1\u03b1)",
            "Macrophage Inflammatory Protein-1beta (MIP-1\u03b2)",
            "RANTES (CCL5)",
            "Eotaxin (CCL11)",
            "Monocyte Chemoattractant Protein-1 (MCP-1)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Leukemia Inhibitory Factor (LIF)",
            "Oncostatin M (OSM)",
            "Stem Cell Factor (SCF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1",
                "Interleukin-2",
                "Interleukin-6",
                "Tumor Necrosis Factor-alpha",
                "Interferon-gamma",
                "Transforming Growth Factor beta",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Chemokine CCL2",
                "Interleukin-10",
                "Interleukin-4",
                "Interleukin-12",
                "Interleukin-17",
                "Interleukin-8",
                "Interferon-alpha",
                "Interferon-beta",
                "Macrophage Inflammatory Proteins",
                "Chemokine CCL5",
                "Chemokine CCL11",
                "Monocyte Chemoattractant Proteins",
                "Granulocyte Colony-Stimulating Factor",
                "Leukemia Inhibitory Factor",
                "Oncostatin M",
                "Stem Cell Factor"
            ],
            "mismatches": [],
            "true_referents": [
                "Chemokine CCL1",
                "Chemokine CCL11",
                "Chemokine CCL2",
                "Chemokine CCL5",
                "Chemokine CXCL1",
                "Chemokine CXCL11",
                "Chemokine CXCL2",
                "Chemokine CXCL5",
                "Colony-Stimulating Factors",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Hematopoietic Cell Growth Factors",
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-1beta",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-8",
                "Lenograstim",
                "Leukemia Inhibitory Factor",
                "Leukocyte Migration-Inhibitory Factors",
                "Macrophage Colony-Stimulating Factor",
                "Macrophage Inflammatory Proteins",
                "Monocyte Chemoattractant Proteins",
                "Oncostatin M",
                "RANK Ligand",
                "Stem Cell Factor",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-6 (IL-6)",
            "Interleukin-8 (IL-8)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Interferon-gamma (IFN-\u03b3)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Chemokine (C-C motif) Ligand 2 (CCL2)",
            "Chemokine (C-C motif) Ligand 5 (CCL5)",
            "Chemokine (C-X-C motif) Ligand 8 (CXCL8)",
            "Chemokine (C-X-C motif) Ligand 10 (CXCL10)",
            "Leukemia Inhibitory Factor (LIF)",
            "Oncostatin M (OSM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Chemokine (C-C motif) Ligand 2 (CCL2)",
                "Chemokine (C-C motif) Ligand 5 (CCL5)",
                "Oncostatin M (OSM)",
                "Leukemia Inhibitory Factor (LIF)"
            ],
            "mismatches": [
                "Chemokine (C-X-C motif) Ligand 8 (CXCL8)"
            ],
            "true_referents": [
                "Chemokine CCL1",
                "Chemokine CCL2",
                "Chemokine CCL5",
                "Chemokine CCL8",
                "Chemokine CXCL1",
                "Chemokine CXCL10",
                "Chemokine CXCL2",
                "Chemokine CXCL5",
                "Chemokine CXCL9",
                "Colony-Stimulating Factors",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-18",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-8",
                "Lenograstim",
                "Leukemia Inhibitory Factor",
                "Leukocyte Migration-Inhibitory Factors",
                "Macrophage Colony-Stimulating Factor",
                "Oncostatin M",
                "RANK Ligand",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 22,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-3 (IL-3)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-7 (IL-7)",
            "Interleukin-8 (IL-8)",
            "Interleukin-9 (IL-9)",
            "Interleukin-10 (IL-10)",
            "Interleukin-11 (IL-11)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-14 (IL-14)",
            "Interleukin-15 (IL-15)",
            "Interleukin-16 (IL-16)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-19 (IL-19)",
            "Interleukin-20 (IL-20)",
            "Interleukin-21 (IL-21)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-24 (IL-24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-3 (IL-3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)"
            ],
            "mismatches": [
                "Interleukin-14 (IL-14)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-24 (IL-24)"
            ],
            "true_referents": [
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-18",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-22",
                "Interleukin-23",
                "Interleukin-3",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-6 (IL-6)",
            "Interleukin-8 (IL-8)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Platelet-Derived Growth Factor (PDGF)",
            "Epidermal Growth Factor (EGF)",
            "Fibroblast Growth Factor (FGF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Nerve Growth Factor (NGF)",
            "Insulin-Like Growth Factor (IGF)",
            "Erythropoietin (EPO)",
            "Thrombopoietin (TPO)",
            "Adiponectin",
            "Leptin",
            "Ghrelin",
            "Resistin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interferon-gamma (IFN-\u03b3)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Erythropoietin (EPO)",
                "Thrombopoietin (TPO)"
            ],
            "mismatches": [
                "Platelet-Derived Growth Factor (PDGF)",
                "Epidermal Growth Factor (EGF)",
                "Fibroblast Growth Factor (FGF)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Nerve Growth Factor (NGF)",
                "Insulin-Like Growth Factor (IGF)",
                "Adiponectin",
                "Leptin",
                "Ghrelin",
                "Resistin"
            ],
            "true_referents": [
                "Epoetin Alfa",
                "Erythropoietin",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Growth Differentiation Factor 15",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interleukin 1 Receptor Antagonist Protein",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-8",
                "Macrophage Colony-Stimulating Factor",
                "Osteopontin",
                "Platelet Factor 4",
                "Thrombopoietin",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors",
                "beta-Thromboglobulin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-6 (IL-6)",
            "Interleukin-8 (IL-8)",
            "Tumor Necrosis Factor-alpha (TNF-alpha)",
            "Interferon-gamma (IFN-gamma)",
            "Transforming Growth Factor-beta (TGF-beta)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Inflammatory Protein-1 (MIP-1)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Chemokine (C-X-C motif) ligand 10 (CXCL10)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Leukemia Inhibitory Factor (LIF)",
            "Oncostatin M (OSM)",
            "Cardiotrophin-1 (CT-1)",
            "Cytokine-induced neutrophil chemoattractant-1 (CINC-1)",
            "Platelet-derived growth factor (PDGF)",
            "Vascular endothelial growth factor (VEGF)",
            "Eotaxin (CCL11)",
            "Monocyte chemoattractant protein-1 (MCP-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Tumor Necrosis Factor-alpha (TNF-alpha)",
                "Interferon-gamma (IFN-gamma)",
                "Transforming Growth Factor-beta (TGF-beta)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Macrophage Inflammatory Protein-1 (MIP-1)",
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Chemokine (C-X-C motif) ligand 10 (CXCL10)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Leukemia Inhibitory Factor (LIF)",
                "Oncostatin M (OSM)",
                "Eotaxin (CCL11)",
                "Monocyte chemoattractant protein-1 (MCP-1)"
            ],
            "mismatches": [
                "Cardiotrophin-1 (CT-1)",
                "Cytokine-induced neutrophil chemoattractant-1 (CINC-1)",
                "Platelet-derived growth factor (PDGF)",
                "Vascular endothelial growth factor (VEGF)"
            ],
            "true_referents": [
                "Chemokine CCL1",
                "Chemokine CCL11",
                "Chemokine CCL2",
                "Chemokine CXCL1",
                "Chemokine CXCL10",
                "Chemokine CXCL11",
                "Chemokine CXCL2",
                "Chemokine CXCL9",
                "Colony-Stimulating Factors",
                "Granulocyte Colony-Stimulating Factor",
                "Granulocyte-Macrophage Colony-Stimulating Factor",
                "Interferon-alpha",
                "Interferon-gamma",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-12",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-18",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-8",
                "Lenograstim",
                "Leukemia Inhibitory Factor",
                "Leukocyte Migration-Inhibitory Factors",
                "Macrophage Colony-Stimulating Factor",
                "Macrophage Inflammatory Proteins",
                "Monocyte Chemoattractant Proteins",
                "Oncostatin M",
                "Osteopontin",
                "RANK Ligand",
                "Transforming Growth Factor beta",
                "Transforming Growth Factor beta1",
                "Transforming Growth Factor beta2",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cytokine",
        "domain": "biology",
        "response": [
            "Cytokine (CYT)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor necrosis factor-alpha (TNF-\u03b1)",
            "Tumor necrosis factor-beta (TNF-\u03b2)",
            "Interleukin-1 alpha (IL-1\u03b1)",
            "Interleukin-1 beta (IL-1\u03b2)",
            "Interleukin-2 (IL-2)",
            "Interleukin-3 (IL-3)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-7 (IL-7)",
            "Interleukin-8 (IL-8)",
            "Interleukin-9 (IL-9)",
            "Interleukin-10 (IL-10)",
            "Interleukin-11 (IL-11)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-14 (IL-14)",
            "Interleukin-15 (IL-15)",
            "Interleukin-16 (IL-16)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-19 (IL-19)",
            "Interleukin-20 (IL-20)",
            "Interleukin-21 (IL-21)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-24 (IL-24)",
            "Interleukin-26 (IL-26)",
            "Interleukin-27 (IL-27)",
            "Interleukin-28 (IL-28)",
            "Interleukin-29 (IL-29)",
            "Interleukin-30 (IL-30)",
            "Interleukin-31 (IL-31)",
            "Interleukin-32 (IL-32)",
            "Interleukin-33 (IL-33)",
            "Interleukin-34 (IL-34)",
            "Interleukin-35 (IL-35)",
            "Granulocyte colony-stimulating factor (G-CSF)",
            "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
            "Macrophage colony-stimulating factor (M-CSF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Tumor Necrosis Factor-alpha",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-3",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-23"
            ],
            "mismatches": [
                "Cytokine (CYT)",
                "Tumor necrosis factor-beta (TNF-\u03b2)",
                "Interleukin-1 beta (IL-1\u03b2)",
                "Interleukin-14 (IL-14)",
                "Interleukin-18 (IL-18)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-24 (IL-24)",
                "Interleukin-26 (IL-26)",
                "Interleukin-27 (IL-27)",
                "Interleukin-28 (IL-28)",
                "Interleukin-29 (IL-29)",
                "Interleukin-30 (IL-30)",
                "Interleukin-31 (IL-31)",
                "Interleukin-32 (IL-32)",
                "Interleukin-33 (IL-33)",
                "Interleukin-34 (IL-34)",
                "Interleukin-35 (IL-35)",
                "Granulocyte colony-stimulating factor (G-CSF)",
                "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
                "Macrophage colony-stimulating factor (M-CSF)"
            ],
            "true_referents": [
                "Interferon alpha-2",
                "Interferon beta-1a",
                "Interferon beta-1b",
                "Interferon-alpha",
                "Interferon-beta",
                "Interferon-gamma",
                "Interferons",
                "Interleukin-1",
                "Interleukin-10",
                "Interleukin-11",
                "Interleukin-12",
                "Interleukin-13",
                "Interleukin-15",
                "Interleukin-16",
                "Interleukin-17",
                "Interleukin-1alpha",
                "Interleukin-2",
                "Interleukin-23",
                "Interleukin-3",
                "Interleukin-4",
                "Interleukin-5",
                "Interleukin-6",
                "Interleukin-7",
                "Interleukin-8",
                "Interleukin-9",
                "Tumor Necrosis Factor-alpha",
                "Tumor Necrosis Factors"
            ],
            "TP": 21,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "cytokine",
        "domain": "biology",
        "response": "{\n    \"referent\": \"Interleukin 1\",\n    \"canonical name\": \"IL1\"\n},\n{\n    \"referent\": \"Interleukin 2\",\n    \"canonical name\": \"IL2\"\n},\n{\n    \"referent\": \"Interleukin 3\",\n    \"canonical name\": \"IL3\"\n},\n{\n    \"referent\": \"Interleukin 4\",\n    \"canonical name\": \"IL4\"\n},\n{\n    \"referent\": \"Interleukin 5\",\n    \"canonical name\": \"IL5\"\n},\n{\n    \"referent\": \"Interleukin 6\",\n    \"canonical name\": \"IL6\"\n},\n{\n    \"referent\": \"Interleukin 7\",\n    \"canonical name\": \"IL7\"\n},\n{\n    \"referent\": \"Interleukin 8\",\n    \"canonical name\": \"IL8\"\n},\n{\n    \"referent\": \"Interleukin 9\",\n    \"canonical name\": \"IL9\"\n},\n{\n    \"referent\": \"Interleukin 10\",\n    \"canonical name\": \"IL10\"\n},\n{\n    \"referent\": \"Interleukin 11\",\n    \"canonical name\": \"IL11\"\n},\n{\n    \"referent\": \"Interleukin 12\",\n    \"canonical name\": \"IL12\"\n},\n{\n    \"referent\": \"Interleukin 13\",\n    \"canonical name\": \"IL13\"\n},\n{\n    \"referent\": \"Interleukin 14\",\n    \"canonical name\": \"IL14\"\n},\n{\n    \"referent\": \"Interleukin 15\",\n    \"canonical name\": \"IL15\"\n},\n{\n    \"referent\": \"Interleukin 16\",\n    \"canonical name\": \"IL16\"\n},\n{\n    \"referent\": \"Interleukin 17\",\n    \"canonical name\": \"IL17\"\n},\n{\n    \"referent\": \"Interleukin 18\",\n    \"canonical name\": \"IL18\"\n},\n{\n    \"referent\": \"Interleukin 19\",\n    \"canonical name\": \"IL19\"\n},\n{\n    \"referent\": \"Interleukin 20\",\n    \"canonical name\": \"IL20\"\n},\n{\n    \"referent\": \"Interleukin 21\",\n    \"canonical name\": \"IL21\"\n},\n{\n    \"referent\": \"Interleukin 22\",\n    \"canonical name\": \"IL22\"\n},\n{\n    \"referent\": \"Interleukin 23\",\n    \"canonical name\": \"IL23\"\n},\n{\n    \"referent\": \"Interleukin 24\",\n    \"canonical name\": \"IL24\"\n},\n{\n    \"referent\": \"Interleukin 25\",\n    \"canonical name\": \"IL25\"\n},\n{\n    \"referent\": \"Interleukin 26\",\n    \"canonical name\": \"IL26\"\n},\n{\n    \"referent\": \"Interleukin 27\",\n    \"canonical name\": \"IL27\"\n},\n{\n    \"referent\": \"Interleukin 28\",\n    \"canonical name\": \"IL28\"\n},\n{\n    \"referent\": \"Interleukin 29\",\n    \"canonical name\": \"IL29\"\n},\n{\n    \"referent\": \"Interleukin 30\",\n    \"canonical name\": \"IL30\"\n},\n{\n    \"referent\": \"Interleukin 31\",\n    \"canonical name\": \"IL31\"\n},\n{\n    \"referent\": \"Interleukin 33\",\n    \"canonical name\": \"IL33\"\n},\n{\n    \"referent\": \"Interleukin 34\",\n    \"canonical name\": \"IL34\"\n},\n{\n    \"referent\": \"Interleukin 35\",\n    \"canonical name\": \"IL35\"\n}",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]