[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "IL-10 (IL-10)",
            "TGF-beta (TGF-\u03b2)",
            "IL-1 receptor antagonist (IL-1ra)",
            "IL-13 (IL-13)",
            "IL-4 (IL-4)",
            "IL-17A (IL-17A)",
            "IL-27 (IL-27)",
            "IL-35 (IL-35)",
            "PGE2 (PGE2)",
            "IL-18 binding protein (IL-18BP)",
            "CRF (CRF)",
            "IL-18 binding protein (IL-18BP)",
            "IL-22 (IL-22)",
            "IL-6 (IL-6)",
            "IL-21 (IL-21)",
            "IL-33 (IL-33)",
            "IL-25 (IL-25)",
            "IL-37 (IL-37)",
            "IL-38 (IL-38)",
            "IL-12p40 (p40)",
            "IL-15 (IL-15)",
            "IL-9 (IL-9)",
            "IL-2 (IL-2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "IL-10 (IL-10)",
                "TGF-beta (TGF-\u03b2)",
                "IL-1 receptor antagonist (IL-1ra)",
                "IL-13 (IL-13)",
                "IL-4 (IL-4)",
                "IL-17A (IL-17A)",
                "IL-27 (IL-27)",
                "IL-35 (IL-35)",
                "PGE2 (PGE2)",
                "IL-18 binding protein (IL-18BP)",
                "CRF (CRF)",
                "IL-22 (IL-22)",
                "IL-6 (IL-6)",
                "IL-21 (IL-21)",
                "IL-33 (IL-33)",
                "IL-25 (IL-25)",
                "IL-37 (IL-37)",
                "IL-38 (IL-38)",
                "IL-12p40 (p40)",
                "IL-15 (IL-15)",
                "IL-9 (IL-9)",
                "IL-2 (IL-2)"
            ],
            "mismatches": [],
            "true_referents": [
                "CRF (CRF)",
                "IL-1 receptor antagonist (IL-1ra)",
                "IL-10 (IL-10)",
                "IL-12p40 (p40)",
                "IL-13 (IL-13)",
                "IL-15 (IL-15)",
                "IL-17A (IL-17A)",
                "IL-18 binding protein (IL-18BP)",
                "IL-2 (IL-2)",
                "IL-21 (IL-21)",
                "IL-22 (IL-22)",
                "IL-25 (IL-25)",
                "IL-27 (IL-27)",
                "IL-33 (IL-33)",
                "IL-35 (IL-35)",
                "IL-37 (IL-37)",
                "IL-38 (IL-38)",
                "IL-4 (IL-4)",
                "IL-6 (IL-6)",
                "IL-9 (IL-9)",
                "PGE2 (PGE2)",
                "TGF-beta (TGF-\u03b2)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Interleukin-35 (IL-35)",
            "Interleukin-4 (IL-4)",
            "Interleukin-27 (IL-27)",
            "Interleukin-13 (IL-13)",
            "Interleukin-1 receptor antagonist (IL-1Ra)",
            "Interleukin-9 (IL-9)",
            "Interleukin-25 (IL-25)",
            "Interleukin-31 (IL-31)",
            "Interleukin-37 (IL-37)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-17A (IL-17A)",
            "Interleukin-6 (IL-6)",
            "Interleukin-11 (IL-11)",
            "Interleukin-21 (IL-21)",
            "Interleukin-2 (IL-2)",
            "Interleukin-5 (IL-5)",
            "Interleukin-17F (IL-17F)",
            "Interleukin-18 (IL-18)",
            "Interleukin-12 (IL-12)",
            "Interleukin-23 (IL-23)",
            "Interleukin-28B (IL-28B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Interleukin-35 (IL-35)",
                "Interleukin-4 (IL-4)",
                "Interleukin-27 (IL-27)",
                "Interleukin-13 (IL-13)",
                "Interleukin-1 receptor antagonist (IL-1Ra)",
                "Interleukin-9 (IL-9)",
                "Interleukin-25 (IL-25)",
                "Interleukin-31 (IL-31)",
                "Interleukin-37 (IL-37)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-17A (IL-17A)",
                "Interleukin-6 (IL-6)",
                "Interleukin-11 (IL-11)",
                "Interleukin-21 (IL-21)",
                "Interleukin-2 (IL-2)",
                "Interleukin-5 (IL-5)",
                "Interleukin-17F (IL-17F)",
                "Interleukin-18 (IL-18)",
                "Interleukin-12 (IL-12)",
                "Interleukin-28B (IL-28B)"
            ],
            "mismatches": [],
            "true_referents": [
                "Interleukin-1 receptor antagonist (IL-1Ra)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-17A (IL-17A)",
                "Interleukin-17F (IL-17F)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-25 (IL-25)",
                "Interleukin-27 (IL-27)",
                "Interleukin-28B (IL-28B)",
                "Interleukin-31 (IL-31)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-9 (IL-9)",
                "Transforming Growth Factor-beta (TGF-\u03b2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming growth factor beta (TGF-\u03b2)",
            "Interleukin-35 (IL-35)",
            "Interleukin-1 receptor antagonist (IL-1RA)",
            "Interleukin-13 (IL-13)",
            "Interleukin-4 (IL-4)",
            "Interleukin-27 (IL-27)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-8 (IL-8)",
            "Interleukin-9 (IL-9)",
            "Interleukin-11 (IL-11)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-16 (IL-16)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-19 (IL-19)",
            "Interleukin-20 (IL-20)",
            "Interleukin-21 (IL-21)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-24 (IL-24)",
            "Interleukin-25 (IL-25)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming growth factor beta (TGF-\u03b2)",
                "Interleukin-35 (IL-35)",
                "Interleukin-1 receptor antagonist (IL-1RA)",
                "Interleukin-13 (IL-13)",
                "Interleukin-4 (IL-4)",
                "Interleukin-27 (IL-27)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-24 (IL-24)",
                "Interleukin-25 (IL-25)"
            ],
            "mismatches": [],
            "true_referents": [
                "Interleukin-1 receptor antagonist (IL-1RA)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-19 (IL-19)",
                "Interleukin-2 (IL-2)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-24 (IL-24)",
                "Interleukin-25 (IL-25)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Transforming growth factor beta (TGF-\u03b2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor beta (TGF-\u03b2)",
            "Interleukin-35 (IL-35)",
            "Regulatory T cell-derived Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Tumor Necrosis Factor alpha (TNF-\u03b1) - in certain contexts",
            "Prostaglandin E2 (PGE2)",
            "Cortisol",
            "Cyclosporine A",
            "Tacrolimus",
            "Sirolimus",
            "Dexamethasone",
            "Prednisolone",
            "Indomethacin",
            "Galectin-1",
            "Arginase 1",
            "IDO1 (Indoleamine 2,3-dioxygenase 1)",
            "PD-1 Ligand 1 (PD-L1)",
            "PD-1 Ligand 2 (PD-L2)",
            "CTLA-4",
            "IL-27",
            "Lipoxins",
            "Resolvins",
            "Protectins",
            "Maresins"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor beta (TGF-\u03b2)",
                "Interleukin-35 (IL-35)",
                "Regulatory T cell-derived Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Tumor Necrosis Factor alpha (TNF-\u03b1) - in certain contexts",
                "Prostaglandin E2 (PGE2)",
                "Cortisol",
                "Cyclosporine A",
                "Tacrolimus",
                "Sirolimus",
                "Dexamethasone",
                "Prednisolone",
                "Indomethacin",
                "Galectin-1",
                "Arginase 1",
                "IDO1 (Indoleamine 2,3-dioxygenase 1)",
                "PD-1 Ligand 1 (PD-L1)",
                "PD-1 Ligand 2 (PD-L2)",
                "CTLA-4",
                "IL-27",
                "Lipoxins",
                "Resolvins",
                "Protectins",
                "Maresins"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginase 1",
                "CTLA-4",
                "Cortisol",
                "Cyclosporine A",
                "Dexamethasone",
                "Galectin-1",
                "IDO1 (Indoleamine 2,3-dioxygenase 1)",
                "IL-27",
                "Indomethacin",
                "Interleukin-10 (IL-10)",
                "Interleukin-35 (IL-35)",
                "Lipoxins",
                "Maresins",
                "PD-1 Ligand 1 (PD-L1)",
                "PD-1 Ligand 2 (PD-L2)",
                "Prednisolone",
                "Prostaglandin E2 (PGE2)",
                "Protectins",
                "Regulatory T cell-derived Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Resolvins",
                "Sirolimus",
                "Tacrolimus",
                "Transforming Growth Factor beta (TGF-\u03b2)",
                "Tumor Necrosis Factor alpha (TNF-\u03b1) - in certain contexts"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Transforming Growth Factor Beta (TGF-\u03b2)",
            "Interleukin-10 (IL-10)",
            "Interleukin-35 (IL-35)",
            "Interleukin-27 (IL-27)",
            "Interleukin-19 (IL-19)",
            "Interleukin-24 (IL-24)",
            "Interleukin-37 (IL-37)",
            "Interleukin-38 (IL-38)",
            "Interleukin-22 (IL-22)",
            "Interleukin-9 (IL-9)",
            "Interleukin-20 (IL-20)",
            "Interleukin-29 (IL-29)",
            "Interleukin-31 (IL-31)",
            "Interleukin-32 (IL-32)",
            "Interleukin-34 (IL-34)",
            "Interleukin-35 (IL-35)",
            "Interleukin-40 (IL-40)",
            "Interleukin-41 (IL-41)",
            "Interleukin-42 (IL-42)",
            "Interleukin-43 (IL-43)",
            "Interleukin-44 (IL-44)",
            "Interleukin-45 (IL-45)",
            "Interleukin-46 (IL-46)",
            "Interleukin-47 (IL-47)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Interleukin-10 (IL-10)",
                "Interleukin-35 (IL-35)",
                "Interleukin-27 (IL-27)",
                "Interleukin-19 (IL-19)",
                "Interleukin-24 (IL-24)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)",
                "Interleukin-22 (IL-22)",
                "Interleukin-9 (IL-9)",
                "Interleukin-20 (IL-20)",
                "Interleukin-29 (IL-29)",
                "Interleukin-31 (IL-31)",
                "Interleukin-32 (IL-32)",
                "Interleukin-34 (IL-34)",
                "Interleukin-40 (IL-40)",
                "Interleukin-41 (IL-41)",
                "Interleukin-42 (IL-42)",
                "Interleukin-43 (IL-43)",
                "Interleukin-44 (IL-44)",
                "Interleukin-45 (IL-45)",
                "Interleukin-46 (IL-46)",
                "Interleukin-47 (IL-47)"
            ],
            "mismatches": [],
            "true_referents": [
                "Interleukin-10 (IL-10)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-22 (IL-22)",
                "Interleukin-24 (IL-24)",
                "Interleukin-27 (IL-27)",
                "Interleukin-29 (IL-29)",
                "Interleukin-31 (IL-31)",
                "Interleukin-32 (IL-32)",
                "Interleukin-34 (IL-34)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)",
                "Interleukin-40 (IL-40)",
                "Interleukin-41 (IL-41)",
                "Interleukin-42 (IL-42)",
                "Interleukin-43 (IL-43)",
                "Interleukin-44 (IL-44)",
                "Interleukin-45 (IL-45)",
                "Interleukin-46 (IL-46)",
                "Interleukin-47 (IL-47)",
                "Interleukin-9 (IL-9)",
                "Transforming Growth Factor Beta (TGF-\u03b2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Transforming Growth Factor Beta (TGF-\u03b2)",
            "Interleukin-10 (IL-10)",
            "Interleukin-4 (IL-4)",
            "Interleukin-13 (IL-13)",
            "Interleukin-35 (IL-35)",
            "Interleukin-9 (IL-9)",
            "Interleukin-21 (IL-21)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Prostaglandin E2 (PGE2)",
            "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
            "Interferon Gamma (IFN-\u03b3)",
            "Interleukin-6 (IL-6)",
            "Interleukin-1 Receptor Antagonist (IL-1Ra)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Macrophage Inflammatory Protein-1 Alpha (MIP-1\u03b1)",
            "C-C Motif Chemokine Ligand 22 (CCL22)",
            "Cytokine-Induced Neutrophil Chemoattractant 1 (CINC-1)",
            "Interleukin-12 (IL-12)",
            "Interleukin-27 (IL-27)",
            "Interleukin-15 (IL-15)",
            "Interleukin-2 (IL-2)",
            "Interleukin-5 (IL-5)",
            "Interleukin-18 (IL-18)",
            "Interleukin-17 (IL-17)",
            "Interleukin-8 (IL-8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Interleukin-10 (IL-10)",
                "Interleukin-4 (IL-4)",
                "Interleukin-13 (IL-13)",
                "Interleukin-35 (IL-35)",
                "Interleukin-9 (IL-9)",
                "Interleukin-21 (IL-21)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Prostaglandin E2 (PGE2)",
                "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
                "Interferon Gamma (IFN-\u03b3)",
                "Interleukin-6 (IL-6)",
                "Interleukin-1 Receptor Antagonist (IL-1Ra)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Macrophage Inflammatory Protein-1 Alpha (MIP-1\u03b1)",
                "C-C Motif Chemokine Ligand 22 (CCL22)",
                "Cytokine-Induced Neutrophil Chemoattractant 1 (CINC-1)",
                "Interleukin-12 (IL-12)",
                "Interleukin-27 (IL-27)",
                "Interleukin-15 (IL-15)",
                "Interleukin-2 (IL-2)",
                "Interleukin-5 (IL-5)",
                "Interleukin-18 (IL-18)",
                "Interleukin-17 (IL-17)"
            ],
            "mismatches": [
                "Interleukin-8 (IL-8)"
            ],
            "true_referents": [
                "C-C Motif Chemokine Ligand 22 (CCL22)",
                "Cytokine-Induced Neutrophil Chemoattractant 1 (CINC-1)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon Gamma (IFN-\u03b3)",
                "Interleukin-1 Receptor Antagonist (IL-1Ra)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-9 (IL-9)",
                "Macrophage Inflammatory Protein-1 Alpha (MIP-1\u03b1)",
                "Prostaglandin E2 (PGE2)",
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Transforming Growth Factor Beta (TGF-\u03b2)",
            "Interleukin 10 (IL-10)",
            "Interleukin 35 (IL-35)",
            "Interleukin 4 (IL-4)",
            "Interleukin 13 (IL-13)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Fibroblast Growth Factor (FGF)",
            "Platelet-Derived Growth Factor (PDGF)",
            "Interferon Alpha (IFN\u03b1)",
            "Interferon Beta (IFN\u03b2)",
            "Tumor Necrosis Factor Beta (TNF-\u03b2)",
            "Colony Stimulating Factor 1 (CSF1)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Interleukin 27 (IL-27)",
            "Interleukin 37 (IL-37)",
            "Interleukin 38 (IL-38)",
            "Interleukin 1 Receptor Antagonist (IL1RA)",
            "Interleukin 11 (IL-11)",
            "Interleukin 24 (IL-24)",
            "Interleukin 33 (IL-33)",
            "Interleukin 36 (IL-36)",
            "Interleukin 9 (IL-9)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Interleukin 10 (IL-10)",
                "Interleukin 35 (IL-35)",
                "Interleukin 4 (IL-4)",
                "Interleukin 13 (IL-13)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Fibroblast Growth Factor (FGF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Interferon Alpha (IFN\u03b1)",
                "Interferon Beta (IFN\u03b2)",
                "Tumor Necrosis Factor Beta (TNF-\u03b2)",
                "Colony Stimulating Factor 1 (CSF1)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Interleukin 27 (IL-27)",
                "Interleukin 37 (IL-37)",
                "Interleukin 38 (IL-38)",
                "Interleukin 1 Receptor Antagonist (IL1RA)",
                "Interleukin 11 (IL-11)",
                "Interleukin 24 (IL-24)",
                "Interleukin 33 (IL-33)",
                "Interleukin 36 (IL-36)",
                "Interleukin 9 (IL-9)"
            ],
            "mismatches": [],
            "true_referents": [
                "Colony Stimulating Factor 1 (CSF1)",
                "Fibroblast Growth Factor (FGF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon Alpha (IFN\u03b1)",
                "Interferon Beta (IFN\u03b2)",
                "Interleukin 1 Receptor Antagonist (IL1RA)",
                "Interleukin 10 (IL-10)",
                "Interleukin 11 (IL-11)",
                "Interleukin 13 (IL-13)",
                "Interleukin 24 (IL-24)",
                "Interleukin 27 (IL-27)",
                "Interleukin 33 (IL-33)",
                "Interleukin 35 (IL-35)",
                "Interleukin 36 (IL-36)",
                "Interleukin 37 (IL-37)",
                "Interleukin 38 (IL-38)",
                "Interleukin 4 (IL-4)",
                "Interleukin 9 (IL-9)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Tumor Necrosis Factor Beta (TNF-\u03b2)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor-beta (TGF-beta)",
            "Interleukin-4 (IL-4)",
            "Interleukin-13 (IL-13)",
            "Interleukin-35 (IL-35)",
            "Interleukin-27 (IL-27)",
            "Interleukin-1 receptor antagonist (IL-1ra)",
            "Interleukin-18 binding protein (IL-18BP)",
            "Interleukin-11 (IL-11)",
            "Interleukin-6 (IL-6)",
            "Tumor necrosis factor-alpha (TNF-alpha)",
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-3 (IL-3)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-16 (IL-16)",
            "Interleukin-17 (IL-17)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Interleukin-25 (IL-25)",
            "Interleukin-31 (IL-31)",
            "Interleukin-33 (IL-33)",
            "Interferon-gamma (IFN-gamma)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor-beta (TGF-beta)",
                "Interleukin-4 (IL-4)",
                "Interleukin-13 (IL-13)",
                "Interleukin-35 (IL-35)",
                "Interleukin-27 (IL-27)",
                "Interleukin-1 receptor antagonist (IL-1ra)",
                "Interleukin-18 binding protein (IL-18BP)",
                "Interleukin-11 (IL-11)",
                "Interleukin-6 (IL-6)",
                "Tumor necrosis factor-alpha (TNF-alpha)",
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-3 (IL-3)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-25 (IL-25)",
                "Interleukin-31 (IL-31)",
                "Interleukin-33 (IL-33)",
                "Interferon-gamma (IFN-gamma)"
            ],
            "mismatches": [],
            "true_referents": [
                "Interferon-gamma (IFN-gamma)",
                "Interleukin-1 (IL-1)",
                "Interleukin-1 receptor antagonist (IL-1ra)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 binding protein (IL-18BP)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-25 (IL-25)",
                "Interleukin-27 (IL-27)",
                "Interleukin-3 (IL-3)",
                "Interleukin-31 (IL-31)",
                "Interleukin-33 (IL-33)",
                "Interleukin-35 (IL-35)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Transforming Growth Factor-beta (TGF-beta)",
                "Tumor necrosis factor-alpha (TNF-alpha)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-13 (IL-13)",
            "Interleukin-35 (IL-35)",
            "Interleukin-27 (IL-27)",
            "Interleukin-37 (IL-37)",
            "Interleukin-1 receptor antagonist (IL-1ra)",
            "Interleukin-19 (IL-19)",
            "Interleukin-20 (IL-20)",
            "Interleukin-22 (IL-22)",
            "Interleukin-24 (IL-24)",
            "Interleukin-38 (IL-38)",
            "Interleukin-16 (IL-16)",
            "Interleukin-9 (IL-9)",
            "Interleukin-7 (IL-7)",
            "Interleukin-15 (IL-15)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Interleukin-17F (IL-17F)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-13 (IL-13)",
                "Interleukin-35 (IL-35)",
                "Interleukin-27 (IL-27)",
                "Interleukin-37 (IL-37)",
                "Interleukin-1 receptor antagonist (IL-1ra)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-22 (IL-22)",
                "Interleukin-24 (IL-24)",
                "Interleukin-38 (IL-38)",
                "Interleukin-16 (IL-16)",
                "Interleukin-9 (IL-9)",
                "Interleukin-7 (IL-7)",
                "Interleukin-15 (IL-15)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-17F (IL-17F)"
            ],
            "mismatches": [],
            "true_referents": [
                "Interleukin-1 receptor antagonist (IL-1ra)",
                "Interleukin-10 (IL-10)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17F (IL-17F)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-24 (IL-24)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)",
                "Interleukin-4 (IL-4)",
                "Interleukin-7 (IL-7)",
                "Interleukin-9 (IL-9)",
                "Transforming Growth Factor-beta (TGF-\u03b2)"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor Beta (TGF-\u03b2)",
            "Interleukin-35 (IL-35)",
            "Interleukin-37 (IL-37)",
            "Prostaglandin E2 (PGE2)",
            "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
            "Interleukin-4 (IL-4)",
            "Interleukin-13 (IL-13)",
            "Interleukin-22 (IL-22)",
            "Interleukin-27 (IL-27)",
            "Interleukin-33 (IL-33)",
            "Interleukin-38 (IL-38)",
            "Interferon Beta (IFN-\u03b2)",
            "Leukemia Inhibitory Factor (LIF)",
            "Activin A",
            "Melanoma Differentiation-Associated Protein 5 (MDA5)",
            "Galectin-1",
            "Indoleamine 2,3-dioxygenase (IDO)",
            "Programmed Death-Ligand 1 (PD-L1)",
            "Cytotoxic T-Lymphocyte-Associated Protein 4 (CTLA-4)",
            "Lymphocyte-Activation Gene 3 (LAG-3)",
            "T-Cell Immunoglobulin and Mucin-Domain Containing-3 (TIM-3)",
            "V-Domain Ig Suppressor of T Cell Activation (VISTA)",
            "B and T Lymphocyte Attenuator (BTLA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Prostaglandin E2 (PGE2)",
                "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
                "Interleukin-4 (IL-4)",
                "Interleukin-13 (IL-13)",
                "Interleukin-22 (IL-22)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-38 (IL-38)",
                "Interferon Beta (IFN-\u03b2)",
                "Leukemia Inhibitory Factor (LIF)",
                "Activin A",
                "Melanoma Differentiation-Associated Protein 5 (MDA5)",
                "Galectin-1",
                "Indoleamine 2,3-dioxygenase (IDO)",
                "Programmed Death-Ligand 1 (PD-L1)",
                "Cytotoxic T-Lymphocyte-Associated Protein 4 (CTLA-4)",
                "Lymphocyte-Activation Gene 3 (LAG-3)",
                "T-Cell Immunoglobulin and Mucin-Domain Containing-3 (TIM-3)",
                "V-Domain Ig Suppressor of T Cell Activation (VISTA)",
                "B and T Lymphocyte Attenuator (BTLA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activin A",
                "B and T Lymphocyte Attenuator (BTLA)",
                "Cytotoxic T-Lymphocyte-Associated Protein 4 (CTLA-4)",
                "Galectin-1",
                "Indoleamine 2,3-dioxygenase (IDO)",
                "Interferon Beta (IFN-\u03b2)",
                "Interleukin-10 (IL-10)",
                "Interleukin-13 (IL-13)",
                "Interleukin-22 (IL-22)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)",
                "Interleukin-4 (IL-4)",
                "Leukemia Inhibitory Factor (LIF)",
                "Lymphocyte-Activation Gene 3 (LAG-3)",
                "Melanoma Differentiation-Associated Protein 5 (MDA5)",
                "Programmed Death-Ligand 1 (PD-L1)",
                "Prostaglandin E2 (PGE2)",
                "T-Cell Immunoglobulin and Mucin-Domain Containing-3 (TIM-3)",
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Tumor Necrosis Factor Alpha (TNF-\u03b1)",
                "V-Domain Ig Suppressor of T Cell Activation (VISTA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming growth factor beta (TGF-\u03b2)",
            "Interleukin-35 (IL-35)",
            "Interleukin-27 (IL-27)",
            "Interleukin-1 receptor antagonist (IL-1RA)",
            "Prostaglandin E2 (PGE2)",
            "Adenosine",
            "Vasoactive intestinal peptide (VIP)",
            "Somatostatin (SST)",
            "Alpha-melanocyte stimulating hormone (\u03b1-MSH)",
            "Lipoxins",
            "Resolvins",
            "Protectins",
            "Annexin A1",
            "Galectin-1",
            "Galectin-9",
            "Indoleamine 2,3-dioxygenase (IDO)",
            "Arginase",
            "Heme oxygenase-1 (HO-1)",
            "Nitric oxide (NO)",
            "Carbon monoxide (CO)",
            "Hydrogen sulfide (H2S)",
            "Soluble tumor necrosis factor receptor (sTNFR)",
            "Soluble interleukin-1 receptor (sIL-1R)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming growth factor beta (TGF-\u03b2)",
                "Interleukin-35 (IL-35)",
                "Interleukin-27 (IL-27)",
                "Interleukin-1 receptor antagonist (IL-1RA)",
                "Prostaglandin E2 (PGE2)",
                "Adenosine",
                "Vasoactive intestinal peptide (VIP)",
                "Somatostatin (SST)",
                "Alpha-melanocyte stimulating hormone (\u03b1-MSH)",
                "Lipoxins",
                "Resolvins",
                "Protectins",
                "Annexin A1",
                "Galectin-1",
                "Galectin-9",
                "Indoleamine 2,3-dioxygenase (IDO)",
                "Arginase",
                "Heme oxygenase-1 (HO-1)",
                "Nitric oxide (NO)",
                "Carbon monoxide (CO)",
                "Hydrogen sulfide (H2S)",
                "Soluble tumor necrosis factor receptor (sTNFR)",
                "Soluble interleukin-1 receptor (sIL-1R)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adenosine",
                "Alpha-melanocyte stimulating hormone (\u03b1-MSH)",
                "Annexin A1",
                "Arginase",
                "Carbon monoxide (CO)",
                "Galectin-1",
                "Galectin-9",
                "Heme oxygenase-1 (HO-1)",
                "Hydrogen sulfide (H2S)",
                "Indoleamine 2,3-dioxygenase (IDO)",
                "Interleukin-1 receptor antagonist (IL-1RA)",
                "Interleukin-10 (IL-10)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)",
                "Lipoxins",
                "Nitric oxide (NO)",
                "Prostaglandin E2 (PGE2)",
                "Protectins",
                "Resolvins",
                "Soluble interleukin-1 receptor (sIL-1R)",
                "Soluble tumor necrosis factor receptor (sTNFR)",
                "Somatostatin (SST)",
                "Transforming growth factor beta (TGF-\u03b2)",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor Beta (TGF-\u03b2)",
            "Interleukin-35 (IL-35)",
            "Interleukin-37 (IL-37)",
            "Interleukin-27 (IL-27)",
            "Interleukin-22 (IL-22)",
            "Glucocorticoids",
            "Prostaglandin E2 (PGE2)",
            "Indoleamine 2,3-dioxygenase (IDO)",
            "Cytotoxic T-Lymphocyte Antigen 4 (CTLA-4)",
            "Programmed Cell Death Protein 1 (PD-1)",
            "Programmed Death-Ligand 1 (PD-L1)",
            "Galectin-9",
            "Adenosine",
            "Leukemia Inhibitory Factor (LIF)",
            "Interleukin-16 (IL-16)",
            "Interleukin-1 Receptor Antagonist (IL-1RA)",
            "Soluble Tumor Necrosis Factor Receptor (sTNFR)",
            "Interleukin-38 (IL-38)",
            "Interleukin-24 (IL-24)",
            "Interleukin-36 Receptor Antagonist (IL-36Ra)",
            "Interleukin-1 Family Member 7 (IL-1F7)",
            "Interleukin-1 Family Member 10 (IL-1F10)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor Beta (TGF-\u03b2)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-27 (IL-27)",
                "Interleukin-22 (IL-22)",
                "Glucocorticoids",
                "Prostaglandin E2 (PGE2)",
                "Indoleamine 2,3-dioxygenase (IDO)",
                "Cytotoxic T-Lymphocyte Antigen 4 (CTLA-4)",
                "Programmed Cell Death Protein 1 (PD-1)",
                "Programmed Death-Ligand 1 (PD-L1)",
                "Galectin-9",
                "Adenosine",
                "Leukemia Inhibitory Factor (LIF)",
                "Interleukin-16 (IL-16)",
                "Interleukin-1 Receptor Antagonist (IL-1RA)",
                "Soluble Tumor Necrosis Factor Receptor (sTNFR)",
                "Interleukin-38 (IL-38)",
                "Interleukin-24 (IL-24)",
                "Interleukin-36 Receptor Antagonist (IL-36Ra)",
                "Interleukin-1 Family Member 7 (IL-1F7)",
                "Interleukin-1 Family Member 10 (IL-1F10)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adenosine",
                "Cytotoxic T-Lymphocyte Antigen 4 (CTLA-4)",
                "Galectin-9",
                "Glucocorticoids",
                "Indoleamine 2,3-dioxygenase (IDO)",
                "Interleukin-1 Family Member 10 (IL-1F10)",
                "Interleukin-1 Family Member 7 (IL-1F7)",
                "Interleukin-1 Receptor Antagonist (IL-1RA)",
                "Interleukin-10 (IL-10)",
                "Interleukin-16 (IL-16)",
                "Interleukin-22 (IL-22)",
                "Interleukin-24 (IL-24)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)",
                "Interleukin-36 Receptor Antagonist (IL-36Ra)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)",
                "Leukemia Inhibitory Factor (LIF)",
                "Programmed Cell Death Protein 1 (PD-1)",
                "Programmed Death-Ligand 1 (PD-L1)",
                "Prostaglandin E2 (PGE2)",
                "Soluble Tumor Necrosis Factor Receptor (sTNFR)",
                "Transforming Growth Factor Beta (TGF-\u03b2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-10 (IL-10)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Programmed Death-Ligand 1 (PD-L1)",
            "Cytotoxic T-Lymphocyte-Associated Protein 4 (CTLA-4)",
            "Adenosine",
            "Prostaglandin E2 (PGE2)",
            "Indoleamine 2,3-Dioxygenase (IDO)",
            "Heme Oxygenase-1 (HO-1)",
            "Regulatory T Cells (Tregs)",
            "Myeloid-Derived Suppressor Cells (MDSCs)",
            "Tumor-Associated Macrophages (TAMs)",
            "Mesenchymal Stem Cells (MSCs)",
            "Glucocorticoids",
            "Vitamin D3",
            "Interleukin-35 (IL-35)",
            "Galectin-1",
            "Galectin-3",
            "Interleukin-27 (IL-27)",
            "Leukemia Inhibitory Factor (LIF)",
            "Oncostatin M (OSM)",
            "Carcinoembryonic Antigen (CEA)",
            "Alpha-Fetoprotein (AFP)",
            "Prostate-Specific Antigen (PSA)",
            "Human Chorionic Gonadotropin (hCG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10 (IL-10)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Programmed Death-Ligand 1 (PD-L1)",
                "Cytotoxic T-Lymphocyte-Associated Protein 4 (CTLA-4)",
                "Adenosine",
                "Prostaglandin E2 (PGE2)",
                "Indoleamine 2,3-Dioxygenase (IDO)",
                "Heme Oxygenase-1 (HO-1)",
                "Regulatory T Cells (Tregs)",
                "Myeloid-Derived Suppressor Cells (MDSCs)",
                "Tumor-Associated Macrophages (TAMs)",
                "Mesenchymal Stem Cells (MSCs)",
                "Glucocorticoids",
                "Vitamin D3",
                "Interleukin-35 (IL-35)",
                "Galectin-1",
                "Galectin-3",
                "Interleukin-27 (IL-27)",
                "Leukemia Inhibitory Factor (LIF)",
                "Oncostatin M (OSM)",
                "Carcinoembryonic Antigen (CEA)",
                "Alpha-Fetoprotein (AFP)",
                "Prostate-Specific Antigen (PSA)",
                "Human Chorionic Gonadotropin (hCG)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adenosine",
                "Alpha-Fetoprotein (AFP)",
                "Carcinoembryonic Antigen (CEA)",
                "Cytotoxic T-Lymphocyte-Associated Protein 4 (CTLA-4)",
                "Galectin-1",
                "Galectin-3",
                "Glucocorticoids",
                "Heme Oxygenase-1 (HO-1)",
                "Human Chorionic Gonadotropin (hCG)",
                "Indoleamine 2,3-Dioxygenase (IDO)",
                "Interleukin-10 (IL-10)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)",
                "Leukemia Inhibitory Factor (LIF)",
                "Mesenchymal Stem Cells (MSCs)",
                "Myeloid-Derived Suppressor Cells (MDSCs)",
                "Oncostatin M (OSM)",
                "Programmed Death-Ligand 1 (PD-L1)",
                "Prostaglandin E2 (PGE2)",
                "Prostate-Specific Antigen (PSA)",
                "Regulatory T Cells (Tregs)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor-Associated Macrophages (TAMs)",
                "Vitamin D3"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "TGF-beta (TGF\u03b2)",
            "IL-10",
            "IL-4",
            "IL-22",
            "IL-35",
            "IL-27",
            "IL-31",
            "IL-39",
            "IL-33",
            "IL-37",
            "TGF-alpha",
            "Fas ligand",
            "GITR ligand",
            "CTLA-4 ligand",
            "PD-1 ligand",
            "PD-L1",
            "PD-L2",
            "Vegf-C",
            "Vegf-D",
            "Vegf-E",
            "Vegf-F",
            "Vegf-B",
            "HGF",
            "GDF-15",
            "GDF-16",
            "GDF-17"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TGF-beta (TGF\u03b2)",
                "IL-10",
                "IL-4",
                "IL-22",
                "IL-35",
                "IL-27",
                "IL-31",
                "IL-39",
                "IL-33",
                "IL-37",
                "TGF-alpha",
                "Fas ligand",
                "GITR ligand",
                "CTLA-4 ligand",
                "PD-1 ligand",
                "PD-L1",
                "PD-L2",
                "Vegf-C",
                "Vegf-D",
                "Vegf-E",
                "Vegf-F",
                "Vegf-B",
                "HGF",
                "GDF-15"
            ],
            "mismatches": [
                "GDF-16",
                "GDF-17"
            ],
            "true_referents": [
                "CTLA-4 ligand",
                "Fas ligand",
                "GDF-15",
                "GITR ligand",
                "HGF",
                "IL-10",
                "IL-22",
                "IL-27",
                "IL-31",
                "IL-33",
                "IL-35",
                "IL-37",
                "IL-39",
                "IL-4",
                "PD-1 ligand",
                "PD-L1",
                "PD-L2",
                "TGF-alpha",
                "TGF-beta (TGF\u03b2)",
                "Vegf-B",
                "Vegf-C",
                "Vegf-D",
                "Vegf-E",
                "Vegf-F"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "TGF-beta (TGFB)",
            "IL-10 (IL10)",
            "IL-35",
            "TSLP",
            "GDF-15",
            "CTLA-4",
            "PD-1",
            "PD-L1",
            "PD-L2",
            "IDO",
            "Tregs",
            "Adenosine",
            "Galectin-1",
            "Galectin-3",
            "Galectin-9",
            "TIM-1",
            "TIM-2",
            "TIM-3",
            "TIM-4",
            "CD200",
            "CD200R",
            "B7-H3",
            "B7-H4"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TGF-beta (TGFB)",
                "IL-10 (IL10)",
                "IL-35",
                "TSLP",
                "GDF-15",
                "CTLA-4",
                "PD-1",
                "PD-L1",
                "PD-L2",
                "IDO",
                "Tregs",
                "Adenosine",
                "Galectin-1",
                "Galectin-3",
                "Galectin-9",
                "TIM-1",
                "TIM-2",
                "TIM-3",
                "TIM-4",
                "CD200",
                "CD200R",
                "B7-H3",
                "B7-H4"
            ],
            "mismatches": [],
            "true_referents": [
                "Adenosine",
                "B7-H3",
                "B7-H4",
                "CD200",
                "CD200R",
                "CTLA-4",
                "GDF-15",
                "Galectin-1",
                "Galectin-3",
                "Galectin-9",
                "IDO",
                "IL-10 (IL10)",
                "IL-35",
                "PD-1",
                "PD-L1",
                "PD-L2",
                "TGF-beta (TGFB)",
                "TIM-1",
                "TIM-2",
                "TIM-3",
                "TIM-4",
                "TSLP",
                "Tregs"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "anti-inflammatory cytokine",
        "domain": "biology",
        "response": [
            {
                "Referent": "Interleukin-10",
                "Canonical name": "IL-10"
            },
            {
                "Referent": "Interleukin-10 receptor",
                "Canonical name": "IL-10R"
            },
            {
                "Referent": "Interleukin-10 receptor alpha subunit",
                "Canonical name": "IL-10RA"
            },
            {
                "Referent": "Interleukin-10 receptor beta subunit",
                "Canonical name": "IL-10RB"
            },
            {
                "Referent": "Interleukin-10 receptor gamma subunit",
                "Canonical name": "IL-10RG"
            },
            {
                "Referent": "Interleukin-10 receptor delta subunit",
                "Canonical name": "IL-10RD"
            },
            {
                "Referent": "Interleukin-10 receptor subunit alpha",
                "Canonical name": "IL-10RA"
            },
            {
                "Referent": "Interleukin-10 receptor subunit beta",
                "Canonical name": "IL-10RB"
            },
            {
                "Referent": "Interleukin-10 receptor subunit gamma",
                "Canonical name": "IL-10RG"
            },
            {
                "Referent": "Interleukin-10 receptor subunit delta",
                "Canonical name": "IL-10RD"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-10",
                "Interleukin-10 receptor",
                "Interleukin-10 receptor alpha subunit",
                "Interleukin-10 receptor beta subunit",
                "Interleukin-10 receptor gamma subunit",
                "Interleukin-10 receptor delta subunit",
                "Interleukin-10 receptor subunit alpha",
                "Interleukin-10 receptor subunit beta",
                "Interleukin-10 receptor subunit gamma",
                "Interleukin-10 receptor subunit delta"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Interleukin-10 receptor alpha subunit\", \"Canonical name\": \"IL-10RA\"}",
                "{\"Referent\": \"Interleukin-10 receptor beta subunit\", \"Canonical name\": \"IL-10RB\"}",
                "{\"Referent\": \"Interleukin-10 receptor delta subunit\", \"Canonical name\": \"IL-10RD\"}",
                "{\"Referent\": \"Interleukin-10 receptor gamma subunit\", \"Canonical name\": \"IL-10RG\"}",
                "{\"Referent\": \"Interleukin-10 receptor subunit alpha\", \"Canonical name\": \"IL-10RA\"}",
                "{\"Referent\": \"Interleukin-10 receptor subunit beta\", \"Canonical name\": \"IL-10RB\"}",
                "{\"Referent\": \"Interleukin-10 receptor subunit delta\", \"Canonical name\": \"IL-10RD\"}",
                "{\"Referent\": \"Interleukin-10 receptor subunit gamma\", \"Canonical name\": \"IL-10RG\"}",
                "{\"Referent\": \"Interleukin-10 receptor\", \"Canonical name\": \"IL-10R\"}",
                "{\"Referent\": \"Interleukin-10\", \"Canonical name\": \"IL-10\"}"
            ],
            "TP": 10,
            "FP": 0,
            "FN": 0
        }
    }
]