[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Interleukin-17 (IL-17)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-10 (IL-10)",
            "Interleukin-13 (IL-13)",
            "Interleukin-22 (IL-22)",
            "Interleukin-33 (IL-33)",
            "Interleukin-35 (IL-35)",
            "Interleukin-37 (IL-37)",
            "Interleukin-38 (IL-38)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Interleukin-17 (IL-17)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-10 (IL-10)",
                "Interleukin-13 (IL-13)",
                "Interleukin-22 (IL-22)",
                "Interleukin-33 (IL-33)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)"
            ],
            "mismatches": [],
            "true_referents": [
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-33 (IL-33)",
                "Interleukin-35 (IL-35)",
                "Interleukin-37 (IL-37)",
                "Interleukin-38 (IL-38)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Interferon-gamma (IFN-\u03b3)",
            "Interleukin-8 (IL-8)",
            "Interleukin-17 (IL-17)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-33 (IL-33)",
            "Interleukin-37 (IL-37)",
            "Macrophage Migration Inhibitory Factor (MIF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Fms-like Tyrosine Kinase 3 Ligand (FLK3L or FLT3L)",
            "Interleukin-27 (IL-27)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-8 (IL-8)",
                "Interleukin-17 (IL-17)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-33 (IL-33)",
                "Interleukin-37 (IL-37)",
                "Macrophage Migration Inhibitory Factor (MIF)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Fms-like Tyrosine Kinase 3 Ligand (FLK3L or FLT3L)",
                "Interleukin-27 (IL-27)"
            ],
            "mismatches": [],
            "true_referents": [
                "Fms-like Tyrosine Kinase 3 Ligand (FLK3L or FLT3L)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-37 (IL-37)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Macrophage Migration Inhibitory Factor (MIF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-3 (IL-3)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-7 (IL-7)",
            "Interleukin-8 (IL-8)",
            "Interleukin-9 (IL-9)",
            "Interleukin-10 (IL-10)",
            "Interleukin-11 (IL-11)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-14 (IL-14)",
            "Interleukin-15 (IL-15)",
            "Interleukin-16 (IL-16)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-21 (IL-21)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Tumor Necrosis Factor-beta (TNF-\u03b2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-3 (IL-3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-14 (IL-14)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interferon-gamma (IFN-\u03b3)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Tumor Necrosis Factor-beta (TNF-\u03b2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-14 (IL-14)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-3 (IL-3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Tumor Necrosis Factor-beta (TNF-\u03b2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-12 (IL-12)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Platelet-Derived Growth Factor (PDGF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Chemokine (C-C motif) ligand 5 (CCL5)",
            "Lymphotoxin-alpha (LT-\u03b1)",
            "Lymphotoxin-beta (LT-\u03b2)",
            "B cell activating factor (BAFF)",
            "A proliferation-inducing ligand (APRIL)",
            "Interleukin-17A (IL-17A)",
            "Interleukin-18 (IL-18)",
            "Interleukin-23 (IL-23)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-12 (IL-12)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Chemokine (C-C motif) ligand 5 (CCL5)",
                "Lymphotoxin-alpha (LT-\u03b1)",
                "Lymphotoxin-beta (LT-\u03b2)",
                "B cell activating factor (BAFF)",
                "A proliferation-inducing ligand (APRIL)",
                "Interleukin-17A (IL-17A)",
                "Interleukin-18 (IL-18)",
                "Interleukin-23 (IL-23)"
            ],
            "mismatches": [],
            "true_referents": [
                "A proliferation-inducing ligand (APRIL)",
                "B cell activating factor (BAFF)",
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Chemokine (C-C motif) ligand 5 (CCL5)",
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17A (IL-17A)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-23 (IL-23)",
                "Interleukin-6 (IL-6)",
                "Lymphotoxin-alpha (LT-\u03b1)",
                "Lymphotoxin-beta (LT-\u03b2)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-10 (IL-10)",
            "Interleukin-13 (IL-13)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Interleukin-7 (IL-7)",
            "Interleukin-9 (IL-9)",
            "Interleukin-22 (IL-22)",
            "Interleukin-27 (IL-27)",
            "Interleukin-33 (IL-33)",
            "Interleukin-36 (IL-36)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Interferon-gamma (IFN-\u03b3)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-10 (IL-10)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interleukin-7 (IL-7)",
                "Interleukin-9 (IL-9)",
                "Interleukin-22 (IL-22)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-36 (IL-36)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-36 (IL-36)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-9 (IL-9)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-12 (IL-12)",
            "Interleukin-17 (IL-17)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Interleukin-4 (IL-4)",
            "Interleukin-10 (IL-10)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Interleukin-27 (IL-27)",
            "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
            "Macrophage inflammatory protein-1 alpha (MIP-1\u03b1)",
            "Chemokine (C-C motif) ligand 5 (CCL5/RANTES)",
            "Interleukin-3 (IL-3)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Interleukin-9 (IL-9)",
            "Interleukin-13 (IL-13)",
            "Interleukin-8 (IL-8)",
            "Platelet-derived growth factor (PDGF)",
            "Chemokine (C-X-C motif) ligand 10 (CXCL10/IP-10)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-10 (IL-10)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
                "Macrophage inflammatory protein-1 alpha (MIP-1\u03b1)",
                "Chemokine (C-C motif) ligand 5 (CCL5/RANTES)",
                "Interleukin-3 (IL-3)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Interleukin-9 (IL-9)",
                "Interleukin-13 (IL-13)",
                "Interleukin-8 (IL-8)",
                "Platelet-derived growth factor (PDGF)"
            ],
            "mismatches": [
                "Chemokine (C-X-C motif) ligand 10 (CXCL10/IP-10)"
            ],
            "true_referents": [
                "Chemokine (C-C motif) ligand 5 (CCL5/RANTES)",
                "Granulocyte-macrophage colony-stimulating factor (GM-CSF)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-3 (IL-3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Macrophage inflammatory protein-1 alpha (MIP-1\u03b1)",
                "Platelet-derived growth factor (PDGF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interferon-gamma (IFN-\u03b3)",
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-8 (IL-8)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-21 (IL-21)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-27 (IL-27)",
            "Interleukin-33 (IL-33)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Transforming Growth Factor-beta (TGF-\u03b2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Transforming Growth Factor-beta (TGF-\u03b2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interleukin-12 (IL-12)",
            "Interleukin-18 (IL-18)",
            "Tumor Necrosis Factor-alpha (TNF-alpha)",
            "Tumor Necrosis Factor-beta (TNF-beta)",
            "Interferon-gamma (IFN-gamma)",
            "Interferon-alpha (IFN-alpha)",
            "Interferon-beta (IFN-beta)",
            "Interferon-lambda (IFN-lambda)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Transforming Growth Factor-beta (TGF-beta)",
            "Epidermal Growth Factor (EGF)",
            "Fibroblast Growth Factor (FGF)",
            "Platelet-Derived Growth Factor (PDGF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Insulin-like Growth Factor (IGF)",
            "Nerve Growth Factor (NGF)",
            "Hepatocyte Growth Factor (HGF)",
            "Keratinocyte Growth Factor (KGF)",
            "Leukemia Inhibitory Factor (LIF)",
            "Colony-Stimulating Factor-1 (CSF-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interleukin-12 (IL-12)",
                "Interleukin-18 (IL-18)",
                "Tumor Necrosis Factor-alpha (TNF-alpha)",
                "Tumor Necrosis Factor-beta (TNF-beta)",
                "Interferon-gamma (IFN-gamma)",
                "Interferon-alpha (IFN-alpha)",
                "Interferon-beta (IFN-beta)",
                "Interferon-lambda (IFN-lambda)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Transforming Growth Factor-beta (TGF-beta)",
                "Epidermal Growth Factor (EGF)",
                "Fibroblast Growth Factor (FGF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Insulin-like Growth Factor (IGF)",
                "Nerve Growth Factor (NGF)",
                "Hepatocyte Growth Factor (HGF)",
                "Keratinocyte Growth Factor (KGF)",
                "Leukemia Inhibitory Factor (LIF)",
                "Colony-Stimulating Factor-1 (CSF-1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Colony-Stimulating Factor-1 (CSF-1)",
                "Epidermal Growth Factor (EGF)",
                "Fibroblast Growth Factor (FGF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Hepatocyte Growth Factor (HGF)",
                "Insulin-like Growth Factor (IGF)",
                "Interferon-alpha (IFN-alpha)",
                "Interferon-beta (IFN-beta)",
                "Interferon-gamma (IFN-gamma)",
                "Interferon-lambda (IFN-lambda)",
                "Interleukin-1 (IL-1)",
                "Interleukin-12 (IL-12)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Keratinocyte Growth Factor (KGF)",
                "Leukemia Inhibitory Factor (LIF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Nerve Growth Factor (NGF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Transforming Growth Factor-beta (TGF-beta)",
                "Tumor Necrosis Factor-alpha (TNF-alpha)",
                "Tumor Necrosis Factor-beta (TNF-beta)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-7 (IL-7)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-17 (IL-17)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Interferon-beta (IFN-\u03b2)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Colony Stimulating Factor 1 (CSF1)",
            "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
            "Chemokine (C-C motif) ligand 2 (CCL2)",
            "Chemokine (C-C motif) ligand 5 (CCL5)",
            "Chemokine (C-X-C motif) ligand 10 (CXCL10)",
            "Chemokine (C-C motif) ligand 3 (CCL3)",
            "Chemokine (C-X3-C motif) ligand 1 (CX3CL1)",
            "Chemokine (C-C motif) ligand 7 (CCL7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interferon-beta (IFN-\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Colony Stimulating Factor 1 (CSF1)",
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Chemokine (C-C motif) ligand 5 (CCL5)",
                "Chemokine (C-X-C motif) ligand 10 (CXCL10)",
                "Chemokine (C-C motif) ligand 3 (CCL3)",
                "Chemokine (C-X3-C motif) ligand 1 (CX3CL1)",
                "Chemokine (C-C motif) ligand 7 (CCL7)"
            ],
            "mismatches": [],
            "true_referents": [
                "Chemokine (C-C motif) ligand 2 (CCL2)",
                "Chemokine (C-C motif) ligand 3 (CCL3)",
                "Chemokine (C-C motif) ligand 5 (CCL5)",
                "Chemokine (C-C motif) ligand 7 (CCL7)",
                "Chemokine (C-X-C motif) ligand 10 (CXCL10)",
                "Chemokine (C-X-C motif) ligand 8 (CXCL8)",
                "Chemokine (C-X3-C motif) ligand 1 (CX3CL1)",
                "Colony Stimulating Factor 1 (CSF1)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interferon-gamma (IFN-\u03b3)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Interleukin-12 (IL-12)",
            "Interleukin-18 (IL-18)",
            "Interleukin-23 (IL-23)",
            "Interleukin-17 (IL-17)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "C-C Motif Chemokine Ligand 2 (CCL2)",
            "C-X-C Motif Chemokine Ligand 8 (CXCL8)",
            "Interleukin-15 (IL-15)",
            "Interleukin-21 (IL-21)",
            "Interleukin-33 (IL-33)",
            "Thymic Stromal Lymphopoietin (TSLP)",
            "Interleukin-7 (IL-7)",
            "Interleukin-9 (IL-9)",
            "Interleukin-22 (IL-22)",
            "Interleukin-25 (IL-25)",
            "Interleukin-27 (IL-27)",
            "Interleukin-35 (IL-35)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interferon-gamma (IFN-\u03b3)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interleukin-12 (IL-12)",
                "Interleukin-18 (IL-18)",
                "Interleukin-23 (IL-23)",
                "Interleukin-17 (IL-17)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "C-C Motif Chemokine Ligand 2 (CCL2)",
                "C-X-C Motif Chemokine Ligand 8 (CXCL8)",
                "Interleukin-15 (IL-15)",
                "Interleukin-21 (IL-21)",
                "Interleukin-33 (IL-33)",
                "Thymic Stromal Lymphopoietin (TSLP)",
                "Interleukin-7 (IL-7)",
                "Interleukin-9 (IL-9)",
                "Interleukin-22 (IL-22)",
                "Interleukin-25 (IL-25)",
                "Interleukin-27 (IL-27)",
                "Interleukin-35 (IL-35)"
            ],
            "mismatches": [],
            "true_referents": [
                "C-C Motif Chemokine Ligand 2 (CCL2)",
                "C-X-C Motif Chemokine Ligand 8 (CXCL8)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-25 (IL-25)",
                "Interleukin-27 (IL-27)",
                "Interleukin-33 (IL-33)",
                "Interleukin-35 (IL-35)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-9 (IL-9)",
                "Thymic Stromal Lymphopoietin (TSLP)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-7 (IL-7)",
            "Interleukin-8 (IL-8)",
            "Interleukin-10 (IL-10)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-15 (IL-15)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-21 (IL-21)",
            "Interleukin-23 (IL-23)",
            "Tumor Necrosis Factor (TNF)",
            "Interferon-alpha (IFN-\u03b1)",
            "Interferon-beta (IFN-\u03b2)",
            "Interferon-gamma (IFN-\u03b3)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Macrophage Inflammatory Protein-1 (MIP-1)",
            "Monocyte Chemoattractant Protein-1 (MCP-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Tumor Necrosis Factor (TNF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Macrophage Inflammatory Protein-1 (MIP-1)",
                "Monocyte Chemoattractant Protein-1 (MCP-1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-alpha (IFN-\u03b1)",
                "Interferon-beta (IFN-\u03b2)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-21 (IL-21)",
                "Interleukin-23 (IL-23)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Macrophage Inflammatory Protein-1 (MIP-1)",
                "Monocyte Chemoattractant Protein-1 (MCP-1)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor Necrosis Factor (TNF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-3 (IL-3)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-6 (IL-6)",
            "Interleukin-7 (IL-7)",
            "Interleukin-8 (IL-8)",
            "Interleukin-9 (IL-9)",
            "Interleukin-10 (IL-10)",
            "Interleukin-11 (IL-11)",
            "Interleukin-12 (IL-12)",
            "Interleukin-13 (IL-13)",
            "Interleukin-14 (IL-14)",
            "Interleukin-15 (IL-15)",
            "Interleukin-16 (IL-16)",
            "Interleukin-17 (IL-17)",
            "Interleukin-18 (IL-18)",
            "Interleukin-19 (IL-19)",
            "Interleukin-20 (IL-20)",
            "Interleukin-21 (IL-21)",
            "Interleukin-22 (IL-22)",
            "Interleukin-23 (IL-23)",
            "Interleukin-24 (IL-24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-3 (IL-3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-14 (IL-14)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-19 (IL-19)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)"
            ],
            "mismatches": [
                "Interleukin-24 (IL-24)"
            ],
            "true_referents": [
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-11 (IL-11)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-14 (IL-14)",
                "Interleukin-15 (IL-15)",
                "Interleukin-16 (IL-16)",
                "Interleukin-17 (IL-17)",
                "Interleukin-18 (IL-18)",
                "Interleukin-19 (IL-19)",
                "Interleukin-2 (IL-2)",
                "Interleukin-20 (IL-20)",
                "Interleukin-21 (IL-21)",
                "Interleukin-22 (IL-22)",
                "Interleukin-23 (IL-23)",
                "Interleukin-24 (IL-24)",
                "Interleukin-3 (IL-3)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-7 (IL-7)",
                "Interleukin-8 (IL-8)",
                "Interleukin-9 (IL-9)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 (IL-1)",
            "Interleukin-2 (IL-2)",
            "Interleukin-6 (IL-6)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Interleukin-12 (IL-12)",
            "Interleukin-15 (IL-15)",
            "Interleukin-18 (IL-18)",
            "Interleukin-23 (IL-23)",
            "Transforming Growth Factor-beta (TGF-\u03b2)",
            "Macrophage Inflammatory Protein-1 (MIP-1)",
            "Regulated on Activation, Normal T Expressed and Secreted (RANTES)",
            "Monocyte Chemoattractant Protein-1 (MCP-1)",
            "Interleukin-8 (IL-8)",
            "Interleukin-4 (IL-4)",
            "Interleukin-5 (IL-5)",
            "Interleukin-10 (IL-10)",
            "Interleukin-13 (IL-13)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Colony-Stimulating Factor (M-CSF)",
            "Vascular Endothelial Growth Factor (VEGF)",
            "Platelet-Derived Growth Factor (PDGF)",
            "Fibroblast Growth Factor (FGF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 (IL-1)",
                "Interleukin-2 (IL-2)",
                "Interleukin-6 (IL-6)",
                "Interferon-gamma (IFN-\u03b3)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interleukin-12 (IL-12)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Interleukin-23 (IL-23)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Macrophage Inflammatory Protein-1 (MIP-1)",
                "Regulated on Activation, Normal T Expressed and Secreted (RANTES)",
                "Monocyte Chemoattractant Protein-1 (MCP-1)",
                "Interleukin-8 (IL-8)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-10 (IL-10)",
                "Interleukin-13 (IL-13)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Vascular Endothelial Growth Factor (VEGF)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Fibroblast Growth Factor (FGF)"
            ],
            "mismatches": [],
            "true_referents": [
                "Fibroblast Growth Factor (FGF)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 (IL-1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-13 (IL-13)",
                "Interleukin-15 (IL-15)",
                "Interleukin-18 (IL-18)",
                "Interleukin-2 (IL-2)",
                "Interleukin-23 (IL-23)",
                "Interleukin-4 (IL-4)",
                "Interleukin-5 (IL-5)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "Macrophage Colony-Stimulating Factor (M-CSF)",
                "Macrophage Inflammatory Protein-1 (MIP-1)",
                "Monocyte Chemoattractant Protein-1 (MCP-1)",
                "Platelet-Derived Growth Factor (PDGF)",
                "Regulated on Activation, Normal T Expressed and Secreted (RANTES)",
                "Transforming Growth Factor-beta (TGF-\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Vascular Endothelial Growth Factor (VEGF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin-1 beta (IL-1\u03b2)",
            "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
            "Interleukin-6 (IL-6)",
            "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
            "Interleukin-12 (IL-12)",
            "Interferon-gamma (IFN-\u03b3)",
            "Tumor Necrosis Factor-beta (TNF-\u03b2)",
            "Interleukin-2 (IL-2)",
            "Interleukin-8 (IL-8)",
            "Granulocyte Colony-Stimulating Factor (G-CSF)",
            "Macrophage Inflammatory Protein-1 alpha (MIP-1\u03b1)",
            "Interleukin-10 (IL-10)",
            "Interleukin-17 (IL-17)",
            "Interleukin-23 (IL-23)",
            "Interleukin-27 (IL-27)",
            "Interleukin-31 (IL-31)",
            "Interleukin-33 (IL-33)",
            "Tumor Necrosis Factor-like Weak Inducer of Apoptosis (TWEAK)",
            "Fibroblast Growth Factor-basic (FGF-b)",
            "Eotaxin",
            "MCP-1 (Monocyte Chemoattractant Protein-1)",
            "RANTES (Regulated on Activation, Normal T cell Expressed and Secreted)",
            "MIP-1\u03b2 (Macrophage Inflammatory Protein-1 beta)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin-1 beta (IL-1\u03b2)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Interleukin-6 (IL-6)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interleukin-12 (IL-12)",
                "Interferon-gamma (IFN-\u03b3)",
                "Tumor Necrosis Factor-beta (TNF-\u03b2)",
                "Interleukin-2 (IL-2)",
                "Interleukin-8 (IL-8)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Macrophage Inflammatory Protein-1 alpha (MIP-1\u03b1)",
                "Interleukin-10 (IL-10)",
                "Interleukin-17 (IL-17)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-31 (IL-31)",
                "Interleukin-33 (IL-33)",
                "Tumor Necrosis Factor-like Weak Inducer of Apoptosis (TWEAK)",
                "Fibroblast Growth Factor-basic (FGF-b)",
                "Eotaxin",
                "MCP-1 (Monocyte Chemoattractant Protein-1)",
                "RANTES (Regulated on Activation, Normal T cell Expressed and Secreted)",
                "MIP-1\u03b2 (Macrophage Inflammatory Protein-1 beta)"
            ],
            "mismatches": [],
            "true_referents": [
                "Eotaxin",
                "Fibroblast Growth Factor-basic (FGF-b)",
                "Granulocyte Colony-Stimulating Factor (G-CSF)",
                "Granulocyte-Macrophage Colony-Stimulating Factor (GM-CSF)",
                "Interferon-gamma (IFN-\u03b3)",
                "Interleukin-1 beta (IL-1\u03b2)",
                "Interleukin-10 (IL-10)",
                "Interleukin-12 (IL-12)",
                "Interleukin-17 (IL-17)",
                "Interleukin-2 (IL-2)",
                "Interleukin-23 (IL-23)",
                "Interleukin-27 (IL-27)",
                "Interleukin-31 (IL-31)",
                "Interleukin-33 (IL-33)",
                "Interleukin-6 (IL-6)",
                "Interleukin-8 (IL-8)",
                "MCP-1 (Monocyte Chemoattractant Protein-1)",
                "MIP-1\u03b2 (Macrophage Inflammatory Protein-1 beta)",
                "Macrophage Inflammatory Protein-1 alpha (MIP-1\u03b1)",
                "RANTES (Regulated on Activation, Normal T cell Expressed and Secreted)",
                "Tumor Necrosis Factor-alpha (TNF-\u03b1)",
                "Tumor Necrosis Factor-beta (TNF-\u03b2)",
                "Tumor Necrosis Factor-like Weak Inducer of Apoptosis (TWEAK)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            "Interleukin 1 alpha (IL1A)",
            "Interleukin 1 beta (IL1B)",
            "Interleukin 2 (IL2)",
            "Interleukin 3 (IL3)",
            "Interleukin 4 (IL4)",
            "Interleukin 5 (IL5)",
            "Interleukin 6 (IL6)",
            "Interleukin 7 (IL7)",
            "Interleukin 8 (IL8)",
            "Interleukin 9 (IL9)",
            "Interleukin 10 (IL10)",
            "Interleukin 11 (IL11)",
            "Interleukin 12 (IL12)",
            "Interleukin 13 (IL13)",
            "Interleukin 15 (IL15)",
            "Interleukin 16 (IL16)",
            "Interleukin 17A (IL17A)",
            "Interleukin 17B (IL17B)",
            "Interleukin 17C (IL17C)",
            "Interleukin 17D (IL17D)",
            "Interleukin 17E (IL17E)",
            "Interleukin 17F (IL17F)",
            "Granulocyte-colony stimulating factor (G-CSF)",
            "Granulocyte macrophage-colony stimulating factor (GM-CSF)",
            "Tumor necrosis factor alpha (TNF-alpha)",
            "Lymphotactin (XCL1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin 1 alpha (IL1A)",
                "Interleukin 1 beta (IL1B)",
                "Interleukin 2 (IL2)",
                "Interleukin 3 (IL3)",
                "Interleukin 4 (IL4)",
                "Interleukin 5 (IL5)",
                "Interleukin 6 (IL6)",
                "Interleukin 7 (IL7)",
                "Interleukin 8 (IL8)",
                "Interleukin 9 (IL9)",
                "Interleukin 10 (IL10)",
                "Interleukin 11 (IL11)",
                "Interleukin 12 (IL12)",
                "Interleukin 13 (IL13)",
                "Interleukin 15 (IL15)",
                "Interleukin 16 (IL16)",
                "Interleukin 17A (IL17A)",
                "Interleukin 17B (IL17B)",
                "Interleukin 17C (IL17C)",
                "Interleukin 17D (IL17D)",
                "Interleukin 17E (IL17E)",
                "Interleukin 17F (IL17F)",
                "Granulocyte-colony stimulating factor (G-CSF)",
                "Granulocyte macrophage-colony stimulating factor (GM-CSF)"
            ],
            "mismatches": [
                "Tumor necrosis factor alpha (TNF-alpha)",
                "Lymphotactin (XCL1)"
            ],
            "true_referents": [
                "Granulocyte macrophage-colony stimulating factor (GM-CSF)",
                "Granulocyte-colony stimulating factor (G-CSF)",
                "Interleukin 1 alpha (IL1A)",
                "Interleukin 1 beta (IL1B)",
                "Interleukin 10 (IL10)",
                "Interleukin 11 (IL11)",
                "Interleukin 12 (IL12)",
                "Interleukin 13 (IL13)",
                "Interleukin 15 (IL15)",
                "Interleukin 16 (IL16)",
                "Interleukin 17A (IL17A)",
                "Interleukin 17B (IL17B)",
                "Interleukin 17C (IL17C)",
                "Interleukin 17D (IL17D)",
                "Interleukin 17E (IL17E)",
                "Interleukin 17F (IL17F)",
                "Interleukin 2 (IL2)",
                "Interleukin 3 (IL3)",
                "Interleukin 4 (IL4)",
                "Interleukin 5 (IL5)",
                "Interleukin 6 (IL6)",
                "Interleukin 7 (IL7)",
                "Interleukin 8 (IL8)",
                "Interleukin 9 (IL9)"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "pro-inflammatory cytokine",
        "domain": "biology",
        "response": [
            {
                "Referent": "Interleukin 2",
                "Canonical Name": "IL-2"
            },
            {
                "Referent": "Interleukin 4",
                "Canonical Name": "IL-4"
            },
            {
                "Referent": "Interleukin 6",
                "Canonical Name": "IL-6"
            },
            {
                "Referent": "Interleukin 7",
                "Canonical Name": "IL-7"
            },
            {
                "Referent": "Interleukin 8",
                "Canonical Name": "IL-8"
            },
            {
                "Referent": "Interleukin 10",
                "Canonical Name": "IL-10"
            },
            {
                "Referent": "Interleukin 11",
                "Canonical Name": "IL-11"
            },
            {
                "Referent": "Interleukin 12",
                "Canonical Name": "IL-12"
            },
            {
                "Referent": "Interleukin 13",
                "Canonical Name": "IL-13"
            },
            {
                "Referent": "Interleukin 15",
                "Canonical Name": "IL-15"
            },
            {
                "Referent": "Interleukin 17",
                "Canonical Name": "IL-17"
            },
            {
                "Referent": "Interleukin 18",
                "Canonical Name": "IL-18"
            },
            {
                "Referent": "Interleukin 19",
                "Canonical Name": "IL-19"
            },
            {
                "Referent": "Interleukin 20",
                "Canonical Name": "IL-20"
            },
            {
                "Referent": "Interleukin 21",
                "Canonical Name": "IL-21"
            },
            {
                "Referent": "Interleukin 22",
                "Canonical Name": "IL-22"
            },
            {
                "Referent": "Interleukin 23",
                "Canonical Name": "IL-23"
            },
            {
                "Referent": "Interleukin 24",
                "Canonical Name": "IL-24"
            },
            {
                "Referent": "Interleukin 25",
                "Canonical Name": "IL-25"
            },
            {
                "Referent": "Interleukin 26",
                "Canonical Name": "IL-26"
            },
            {
                "Referent": "Interleukin 27",
                "Canonical Name": "IL-27"
            },
            {
                "Referent": "Interleukin 28",
                "Canonical Name": "IL-28"
            },
            {
                "Referent": "Interleukin 29",
                "Canonical Name": "IL-29"
            },
            {
                "Referent": "Interleukin 30",
                "Canonical Name": "IL-30"
            },
            {
                "Referent": "Interleukin 31",
                "Canonical Name": "IL-31"
            },
            {
                "Referent": "Interleukin 32",
                "Canonical Name": "IL-32"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Interleukin 2",
                "Interleukin 4",
                "Interleukin 6",
                "Interleukin 7",
                "Interleukin 8",
                "Interleukin 10",
                "Interleukin 11",
                "Interleukin 12",
                "Interleukin 13",
                "Interleukin 15",
                "Interleukin 17",
                "Interleukin 18",
                "Interleukin 19",
                "Interleukin 20",
                "Interleukin 21",
                "Interleukin 22",
                "Interleukin 23",
                "Interleukin 24",
                "Interleukin 25",
                "Interleukin 26",
                "Interleukin 27",
                "Interleukin 28",
                "Interleukin 29",
                "Interleukin 30"
            ],
            "mismatches": [
                "Interleukin 31",
                "Interleukin 32"
            ],
            "true_referents": [
                "{\"Referent\": \"Interleukin 10\", \"Canonical Name\": \"IL-10\"}",
                "{\"Referent\": \"Interleukin 11\", \"Canonical Name\": \"IL-11\"}",
                "{\"Referent\": \"Interleukin 12\", \"Canonical Name\": \"IL-12\"}",
                "{\"Referent\": \"Interleukin 13\", \"Canonical Name\": \"IL-13\"}",
                "{\"Referent\": \"Interleukin 15\", \"Canonical Name\": \"IL-15\"}",
                "{\"Referent\": \"Interleukin 17\", \"Canonical Name\": \"IL-17\"}",
                "{\"Referent\": \"Interleukin 18\", \"Canonical Name\": \"IL-18\"}",
                "{\"Referent\": \"Interleukin 19\", \"Canonical Name\": \"IL-19\"}",
                "{\"Referent\": \"Interleukin 2\", \"Canonical Name\": \"IL-2\"}",
                "{\"Referent\": \"Interleukin 20\", \"Canonical Name\": \"IL-20\"}",
                "{\"Referent\": \"Interleukin 21\", \"Canonical Name\": \"IL-21\"}",
                "{\"Referent\": \"Interleukin 22\", \"Canonical Name\": \"IL-22\"}",
                "{\"Referent\": \"Interleukin 23\", \"Canonical Name\": \"IL-23\"}",
                "{\"Referent\": \"Interleukin 24\", \"Canonical Name\": \"IL-24\"}",
                "{\"Referent\": \"Interleukin 25\", \"Canonical Name\": \"IL-25\"}",
                "{\"Referent\": \"Interleukin 26\", \"Canonical Name\": \"IL-26\"}",
                "{\"Referent\": \"Interleukin 27\", \"Canonical Name\": \"IL-27\"}",
                "{\"Referent\": \"Interleukin 28\", \"Canonical Name\": \"IL-28\"}",
                "{\"Referent\": \"Interleukin 29\", \"Canonical Name\": \"IL-29\"}",
                "{\"Referent\": \"Interleukin 30\", \"Canonical Name\": \"IL-30\"}",
                "{\"Referent\": \"Interleukin 4\", \"Canonical Name\": \"IL-4\"}",
                "{\"Referent\": \"Interleukin 6\", \"Canonical Name\": \"IL-6\"}",
                "{\"Referent\": \"Interleukin 7\", \"Canonical Name\": \"IL-7\"}",
                "{\"Referent\": \"Interleukin 8\", \"Canonical Name\": \"IL-8\"}"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    }
]