[
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies",
            "Complementarity Determining Regions",
            "Catalytic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Catalytic Antibodies"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 3,
            "FP": 1,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Single-Chain Antibodies",
            "Antitoxins",
            "Anticardiolipin Antibodies",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin Gm Allotypes",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 4,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 7,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Complementarity Determining Regions",
            "Single-Chain Antibodies",
            "Immunoglobulin Idiotypes"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Complementarity Determining Regions",
                "Single-Chain Antibodies",
                "Immunoglobulin Idiotypes"
            ],
            "mismatches": [],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Hepatitis A Antibodies",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 4,
            "FP": 3,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 7,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Complementarity Determining Regions"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Complementarity Determining Regions"
            ],
            "mismatches": [],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 7
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 2,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains",
            "Complementarity Determining Regions"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 1,
            "FP": 6,
            "FN": 7
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Thyroid-Stimulating Immunoglobulins",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 6,
            "FP": 2,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 1,
            "FP": 5,
            "FN": 7
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 2,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "mismatches": [
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 2,
            "FP": 5,
            "FN": 6
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 2,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies",
            "Complementarity Determining Regions"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions"
            ],
            "mismatches": [],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Thyroid-Stimulating Immunoglobulins",
            "Single-Chain Antibodies",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin Idiotypes",
            "Anticardiolipin Antibodies",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Single-Chain Antibodies",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin Idiotypes",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 10,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin Idiotypes",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 4,
            "FP": 7,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Immunoglobulin J-Chains",
            "Hepatitis A Antibodies",
            "Immunoglobulin kappa-Chains",
            "Thyroid-Stimulating Immunoglobulins",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Immunoglobulin epsilon-Chains",
            "Tuftsin",
            "Immunoglobulin Idiotypes",
            "Anticardiolipin Antibodies",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Certolizumab Pegol",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains",
            "Inotuzumab Ozogamicin",
            "Catalytic Antibodies",
            "Secretory Component",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Inotuzumab Ozogamicin",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Single-Chain Antibodies",
                "Immunoglobulin epsilon-Chains",
                "Tuftsin",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Certolizumab Pegol",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains",
                "Secretory Component"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 7,
            "FP": 15,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "mismatches": [],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 6
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Thyroid-Stimulating Immunoglobulins",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Certolizumab Pegol",
            "Inotuzumab Ozogamicin",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Inotuzumab Ozogamicin",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Certolizumab Pegol"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 7,
            "FP": 3,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Immunoglobulin kappa-Chains",
            "Single-Chain Antibodies",
            "Immunoglobulin epsilon-Chains",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 3,
            "FP": 5,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Antineutrophil Cytoplasmic Antibodies",
            "Catalytic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Antineutrophil Cytoplasmic Antibodies",
                "Catalytic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 2,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains",
            "Secretory Component"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains",
                "Secretory Component"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 7,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies",
            "Complementarity Determining Regions",
            "Certolizumab Pegol",
            "Inotuzumab Ozogamicin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions",
                "Certolizumab Pegol"
            ],
            "mismatches": [
                "Inotuzumab Ozogamicin"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 4,
            "FP": 1,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Hepatitis A Antibodies",
            "Thyroid-Stimulating Immunoglobulins",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Single-Chain Antibodies"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 6,
            "FP": 3,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin Idiotypes",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains",
            "Secretory Component"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains",
                "Secretory Component"
            ],
            "mismatches": [
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions"
            ],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 8,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies",
            "Complementarity Determining Regions",
            "Catalytic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Catalytic Antibodies"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 3,
            "FP": 1,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Immunoglobulin Idiotypes",
            "Anticardiolipin Antibodies",
            "Complementarity Determining Regions",
            "Immunoglobulin Gm Allotypes",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Immunoglobulin Gm Allotypes"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 5,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin Idiotypes",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin mu-Chains"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin mu-Chains"
            ],
            "mismatches": [
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions"
            ],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 7,
            "FP": 2,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Single-Chain Antibodies",
            "Complementarity Determining Regions",
            "Catalytic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Catalytic Antibodies"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 3,
            "FP": 1,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Thyroid-Stimulating Immunoglobulins",
            "Antitoxins",
            "Single-Chain Antibodies",
            "Anticardiolipin Antibodies",
            "Complementarity Determining Regions",
            "Immunoglobulin gamma-Chains",
            "Certolizumab Pegol",
            "Immunoglobulin Gm Allotypes",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Single-Chain Antibodies",
                "Complementarity Determining Regions",
                "Immunoglobulin gamma-Chains",
                "Certolizumab Pegol",
                "Immunoglobulin Gm Allotypes"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 6,
            "FP": 6,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "CD4 Immunoadhesins",
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains",
            "Immunoglobulin Idiotypes",
            "Immunoglobulin Gm Allotypes"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin Gm Allotypes"
            ],
            "mismatches": [
                "CD4 Immunoadhesins",
                "Immunoglobulin Idiotypes"
            ],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 7,
            "FP": 2,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin Idiotypes",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains",
            "Immunoglobulin Gm Allotypes",
            "Immunoglobulin J-Chains",
            "Complementarity Determining Regions",
            "Immunoglobulin Fragments"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin Gm Allotypes",
                "Immunoglobulin Fragments"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 4,
            "FP": 8,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "Hepatitis A Antibodies",
            "Anticardiolipin Antibodies",
            "Immunoglobulin Idiotypes",
            "Certolizumab Pegol",
            "Inotuzumab Ozogamicin",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Anticardiolipin Antibodies",
                "Inotuzumab Ozogamicin",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Certolizumab Pegol"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 5,
            "FP": 3,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "Immunoglobulin Subunits",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains",
            "Immunoglobulin Gm Allotypes"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin Gm Allotypes"
            ],
            "mismatches": [],
            "true_referents": [
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin Gm Allotypes",
                "Secretory Component",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin mu-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains"
            ],
            "TP": 7,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "Immunoglobulin Fragments",
        "domain": "biology",
        "response": [
            "Immunoglobulin J-Chains",
            "Immunoglobulin kappa-Chains",
            "Immunoglobulin epsilon-Chains",
            "Immunoglobulin gamma-Chains",
            "Immunoglobulin lambda-Chains",
            "Immunoglobulin mu-Chains",
            "Complementarity Determining Regions"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Complementarity Determining Regions"
            ],
            "mismatches": [
                "Immunoglobulin J-Chains",
                "Immunoglobulin kappa-Chains",
                "Immunoglobulin epsilon-Chains",
                "Immunoglobulin gamma-Chains",
                "Immunoglobulin lambda-Chains",
                "Immunoglobulin mu-Chains"
            ],
            "true_referents": [
                "Single-Chain Antibodies",
                "Certolizumab Pegol",
                "Tuftsin",
                "Single-Domain Antibodies",
                "Immunoglobulin Idiotypes",
                "Complementarity Determining Regions",
                "Etanercept",
                "CD4 Immunoadhesins"
            ],
            "TP": 1,
            "FP": 6,
            "FN": 7
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "Antibodies",
        "domain": "biology",
        "response": [
            "Single-Domain Antibodies",
            "CD4 Immunoadhesins",
            "Hepatitis A Antibodies",
            "Thyroid-Stimulating Immunoglobulins",
            "Etanercept",
            "Single-Chain Antibodies",
            "Antitoxins",
            "Anticardiolipin Antibodies",
            "Catalytic Antibodies",
            "Antineutrophil Cytoplasmic Antibodies",
            "Certolizumab Pegol",
            "Inotuzumab Ozogamicin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Antitoxins",
                "Anticardiolipin Antibodies",
                "Catalytic Antibodies",
                "Antineutrophil Cytoplasmic Antibodies",
                "Inotuzumab Ozogamicin"
            ],
            "mismatches": [
                "Single-Domain Antibodies",
                "CD4 Immunoadhesins",
                "Etanercept",
                "Single-Chain Antibodies",
                "Certolizumab Pegol"
            ],
            "true_referents": [
                "Catalytic Antibodies",
                "Anticardiolipin Antibodies",
                "Hepatitis A Antibodies",
                "Thyroid-Stimulating Immunoglobulins",
                "Inotuzumab Ozogamicin",
                "Antineutrophil Cytoplasmic Antibodies",
                "Long-Acting Thyroid Stimulator",
                "Antitoxins"
            ],
            "TP": 7,
            "FP": 5,
            "FN": 1
        }
    }
]