[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Acetylcholine receptor (AChR)",
            "Adenosine A1 receptor (A1R)",
            "Adenosine A2A receptor (A2AR)",
            "Adenosine A2B receptor (A2BR)",
            "Adenosine A3 receptor (A3R)",
            "Adrenergic \u03b11 receptor (\u03b11AR)",
            "Adrenergic \u03b12 receptor (\u03b12AR)",
            "Adrenergic \u03b21 receptor (\u03b21AR)",
            "Adrenergic \u03b22 receptor (\u03b22AR)",
            "Dopamine D1 receptor (D1R)",
            "Dopamine D2 receptor (D2R)",
            "Dopamine D3 receptor (D3R)",
            "Dopamine D4 receptor (D4R)",
            "Dopamine D5 receptor (D5R)",
            "GABA A receptor (GABAA)",
            "GABA B receptor (GABAB)",
            "Glutamate AMPA receptor (AMPAR)",
            "Glutamate kainate receptor (KAR)",
            "Glutamate NMDA receptor (NMDAR)",
            "Histamine H1 receptor (H1R)",
            "Histamine H2 receptor (H2R)",
            "Histamine H3 receptor (H3R)",
            "Serotonin 5-HT1A receptor (5-HT1AR)",
            "Serotonin 5-HT2A receptor (5-HT2AR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adenosine A1 receptor (A1R)",
                "Adenosine A2A receptor (A2AR)",
                "Adenosine A2B receptor (A2BR)",
                "Adenosine A3 receptor (A3R)",
                "Adrenergic \u03b11 receptor (\u03b11AR)",
                "Adrenergic \u03b12 receptor (\u03b12AR)",
                "Adrenergic \u03b21 receptor (\u03b21AR)",
                "Adrenergic \u03b22 receptor (\u03b22AR)",
                "Dopamine D1 receptor (D1R)",
                "Dopamine D2 receptor (D2R)",
                "Dopamine D3 receptor (D3R)",
                "Dopamine D4 receptor (D4R)",
                "Dopamine D5 receptor (D5R)",
                "GABA A receptor (GABAA)",
                "GABA B receptor (GABAB)",
                "Glutamate AMPA receptor (AMPAR)",
                "Glutamate kainate receptor (KAR)",
                "Glutamate NMDA receptor (NMDAR)",
                "Histamine H1 receptor (H1R)",
                "Histamine H2 receptor (H2R)",
                "Histamine H3 receptor (H3R)",
                "Serotonin 5-HT1A receptor (5-HT1AR)",
                "Serotonin 5-HT2A receptor (5-HT2AR)"
            ],
            "mismatches": [
                "Acetylcholine receptor (AChR)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D3 dopamine receptor",
                "D4 dopamine receptor",
                "D5 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "adenosine A2B receptor",
                "adenosine A3 receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine H3 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "nicotinic receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Acetylcholine receptor (AChR)",
            "Dopamine receptor (DR)",
            "Serotonin receptor (5-HT receptor)",
            "Gamma-aminobutyric acid receptor (GABA receptor)",
            "Glutamate receptor (GluR)",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Muscarinic acetylcholine receptor (mAChR)",
            "NMDA receptor (N-methyl-D-aspartate receptor)",
            "AMPA receptor (\u03b1-amino-3-hydroxy-5-methyl-4-isoxazolepropionic acid receptor)",
            "Kainate receptor (KA receptor)",
            "Glycine receptor (GlyR)",
            "Adenosine receptor (AdoR)",
            "Opioid receptor (OR)",
            "Histamine receptor (H1, H2, H3, H4 receptors)",
            "Adrenergic receptor (\u03b1, \u03b2-adrenergic receptors)",
            "Serotonin 5-HT1A receptor",
            "Serotonin 5-HT2A receptor",
            "Dopamine D1 receptor",
            "Dopamine D2 receptor",
            "GABA-A receptor",
            "GABA-B receptor",
            "Metabotropic glutamate receptor (mGluR)",
            "Purinergic receptor (P2X, P2Y receptors)",
            "Neurokinin receptor (NK1, NK2, NK3 receptors)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "dopamine receptor",
                "serotonin receptor",
                "GABA receptor",
                "glutamate receptor",
                "nicotinic receptor",
                "muscarinic receptor",
                "N-methyl-D-aspartate receptor",
                "AMPA receptor",
                "kainic acid receptor",
                "glycine receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adrenergic receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2A receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "metabotropic glutamate receptor",
                "purinergic receptor",
                "neurokinin-1 receptor",
                "neurokinin-2 receptor",
                "neurokinin-3 receptor"
            ],
            "mismatches": [
                "Acetylcholine receptor (AChR)",
                "Muscarinic acetylcholine receptor (mAChR)",
                "Kainate receptor (KA receptor)",
                "Adenosine receptor (AdoR)",
                "Opioid receptor (OR)",
                "Histamine receptor (H1, H2, H3, H4 receptors)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "P2X1 purinergic receptor",
                "P2Y purinergic receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H2 receptor",
                "histamine H4 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "kappa opioid receptor",
                "metabotropic glutamate receptor",
                "metabotropic glutamate receptor 5",
                "mu opioid receptor",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "neurokinin-1 receptor",
                "neurokinin-2 receptor",
                "neurokinin-3 receptor",
                "nicotinic receptor",
                "opioid receptor",
                "purinergic receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "serotonin receptor"
            ],
            "TP": 24,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Acetylcholine Receptor (AChR)",
            "Adrenergic Receptor (AR)",
            "Alpha-1 Adrenergic Receptor (\u03b11-AR)",
            "Alpha-2 Adrenergic Receptor (\u03b12-AR)",
            "Beta-1 Adrenergic Receptor (\u03b21-AR)",
            "Beta-2 Adrenergic Receptor (\u03b22-AR)",
            "Beta-3 Adrenergic Receptor (\u03b23-AR)",
            "Dopamine Receptor (DR)",
            "D1 Dopamine Receptor (D1R)",
            "D2 Dopamine Receptor (D2R)",
            "D3 Dopamine Receptor (D3R)",
            "D4 Dopamine Receptor (D4R)",
            "D5 Dopamine Receptor (D5R)",
            "GABA Receptor (GABA-R)",
            "GABA-A Receptor (GABA-AR)",
            "GABA-B Receptor (GABA-BR)",
            "Glutamate Receptor (GluR)",
            "N-Methyl-D-aspartate Receptor (NMDAR)",
            "Amino-3-hydroxy-5-methyl-4-isoxazolepropionic acid Receptor (AMPAR)",
            "Kainate Receptor (KAR)",
            "Serotonin Receptor (5-HTR)",
            "5-HT1A Receptor",
            "5-HT2A Receptor",
            "5-HT3 Receptor"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha-1 Adrenergic Receptor (\u03b11-AR)",
                "Alpha-2 Adrenergic Receptor (\u03b12-AR)",
                "Beta-1 Adrenergic Receptor (\u03b21-AR)",
                "Beta-2 Adrenergic Receptor (\u03b22-AR)",
                "Beta-3 Adrenergic Receptor (\u03b23-AR)",
                "D1 Dopamine Receptor (D1R)",
                "D2 Dopamine Receptor (D2R)",
                "D3 Dopamine Receptor (D3R)",
                "D4 Dopamine Receptor (D4R)",
                "D5 Dopamine Receptor (D5R)",
                "GABA Receptor (GABA-R)",
                "GABA-A Receptor (GABA-AR)",
                "GABA-B Receptor (GABA-BR)",
                "N-Methyl-D-aspartate Receptor (NMDAR)",
                "Amino-3-hydroxy-5-methyl-4-isoxazolepropionic acid Receptor (AMPAR)",
                "Kainate Receptor (KAR)",
                "5-HT1A Receptor",
                "5-HT2A Receptor",
                "5-HT3 Receptor"
            ],
            "mismatches": [
                "Acetylcholine Receptor (AChR)",
                "Adrenergic Receptor (AR)",
                "Dopamine Receptor (DR)",
                "Glutamate Receptor (GluR)",
                "Serotonin Receptor (5-HTR)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D3 dopamine receptor",
                "D4 dopamine receptor",
                "D5 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "beta-3 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "nicotinic receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "serotonin 5-HT3 receptor"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Acetylcholine Receptor, Nicotinic (nAChR)",
            "Acetylcholine Receptor, Muscarinic M1 (M1R)",
            "Dopamine Receptor D1 (D1R)",
            "Dopamine Receptor D2 (D2R)",
            "Serotonin Receptor 5-HT1A (5-HT1AR)",
            "Serotonin Receptor 5-HT2A (5-HT2AR)",
            "GABA Receptor A (GABAA)",
            "GABA Receptor B1 (GABAB1)",
            "Glutamate Receptor NMDA (NMDAR)",
            "Glutamate Receptor AMPA (AMPAR)",
            "Glutamate Receptor Kainate (KAR)",
            "Histamine Receptor H1 (H1R)",
            "Histamine Receptor H2 (H2R)",
            "Adrenergic Receptor Alpha-1A (\u03b11A-AR)",
            "Adrenergic Receptor Beta-2 (\u03b22-AR)",
            "Opioid Receptor Mu (MOR)",
            "Opioid Receptor Delta (DOR)",
            "Opioid Receptor Kappa (KOR)",
            "Cannabinoid Receptor CB1 (CB1R)",
            "Cannabinoid Receptor CB2 (CB2R)",
            "ATP Receptor P2X2 (P2X2R)",
            "Sigma Receptor Sigma-1 (\u03c31R)",
            "Vanilloid Receptor TRPV1 (TRPV1)",
            "Neuropeptide Y Receptor Y1 (Y1R)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2A receptor",
                "GABA-A receptor",
                "N-methyl-D-aspartate receptor",
                "AMPA receptor",
                "GluK2 kainate receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "alpha-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "mu opioid receptor",
                "delta opioid receptor",
                "kappa opioid receptor",
                "P2X2 purinergic receptor",
                "sigma-1 receptor",
                "neuropeptide Y receptor"
            ],
            "mismatches": [
                "Acetylcholine Receptor, Nicotinic (nAChR)",
                "Acetylcholine Receptor, Muscarinic M1 (M1R)",
                "GABA Receptor B1 (GABAB1)",
                "Cannabinoid Receptor CB1 (CB1R)",
                "Cannabinoid Receptor CB2 (CB2R)",
                "Vanilloid Receptor TRPV1 (TRPV1)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "P2X purinergic receptor",
                "P2X1 purinergic receptor",
                "P2X2 purinergic receptor",
                "P2Y1 purinergic receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "kappa opioid receptor",
                "mu opioid receptor",
                "muscarinic M1 receptor",
                "muscarinic M4 receptor",
                "muscarinic receptor",
                "neurokinin-1 receptor",
                "neuropeptide Y receptor",
                "neuropeptide receptor",
                "nicotinic receptor",
                "opioid receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "sigma receptor",
                "sigma-1 receptor",
                "tachykinin receptor"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "N-Methyl-D-Aspartate receptor (NMDA)",
            "Gamma-Aminobutyric Acid A receptor (GABA-A)",
            "Gamma-Aminobutyric Acid B receptor (GABA-B)",
            "Alpha-7 Nicotinic Acetylcholine receptor (\u03b17 nAChR)",
            "Muscarinic Acetylcholine receptor M1 (M1 mAChR)",
            "Muscarinic Acetylcholine receptor M2 (M2 mAChR)",
            "Muscarinic Acetylcholine receptor M3 (M3 mAChR)",
            "Muscarinic Acetylcholine receptor M4 (M4 mAChR)",
            "Muscarinic Acetylcholine receptor M5 (M5 mAChR)",
            "Dopamine receptor D1 (D1)",
            "Dopamine receptor D2 (D2)",
            "Dopamine receptor D3 (D3)",
            "Dopamine receptor D4 (D4)",
            "Dopamine receptor D5 (D5)",
            "Serotonin receptor 5-HT1A (5-HT1A)",
            "Serotonin receptor 5-HT2A (5-HT2A)",
            "Serotonin receptor 5-HT3 (5-HT3)",
            "Serotonin receptor 5-HT4 (5-HT4)",
            "Serotonin receptor 5-HT5A (5-HT5A)",
            "Serotonin receptor 5-HT6 (5-HT6)",
            "Serotonin receptor 5-HT7 (5-HT7)",
            "Histamine receptor H1 (H1)",
            "Histamine receptor H2 (H2)",
            "Histamine receptor H3 (H3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-Methyl-D-Aspartate receptor (NMDA)",
                "Gamma-Aminobutyric Acid A receptor (GABA-A)",
                "Gamma-Aminobutyric Acid B receptor (GABA-B)",
                "Alpha-7 Nicotinic Acetylcholine receptor (\u03b17 nAChR)",
                "Muscarinic Acetylcholine receptor M1 (M1 mAChR)",
                "Muscarinic Acetylcholine receptor M2 (M2 mAChR)",
                "Muscarinic Acetylcholine receptor M3 (M3 mAChR)",
                "Muscarinic Acetylcholine receptor M4 (M4 mAChR)",
                "Muscarinic Acetylcholine receptor M5 (M5 mAChR)",
                "Dopamine receptor D1 (D1)",
                "Dopamine receptor D2 (D2)",
                "Dopamine receptor D3 (D3)",
                "Dopamine receptor D4 (D4)",
                "Dopamine receptor D5 (D5)",
                "Serotonin receptor 5-HT1A (5-HT1A)",
                "Serotonin receptor 5-HT2A (5-HT2A)",
                "Serotonin receptor 5-HT3 (5-HT3)",
                "Serotonin receptor 5-HT4 (5-HT4)",
                "Histamine receptor H1 (H1)",
                "Histamine receptor H2 (H2)",
                "Histamine receptor H3 (H3)"
            ],
            "mismatches": [
                "Serotonin receptor 5-HT5A (5-HT5A)",
                "Serotonin receptor 5-HT6 (5-HT6)",
                "Serotonin receptor 5-HT7 (5-HT7)"
            ],
            "true_referents": [
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D3 dopamine receptor",
                "D4 dopamine receptor",
                "D5 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "N-methyl-D-aspartate receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine H3 receptor",
                "histamine receptor",
                "muscarinic M1 receptor",
                "muscarinic M2 receptor",
                "muscarinic M3 receptor",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "nicotinic receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "serotonin 5-HT3 receptor",
                "serotonin 5-HT4 receptor",
                "serotonin receptor"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Dopamine receptor D1 (DRD1)",
            "Dopamine receptor D2 (DRD2)",
            "Serotonin receptor 5-HT1A (HTR1A)",
            "Serotonin receptor 5-HT2A (HTR2A)",
            "Norepinephrine receptor alpha-1 (ADRA1)",
            "Norepinephrine receptor alpha-2 (ADRA2)",
            "Acetylcholine receptor nicotinic alpha-7 (CHRNA7)",
            "Acetylcholine receptor muscarinic M1 (CHRM1)",
            "Glutamate receptor NMDA (GRIN1)",
            "Glutamate receptor AMPA (GRIA1)",
            "GABA receptor A (GABRA1)",
            "GABA receptor B (GABBR1)",
            "Histamine receptor H1 (HRH1)",
            "Histamine receptor H2 (HRH2)",
            "Endocannabinoid receptor CB1 (CNR1)",
            "Endocannabinoid receptor CB2 (CNR2)",
            "Opioid receptor mu (OPRM1)",
            "Opioid receptor delta (OPRD1)",
            "Opioid receptor kappa (OPRK1)",
            "Vasopressin receptor V1A (AVPR1A)",
            "Vasopressin receptor V2 (AVPR2)",
            "Neuropeptide Y receptor Y1 (NPY1R)",
            "Neuropeptide Y receptor Y2 (NPY2R)",
            "Somatostatin receptor 1 (SSTR1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2A receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "muscarinic M1 receptor",
                "N-methyl-D-aspartate receptor",
                "AMPA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "mu opioid receptor",
                "delta opioid receptor",
                "kappa opioid receptor",
                "vasopressin receptor",
                "neuropeptide Y receptor",
                "somatostatin receptor"
            ],
            "mismatches": [
                "Endocannabinoid receptor CB1 (CNR1)",
                "Endocannabinoid receptor CB2 (CNR2)",
                "Vasopressin receptor V1A (AVPR1A)",
                "Vasopressin receptor V2 (AVPR2)",
                "Neuropeptide Y receptor Y1 (NPY1R)",
                "Neuropeptide Y receptor Y2 (NPY2R)",
                "Somatostatin receptor 1 (SSTR1)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "N-methyl-D-aspartate receptor",
                "P2Y1 purinergic receptor",
                "P2Y2 purinergic receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine H3 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kappa opioid receptor",
                "melanocortin type 2 receptor",
                "mu opioid receptor",
                "muscarinic M1 receptor",
                "muscarinic M4 receptor",
                "muscarinic receptor",
                "neurokinin-1 receptor",
                "neurokinin-2 receptor",
                "neuropeptide Y receptor",
                "neuropeptide receptor",
                "nicotinic receptor",
                "opioid receptor",
                "oxytocin receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "serotonin receptor",
                "somatostatin receptor",
                "thyrotropin receptor",
                "vasoactive intestinal peptide receptor",
                "vasopressin receptor"
            ],
            "TP": 20,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "N-Methyl-D-aspartate receptor (NMDAR)",
            "Alpha-1 adrenergic receptor (\u03b11-AR)",
            "Alpha-2 adrenergic receptor (\u03b12-AR)",
            "Beta-1 adrenergic receptor (\u03b21-AR)",
            "Beta-2 adrenergic receptor (\u03b22-AR)",
            "Dopamine receptor D1 (DRD1)",
            "Dopamine receptor D2 (DRD2)",
            "GABA-A receptor (GABAAR)",
            "GABA-B receptor (GABABR)",
            "Serotonin receptor 1A (5-HT1A)",
            "Serotonin receptor 2A (5-HT2A)",
            "Serotonin receptor 3 (5-HT3)",
            "Muscarinic acetylcholine receptor M1 (M1R)",
            "Muscarinic acetylcholine receptor M2 (M2R)",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Opioid receptor Mu (MOR)",
            "Opioid receptor Delta (DOR)",
            "Opioid receptor Kappa (KOR)",
            "Cannabinoid receptor 1 (CB1)",
            "Cannabinoid receptor 2 (CB2)",
            "Glutamate receptor, ionotropic, AMPA 1 (GRIA1)",
            "Glutamate receptor, ionotropic, NMDA 2A (GRIN2A)",
            "Glutamate receptor, metabotropic 1 (GRM1)",
            "Vasopressin 1A receptor (AVPR1A)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-methyl-D-aspartate receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2A receptor",
                "serotonin 5-HT3 receptor",
                "muscarinic M1 receptor",
                "muscarinic M2 receptor",
                "nicotinic receptor",
                "mu opioid receptor",
                "delta opioid receptor",
                "kappa opioid receptor",
                "AMPA receptor",
                "vasopressin receptor"
            ],
            "mismatches": [
                "cannabinoid receptor 1",
                "cannabinoid receptor 2",
                "glutamate receptor, metabotropic 1"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "N-methyl-D-aspartate receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "ionotropic glutamate receptor",
                "kappa opioid receptor",
                "melanocortin type 1 receptor",
                "metabotropic glutamate receptor",
                "metabotropic glutamate receptor 5",
                "mu opioid receptor",
                "muscarinic M1 receptor",
                "muscarinic M2 receptor",
                "muscarinic M3 receptor",
                "muscarinic receptor",
                "neurokinin-2 receptor",
                "nicotinic receptor",
                "opioid receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "serotonin 5-HT3 receptor",
                "serotonin receptor",
                "vasoactive intestinal peptide receptor",
                "vasopressin receptor"
            ],
            "TP": 20,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Dopamine receptor (DRD1)",
            "Serotonin receptor (5-HT1A)",
            "Gamma-aminobutyric acid receptor (GABA-A)",
            "Glutamate receptor (AMPA)",
            "Acetylcholine receptor (nAChR)",
            "Norepinephrine receptor (\u03b11-AR)",
            "Histamine receptor (H1)",
            "Opioid receptor (MOR)",
            "Cannabinoid receptor (CB1)",
            "Adenosine receptor (A1)",
            "Glycine receptor (GlyR)",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Glutamate receptor (NMDA)",
            "Epinephrine receptor (\u03b22-AR)",
            "Dopamine receptor (DRD2)",
            "Serotonin receptor (5-HT2A)",
            "GABA-B receptor",
            "Acetylcholine receptor (muscarinic)",
            "Norepinephrine receptor (\u03b21-AR)",
            "Histamine receptor (H2)",
            "Opioid receptor (DOR)",
            "Cannabinoid receptor (CB2)",
            "Adenosine receptor (A2A)",
            "Glutamate receptor (kainate)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D1 dopamine receptor",
                "serotonin 5-HT1A receptor",
                "GABA-A receptor",
                "AMPA receptor",
                "nicotinic receptor",
                "histamine H1 receptor",
                "mu opioid receptor",
                "adenosine A1 receptor",
                "glycine receptor",
                "nicotinic receptor",
                "N-methyl-D-aspartate receptor",
                "beta-2 adrenergic receptor",
                "D2 dopamine receptor",
                "serotonin 5-HT2A receptor",
                "GABA-B receptor",
                "muscarinic receptor",
                "beta-1 adrenergic receptor",
                "histamine H2 receptor",
                "delta opioid receptor",
                "adenosine A2A receptor",
                "kainic acid receptor"
            ],
            "mismatches": [
                "Cannabinoid receptor (CB1)",
                "Cannabinoid receptor (CB2)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "adenosine A2B receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "kappa opioid receptor",
                "mu opioid receptor",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "nicotinic receptor",
                "opioid receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor"
            ],
            "TP": 20,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "NMDA receptor (NMDAR)",
            "AMPA receptor (AMPAR)",
            "Kainate receptor",
            "GABA_A receptor",
            "GABA_B receptor",
            "Dopamine D1 receptor",
            "Dopamine D2 receptor",
            "Serotonin 5-HT1A receptor",
            "Serotonin 5-HT2A receptor",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Muscarinic acetylcholine receptor M1",
            "Muscarinic acetylcholine receptor M2",
            "Histamine H1 receptor",
            "Histamine H2 receptor",
            "Glycine receptor",
            "Metabotropic glutamate receptor 1 (mGluR1)",
            "Metabotropic glutamate receptor 2 (mGluR2)",
            "Opioid \u03bc receptor (\u03bcOR)",
            "Opioid \u03b4 receptor (\u03b4OR)",
            "Opioid \u03ba receptor (\u03baOR)",
            "Cannabinoid CB1 receptor",
            "Cannabinoid CB2 receptor",
            "Adrenergic \u03b11 receptor",
            "Adrenergic \u03b22 receptor"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "AMPA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2A receptor",
                "nicotinic receptor",
                "muscarinic M1 receptor",
                "muscarinic M2 receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "glycine receptor",
                "delta opioid receptor",
                "kappa opioid receptor"
            ],
            "mismatches": [
                "NMDA receptor (NMDAR)",
                "Kainate receptor",
                "Dopamine D1 receptor",
                "Dopamine D2 receptor",
                "Muscarinic acetylcholine receptor M1",
                "Muscarinic acetylcholine receptor M2",
                "Metabotropic glutamate receptor 1 (mGluR1)",
                "Metabotropic glutamate receptor 2 (mGluR2)",
                "Opioid \u03bc receptor (\u03bcOR)",
                "Opioid \u03b4 receptor (\u03b4OR)",
                "Opioid \u03ba receptor (\u03baOR)",
                "Cannabinoid CB1 receptor",
                "Cannabinoid CB2 receptor",
                "Adrenergic \u03b11 receptor",
                "Adrenergic \u03b22 receptor"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "kappa opioid receptor",
                "metabotropic glutamate receptor",
                "metabotropic glutamate receptor 5",
                "mu opioid receptor",
                "muscarinic M1 receptor",
                "muscarinic M2 receptor",
                "muscarinic M3 receptor",
                "muscarinic receptor",
                "nicotinic receptor",
                "opioid receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor"
            ],
            "TP": 15,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Serotonin receptor (5-HT receptor)",
            "Dopamine receptor (D receptor)",
            "GABA receptor (GABAR)",
            "Glutamate receptor (GluR)",
            "Acetylcholine receptor (AChR)",
            "Norepinephrine receptor (\u03b1 and \u03b2 adrenergic receptors)",
            "Histamine receptor (H receptor)",
            "Glycine receptor (GlyR)",
            "Adenosine receptor (A receptor)",
            "Opioid receptor (\u03bc, \u03b4, \u03ba receptors)",
            "Cannabinoid receptor (CB receptor)",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Muscarinic acetylcholine receptor (mAChR)",
            "NMDA receptor",
            "AMPA receptor",
            "Kainate receptor",
            "Metabotropic glutamate receptor (mGluR)",
            "GABAA receptor",
            "GABAB receptor",
            "Glycine receptor",
            "P2X receptor",
            "P2Y receptor",
            "Vasopressin receptor (V1 and V2 receptors)",
            "Oxytocin receptor (OTR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dopamine receptor",
                "GABA receptor",
                "Glutamate receptor",
                "Histamine receptor",
                "Glycine receptor",
                "Opioid receptor",
                "Nicotinic acetylcholine receptor",
                "AMPA receptor",
                "Metabotropic glutamate receptor",
                "GABAA receptor",
                "GABAB receptor",
                "Glycine receptor",
                "P2X receptor",
                "P2Y receptor",
                "Vasopressin receptor",
                "Oxytocin receptor"
            ],
            "mismatches": [
                "Serotonin receptor (5-HT receptor)",
                "Acetylcholine receptor (AChR)",
                "Norepinephrine receptor (\u03b1 and \u03b2 adrenergic receptors)",
                "Adenosine receptor (A receptor)",
                "Cannabinoid receptor (CB receptor)",
                "Muscarinic acetylcholine receptor (mAChR)",
                "NMDA receptor",
                "Kainate receptor"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "P2X purinergic receptor",
                "P2X1 purinergic receptor",
                "P2X2 purinergic receptor",
                "P2Y purinergic receptor",
                "P2Y1 purinergic receptor",
                "P2Y2 purinergic receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "kappa opioid receptor",
                "metabotropic glutamate receptor",
                "metabotropic glutamate receptor 5",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "neuropeptide receptor",
                "nicotinic receptor",
                "opioid receptor",
                "oxytocin receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin receptor",
                "vasoactive intestinal peptide receptor",
                "vasopressin receptor"
            ],
            "TP": 15,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "5-HT1A receptor (HTR1A)",
            "Dopamine D2 receptor (DRD2)",
            "GABAA receptor (GABAAR)",
            "Nicotinic acetylcholine receptor (nAChR)",
            "NMDA receptor (NMDAR)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "Glycine receptor (GlyR)",
            "Cannabinoid receptor 1 (CB1)",
            "Adenosine A1 receptor (ADORA1)",
            "Metabotropic glutamate receptor 1 (mGluR1)",
            "Oxytocin receptor (OXTR)",
            "Vasopressin V1a receptor (AVPR1A)",
            "Orexin receptor 1 (HCRTR1)",
            "Neuropeptide Y receptor Y1 (NPY1R)",
            "Substance P receptor (TACR1)",
            "Melanocortin receptor 4 (MC4R)",
            "Histamine H1 receptor (HRH1)",
            "Melatonin receptor 1A (MTNR1A)",
            "Opioid receptor mu 1 (OPRM1)",
            "Serotonin 5-HT2A receptor (HTR2A)",
            "GABA-B receptor (GABABR)",
            "Adrenergic receptor alpha 2A (ADRA2A)",
            "Dopamine D1 receptor (DRD1)",
            "Somatostatin receptor 2 (SSTR2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dopamine D2 receptor (DRD2)",
                "GABAA receptor (GABAAR)",
                "Nicotinic acetylcholine receptor (nAChR)",
                "NMDA receptor (NMDAR)",
                "Muscarinic acetylcholine receptor M1 (CHRM1)",
                "Glycine receptor (GlyR)",
                "Adenosine A1 receptor (ADORA1)",
                "Oxytocin receptor (OXTR)",
                "Orexin receptor 1 (HCRTR1)",
                "Neuropeptide Y receptor Y1 (NPY1R)",
                "Melanocortin receptor 4 (MC4R)",
                "Histamine H1 receptor (HRH1)",
                "Opioid receptor mu 1 (OPRM1)",
                "Serotonin 5-HT2A receptor (HTR2A)",
                "GABA-B receptor (GABABR)",
                "Adrenergic receptor alpha 2A (ADRA2A)",
                "Dopamine D1 receptor (DRD1)",
                "Somatostatin receptor 2 (SSTR2)"
            ],
            "mismatches": [
                "5-HT1A receptor (HTR1A)",
                "Cannabinoid receptor 1 (CB1)",
                "Metabotropic glutamate receptor 1 (mGluR1)",
                "Vasopressin V1a receptor (AVPR1A)",
                "Substance P receptor (TACR1)",
                "Melatonin receptor 1A (MTNR1A)"
            ],
            "true_referents": [
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "N-methyl-D-aspartate receptor",
                "P2Y1 purinergic receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "alpha adrenergic receptor",
                "alpha-2 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta-2 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "kappa opioid receptor",
                "melanocortin receptor",
                "melanocortin type 1 receptor",
                "melanocortin type 2 receptor",
                "melanocortin type 4 receptor",
                "metabotropic glutamate receptor",
                "metabotropic glutamate receptor 5",
                "mu opioid receptor",
                "muscarinic M1 receptor",
                "muscarinic M4 receptor",
                "muscarinic receptor",
                "neurokinin-1 receptor",
                "neurokinin-2 receptor",
                "neuropeptide Y receptor",
                "neuropeptide receptor",
                "nicotinic receptor",
                "opioid receptor",
                "orexin receptor",
                "oxytocin receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "somatostatin receptor",
                "tachykinin receptor",
                "thyrotropin-releasing hormone receptor",
                "vasoactive intestinal peptide receptor",
                "vasopressin receptor"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Nicotinic acetylcholine receptor (nAChR)",
            "Muscarinic acetylcholine receptor (mAChR)",
            "GABA-A receptor",
            "GABA-B receptor",
            "Glutamate receptor (AMPA, NMDA, kainate)",
            "Dopamine receptor (D1, D2, D3, D4, D5)",
            "Serotonin receptor (5-HT1, 5-HT2, 5-HT3, 5-HT4, 5-HT5, 5-HT6, 5-HT7)",
            "Norepinephrine receptor (\u03b11, \u03b12, \u03b21, \u03b22, \u03b23)",
            "Epinephrine receptor (\u03b11, \u03b12, \u03b21, \u03b22, \u03b23)",
            "Histamine receptor (H1, H2, H3, H4)",
            "Glycine receptor",
            "Cannabinoid receptor (CB1, CB2)",
            "Opioid receptor (\u03bc, \u03b4, \u03ba, nociceptin)",
            "Adenosine receptor (A1, A2A, A2B, A3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "GABA-A receptor",
                "GABA-B receptor",
                "glycine receptor",
                "opioid receptor"
            ],
            "mismatches": [
                "Nicotinic acetylcholine receptor (nAChR)",
                "Muscarinic acetylcholine receptor (mAChR)",
                "Glutamate receptor (AMPA, NMDA, kainate)",
                "Dopamine receptor (D1, D2, D3, D4, D5)",
                "Serotonin receptor (5-HT1, 5-HT2, 5-HT3, 5-HT4, 5-HT5, 5-HT6, 5-HT7)",
                "Norepinephrine receptor (\u03b11, \u03b12, \u03b21, \u03b22, \u03b23)",
                "Epinephrine receptor (\u03b11, \u03b12, \u03b21, \u03b22, \u03b23)",
                "Histamine receptor (H1, H2, H3, H4)",
                "Cannabinoid receptor (CB1, CB2)",
                "Adenosine receptor (A1, A2A, A2B, A3)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H4 receptor",
                "histamine receptor",
                "kappa opioid receptor",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "nicotinic receptor",
                "nociceptin receptor",
                "opioid receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2 receptor",
                "serotonin receptor"
            ],
            "TP": 4,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Acetylcholine Receptor (AChR)",
            "Dopamine Receptor (DR)",
            "Serotonin Receptor (5-HT Receptor)",
            "Glutamate Receptor (GluR)",
            "GABA Receptor (GABAR)",
            "Glycine Receptor (GlyR)",
            "Nicotinic Acetylcholine Receptor (nAChR)",
            "Muscarinic Acetylcholine Receptor (mAChR)",
            "Adrenergic Receptor (AR)",
            "Opioid Receptor (OR)",
            "Cannabinoid Receptor (CB Receptor)",
            "Histamine Receptor (HR)",
            "Purinergic Receptor (P2 Receptor)",
            "Sigma Receptor (\u03c3 Receptor)",
            "Metabotropic Glutamate Receptor (mGluR)",
            "Ionotropic Glutamate Receptor (iGluR)",
            "NMDA Receptor (NMDAR)",
            "AMPA Receptor (AMPAR)",
            "Kainate Receptor (KAR)",
            "GABA-A Receptor (GABAAR)",
            "GABA-B Receptor (GABABR)",
            "Nicotinic Acetylcholine Receptor Subunit (nAChR Subunit)",
            "Muscarinic Acetylcholine Receptor Subunit (mAChR Subunit)",
            "Adrenergic Receptor Subunit (AR Subunit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dopamine Receptor (DR)",
                "Serotonin Receptor (5-HT Receptor)",
                "Glutamate Receptor (GluR)",
                "GABA Receptor (GABAR)",
                "Glycine Receptor (GlyR)",
                "Nicotinic Acetylcholine Receptor (nAChR)",
                "Muscarinic Acetylcholine Receptor (mAChR)",
                "Adrenergic Receptor (AR)",
                "Opioid Receptor (OR)",
                "Histamine Receptor (HR)",
                "Purinergic Receptor (P2 Receptor)",
                "Sigma Receptor (\u03c3 Receptor)",
                "Metabotropic Glutamate Receptor (mGluR)",
                "Ionotropic Glutamate Receptor (iGluR)",
                "NMDA Receptor (NMDAR)",
                "AMPA Receptor (AMPAR)",
                "Kainate Receptor (KAR)",
                "GABA-A Receptor (GABAAR)",
                "GABA-B Receptor (GABABR)"
            ],
            "mismatches": [
                "Acetylcholine Receptor (AChR)",
                "Cannabinoid Receptor (CB Receptor)",
                "Nicotinic Acetylcholine Receptor Subunit (nAChR Subunit)",
                "Muscarinic Acetylcholine Receptor Subunit (mAChR Subunit)",
                "Adrenergic Receptor Subunit (AR Subunit)"
            ],
            "true_referents": [
                "AMPA receptor",
                "D1 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "GluK2 kainate receptor",
                "GluK3 kainate receptor",
                "N-methyl-D-aspartate receptor",
                "P1 purinergic receptor",
                "P2 purinergic receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta-1 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "kainic acid receptor",
                "kappa opioid receptor",
                "metabotropic glutamate receptor",
                "metabotropic glutamate receptor 5",
                "mu opioid receptor",
                "muscarinic M1 receptor",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "nicotinic receptor",
                "opioid receptor",
                "purinergic receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin receptor",
                "sigma receptor",
                "sigma-1 receptor"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "GABA receptor (GABA-R)",
            "N-methyl-D-aspartate receptor (NMDAR)",
            "Dopamine receptor D1 (DRD1)",
            "Dopamine receptor D2 (DRD2)",
            "Serotonin receptor 5-HT1A (5-HT1A)",
            "Serotonin receptor 5-HT2A (5-HT2A)",
            "Glutamate receptor (GluR)",
            "Acetylcholine receptor (AChR)",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Muscarinic acetylcholine receptor (mAChR)",
            "Adrenergic receptor alpha-1 (\u03b11-AR)",
            "Adrenergic receptor beta-1 (\u03b21-AR)",
            "Adrenergic receptor beta-2 (\u03b22-AR)",
            "Adrenergic receptor beta-3 (\u03b23-AR)",
            "Histamine receptor H1 (H1-R)",
            "Histamine receptor H2 (H2-R)",
            "Histamine receptor H3 (H3-R)",
            "Histamine receptor H4 (H4-R)",
            "Vasopressin receptor V1A (V1A-R)",
            "Vasopressin receptor V2 (V2-R)",
            "Oxytocin receptor (OT-R)",
            "Melatonin receptor MT1 (MT1-R)",
            "Melatonin receptor MT2 (MT2-R)",
            "Galanin receptor (GAL-R)",
            "Neurokinin receptor NK1 (NK1-R)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "GABA receptor",
                "N-methyl-D-aspartate receptor",
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT2A receptor",
                "glutamate receptor",
                "nicotinic receptor",
                "muscarinic receptor",
                "alpha-1 adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "beta-3 adrenergic receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine H3 receptor",
                "histamine H4 receptor",
                "vasopressin receptor",
                "oxytocin receptor",
                "galanin receptor"
            ],
            "mismatches": [
                "Acetylcholine receptor (AChR)",
                "Melatonin receptor MT1 (MT1-R)",
                "Melatonin receptor MT2 (MT2-R)",
                "Neurokinin receptor NK1 (NK1-R)"
            ],
            "true_referents": [
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "D4 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "N-methyl-D-aspartate receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha-1 adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta adrenergic receptor",
                "beta-1 adrenergic receptor",
                "beta-2 adrenergic receptor",
                "beta-3 adrenergic receptor",
                "cholinergic receptor",
                "dopamine receptor",
                "galanin receptor",
                "glutamate receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine H3 receptor",
                "histamine H4 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "melanocortin type 1 receptor",
                "melanocortin type 2 receptor",
                "muscarinic M4 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "neuropeptide receptor",
                "nicotinic receptor",
                "oxytocin receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin 5-HT2 receptor",
                "serotonin 5-HT2A receptor",
                "serotonin receptor",
                "thyrotropin-releasing hormone receptor",
                "vasoactive intestinal peptide receptor",
                "vasopressin receptor"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            "Acetylcholine receptor (AChR)",
            "Adrenergic receptor (ADRB)",
            "Adenosine receptor (ADORA)",
            "Angiotensin receptor (AGTR)",
            "Benzodiazepine receptor (BZRP)",
            "Cannabinoid receptor (CB)",
            "Cholecystokinin receptor (CCKR)",
            "Dopamine receptor (DRD)",
            "GABA receptor (GABAR)",
            "GluR1 receptor (GRIA1)",
            "Glycine receptor (GLRA)",
            "Histamine receptor (HRH)",
            "Imidazoline receptor (I1R)",
            "Melatonin receptor (MTNR)",
            "Muscarinic acetylcholine receptor (CHRM)",
            "Nicotinic acetylcholine receptor (CHRN)",
            "NMDA receptor (GRIN)",
            "Opioid receptor (OPRD)",
            "P2X receptor (P2RX)",
            "Purinergic receptor (P2YR)",
            "Serotonin receptor (HTR)",
            "Sigma receptor (SGMR)",
            "Trk receptor (NTRK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenergic receptor (ADRB)",
                "Cholecystokinin receptor (CCKR)",
                "Dopamine receptor (DRD)",
                "GABA receptor (GABAR)",
                "Glycine receptor (GLRA)",
                "Histamine receptor (HRH)",
                "Muscarinic acetylcholine receptor (CHRM)",
                "Nicotinic acetylcholine receptor (CHRN)",
                "Opioid receptor (OPRD)",
                "Purinergic receptor (P2YR)",
                "Serotonin receptor (HTR)",
                "Sigma receptor (SGMR)"
            ],
            "mismatches": [
                "Acetylcholine receptor (AChR)",
                "Adenosine receptor (ADORA)",
                "Angiotensin receptor (AGTR)",
                "Benzodiazepine receptor (BZRP)",
                "Cannabinoid receptor (CB)",
                "GluR1 receptor (GRIA1)",
                "Imidazoline receptor (I1R)",
                "Melatonin receptor (MTNR)",
                "NMDA receptor (GRIN)",
                "P2X receptor (P2RX)",
                "Trk receptor (NTRK)"
            ],
            "true_referents": [
                "D1 dopamine receptor",
                "D2 dopamine receptor",
                "GABA receptor",
                "GABA-A receptor",
                "GABA-B receptor",
                "N-methyl-D-aspartate receptor",
                "P2X purinergic receptor",
                "P2X1 purinergic receptor",
                "P2X2 purinergic receptor",
                "P2Y purinergic receptor",
                "P2Y1 purinergic receptor",
                "adenosine A1 receptor",
                "adenosine A2 receptor",
                "adenosine A2A receptor",
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "alpha7 nicotinic acetylcholine receptor",
                "amino acid receptor",
                "beta-1 adrenergic receptor",
                "cholecystokinin A receptor",
                "cholecystokinin B receptor",
                "cholecystokinin receptor",
                "cholinergic receptor",
                "delta opioid receptor",
                "dopamine receptor",
                "glutamate receptor",
                "glycine receptor",
                "histamine H1 receptor",
                "histamine H2 receptor",
                "histamine receptor",
                "ionotropic glutamate receptor",
                "mu opioid receptor",
                "muscarinic M2 receptor",
                "muscarinic M5 receptor",
                "muscarinic receptor",
                "neurokinin-1 receptor",
                "neurokinin-3 receptor",
                "neurotensin receptor",
                "nicotinic receptor",
                "opioid receptor",
                "purinergic receptor",
                "serotonin 5-HT1 receptor",
                "serotonin 5-HT1A receptor",
                "serotonin 5-HT1D receptor",
                "serotonin receptor",
                "sigma receptor",
                "sigma-1 receptor",
                "tachykinin receptor"
            ],
            "TP": 12,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "neurotransmitter receptor",
        "domain": "biology",
        "response": [
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            },
            {
                "Referent": "Adrenergic receptor",
                "Canonical name": "ADR"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenergic receptor"
            ],
            "mismatches": [],
            "true_referents": [
                "adrenergic receptor",
                "alpha adrenergic receptor",
                "beta-1 adrenergic receptor"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]