[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Adrenergic receptor alpha-1A (ADRA1A)",
            "Adrenergic receptor alpha-1B (ADRA1B)",
            "Adrenergic receptor alpha-1D (ADRA1D)",
            "Adrenergic receptor alpha-2A (ADRA2A)",
            "Adrenergic receptor alpha-2B (ADRA2B)",
            "Adrenergic receptor alpha-2C (ADRA2C)",
            "Adrenergic receptor beta-1 (ADRB1)",
            "Adrenergic receptor beta-2 (ADRB2)",
            "Adrenergic receptor beta-3 (ADRB3)",
            "Dopamine receptor D1 (DRD1)",
            "Dopamine receptor D2 (DRD2)",
            "Dopamine receptor D3 (DRD3)",
            "Dopamine receptor D4 (DRD4)",
            "Dopamine receptor D5 (DRD5)",
            "Histamine receptor H1 (HRH1)",
            "Histamine receptor H2 (HRH2)",
            "Histamine receptor H3 (HRH3)",
            "Histamine receptor H4 (HRH4)",
            "Opioid receptor mu (OPRM1)",
            "Opioid receptor delta (OPRD1)",
            "Opioid receptor kappa (OPRK1)",
            "Serotonin receptor 5-HT1A (HTR1A)",
            "Serotonin receptor 5-HT2A (HTR2A)",
            "Serotonin receptor 5-HT3A (HTR3A)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenergic receptor alpha-1A (ADRA1A)",
                "Adrenergic receptor alpha-1B (ADRA1B)",
                "Adrenergic receptor alpha-1D (ADRA1D)",
                "Adrenergic receptor alpha-2A (ADRA2A)",
                "Adrenergic receptor alpha-2B (ADRA2B)",
                "Adrenergic receptor alpha-2C (ADRA2C)",
                "Adrenergic receptor beta-1 (ADRB1)",
                "Adrenergic receptor beta-2 (ADRB2)",
                "Adrenergic receptor beta-3 (ADRB3)",
                "Dopamine receptor D1 (DRD1)",
                "Dopamine receptor D2 (DRD2)",
                "Dopamine receptor D3 (DRD3)",
                "Dopamine receptor D4 (DRD4)",
                "Dopamine receptor D5 (DRD5)",
                "Histamine receptor H1 (HRH1)",
                "Histamine receptor H2 (HRH2)",
                "Histamine receptor H4 (HRH4)",
                "Opioid receptor mu (OPRM1)",
                "Opioid receptor delta (OPRD1)",
                "Opioid receptor kappa (OPRK1)",
                "Serotonin receptor 5-HT1A (HTR1A)",
                "Serotonin receptor 5-HT2A (HTR2A)"
            ],
            "mismatches": [
                "Histamine receptor H3 (HRH3)",
                "Serotonin receptor 5-HT3A (HTR3A)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "5-HT2A Serotonin Receptor",
                "Adrenergic Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D3 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine D5 Receptors",
                "Dopamine Receptors",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "Muscarinic M1 Receptor",
                "Opioid Receptors",
                "alpha Adrenergic Receptors",
                "alpha-1 Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "beta-3 Adrenergic Receptors",
                "delta Opioid Receptors",
                "kappa Opioid Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Rhodopsin (RHO)",
            "Beta-2 adrenergic receptor (ADRB2)",
            "Muscarinic acetylcholine receptor M2 (CHRM2)",
            "Dopamine receptor D2 (DRD2)",
            "Serotonin receptor 5-HT1A (HTR1A)",
            "Glucagon receptor (GCGR)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Oxytocin receptor (OXTR)",
            "Vasopressin receptor 1A (AVPR1A)",
            "Frizzled receptor 1 (FZD1)",
            "Cannabinoid receptor 1 (CNR1)",
            "Melatonin receptor 1A (MTNR1A)",
            "Adenosine A1 receptor (ADORA1)",
            "Histamine H1 receptor (HRH1)",
            "Somatostatin receptor 5 (SSTR5)",
            "Calcitonin receptor (CALCR)",
            "Thyroid hormone receptor beta (THRB)",
            "Gastrin-releasing peptide receptor (GRPR)",
            "Adenosine A2A receptor (ADORA2A)",
            "Neurokinin-1 receptor (TACR1)",
            "Prolactin receptor (PRLR)",
            "Parathyroid hormone receptor 1 (PTHR1)",
            "Secretin receptor (SCTR)",
            "Gastrin receptor (CCKBR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin",
                "beta-2 Adrenergic Receptors",
                "Muscarinic M2 Receptor",
                "Dopamine D2 Receptors",
                "5-HT1A Serotonin Receptor",
                "Glucagon Receptors",
                "Type 1 Angiotensin Receptor",
                "Oxytocin Receptors",
                "Frizzled Receptors",
                "CB1 Cannabinoid Receptor",
                "MT1 Melatonin Receptor",
                "Adenosine A1 Receptor",
                "Histamine H1 Receptors",
                "Somatostatin Receptors",
                "Calcitonin Receptors",
                "Adenosine A2A Receptor",
                "Neurokinin-1 Receptors",
                "Type 1 Parathyroid Hormone Receptor"
            ],
            "mismatches": [
                "Vasopressin receptor 1A (AVPR1A)",
                "Thyroid hormone receptor beta (THRB)",
                "Gastrin-releasing peptide receptor (GRPR)",
                "Prolactin receptor (PRLR)",
                "Secretin receptor (SCTR)",
                "Gastrin receptor (CCKBR)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Adenosine A1 Receptor",
                "Adenosine A2 Receptors",
                "Adenosine A2A Receptor",
                "Adenosine A2B Receptor",
                "Adenosine A3 Receptor",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "Calcitonin Gene-Related Peptide Receptors",
                "Calcitonin Receptor-Like Protein",
                "Calcitonin Receptors",
                "Cannabinoid Receptors",
                "Cholecystokinin A Receptor",
                "Cholecystokinin B Receptor",
                "Cholecystokinin Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "FSH Receptors",
                "Frizzled Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "MT1 Melatonin Receptor",
                "MT2 Melatonin Receptor",
                "Melatonin Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M2 Receptor",
                "Muscarinic Receptors",
                "Neurokinin-1 Receptors",
                "Neurokinin-2 Receptors",
                "Neurokinin-3 Receptors",
                "Oxytocin Receptors",
                "Parathyroid Hormone Receptors",
                "Rhodopsin",
                "Smoothened Receptor",
                "Somatostatin Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Vasopressin Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Adrenergic Receptor (ADR)",
            "Angiotensin II Receptor (AGTR)",
            "Brachyury",
            "Cannabinoid Receptor (CNR)",
            "Chemokine Receptor (CXCR)",
            "Dopamine Receptor (DR)",
            "Frizzled",
            "GABA Receptor (GABBR)",
            "Gastrin-Releasing Peptide Receptor (GRPR)",
            "Glutamate Receptor (GRM)",
            "Histamine Receptor (HRH)",
            "Melanocortin Receptor (MC)",
            "Neurokinin Receptor (TACR)",
            "Opsin",
            "Opioid Receptor (OPRM)",
            "Purinergic Receptor (P2Y)",
            "Prostaglandin Receptor (PTGER)",
            "Rhodopsin",
            "Serotonin Receptor (HTR)",
            "Somatostatin Receptor (SSTR)",
            "Thyroid-Stimulating Hormone Receptor (TSHR)",
            "Taste Receptor (TAS)",
            "Vasopressin Receptor (AVPR)",
            "Vitamin D Receptor (VDR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "Cannabinoid Receptors",
                "Chemokine Receptors",
                "Dopamine Receptors",
                "Frizzled Receptors",
                "GABA-B Receptors",
                "Histamine H1 Receptors",
                "Melanocortin Receptors",
                "Opioid Receptors",
                "Purinergic P2Y Receptors",
                "Prostaglandin Receptors",
                "Rhodopsin",
                "Serotonin Receptors",
                "Somatostatin Receptors",
                "Vasopressin Receptors"
            ],
            "mismatches": [
                "Brachyury",
                "Gastrin-Releasing Peptide Receptor (GRPR)",
                "Glutamate Receptor (GRM)",
                "Neurokinin Receptor (TACR)",
                "Opsin",
                "Thyroid-Stimulating Hormone Receptor (TSHR)",
                "Taste Receptor (TAS)",
                "Vitamin D Receptor (VDR)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1D Serotonin Receptor",
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CX3C Chemokine Receptor 1",
                "CXCR Receptors",
                "Cannabinoid Receptors",
                "Chemokine Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D2 Receptors",
                "Dopamine Receptors",
                "Frizzled Receptors",
                "GABA-B Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "Lipoxin Receptors",
                "Melanocortin Receptors",
                "Metabotropic Glutamate 5 Receptor",
                "Metabotropic Glutamate Receptors",
                "Muscarinic M5 Receptor",
                "Neurokinin-1 Receptors",
                "Neurokinin-2 Receptors",
                "Odorant Receptors",
                "Opioid Receptors",
                "Parathyroid Hormone Receptors",
                "Prostaglandin E Receptors",
                "Prostaglandin H2 Thromboxane A2 Receptors",
                "Prostaglandin Receptors",
                "Purinergic P2Y Receptors",
                "Purinergic P2Y1 Receptors",
                "Purinergic P2Y2 Receptors",
                "Rhodopsin",
                "Serotonin Receptors",
                "Smoothened Receptor",
                "Somatostatin Receptors",
                "Tachykinin Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Melanocortin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 2 Taste Receptors",
                "Type II Vasoactive Intestinal Peptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "alpha Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "delta Opioid Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Adrenergic Receptor \u03b11A (ADRA1A)",
            "Adrenergic Receptor \u03b22 (ADRB2)",
            "Muscarinic Acetylcholine Receptor M1 (CHRM1)",
            "Dopamine Receptor D1 (DRD1)",
            "Histamine Receptor H1 (HRH1)",
            "Serotonin Receptor 5-HT1A (HTR1A)",
            "Serotonin Receptor 5-HT2A (HTR2A)",
            "Opioid Receptor \u03bc (OPRM1)",
            "Opioid Receptor \u03b4 (OPRD1)",
            "Cannabinoid Receptor CB1 (CNR1)",
            "Chemokine Receptor CCR5",
            "Chemokine Receptor CXCR4",
            "Angiotensin II Receptor AT1 (AGTR1)",
            "Endothelin Receptor Type A (EDNRA)",
            "Prostaglandin Receptor DP1 (PTGDR)",
            "Somatostatin Receptor SSTR1 (SSTR1)",
            "Vasopressin Receptor V1A (AVPR1A)",
            "Oxytocin Receptor (OXTR)",
            "Glucagon Receptor (GCGR)",
            "Cholecystokinin Receptor CCK2R (CCK2R)",
            "Melatonin Receptor MT1 (MTNR1A)",
            "Taste Receptor T2R38 (TAS2R38)",
            "Formyl Peptide Receptor FPR1 (FPR1)",
            "Lysophosphatidic Acid Receptor LPAR1 (LPAR1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenergic Receptors",
                "Muscarinic Receptors",
                "Dopamine Receptors",
                "Histamine H1 Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT2A Serotonin Receptor",
                "mu Opioid Receptors",
                "delta Opioid Receptors",
                "CB1 Cannabinoid Receptor",
                "CCR5 Receptors",
                "CXCR4 Receptors",
                "Type 1 Angiotensin Receptor",
                "Endothelin A Receptor",
                "Prostaglandin Receptors",
                "Somatostatin Receptors",
                "Vasopressin Receptors",
                "Oxytocin Receptors",
                "Glucagon Receptors",
                "Cholecystokinin B Receptor",
                "MT1 Melatonin Receptor",
                "Type 2 Taste Receptors",
                "Formyl Peptide Receptors",
                "Lysophosphatidic Acid Receptors"
            ],
            "mismatches": [],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "5-HT2A Serotonin Receptor",
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR1 Receptors",
                "CCR4 Receptors",
                "CCR5 Receptors",
                "CXCR4 Receptors",
                "Cannabinoid Receptors",
                "Chemokine Receptors",
                "Cholecystokinin A Receptor",
                "Cholecystokinin B Receptor",
                "Cholecystokinin Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "Endothelin A Receptor",
                "Endothelin B Receptor",
                "Endothelin Receptors",
                "Formyl Peptide Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "Lysophosphatidic Acid Receptors",
                "Lysophospholipid Receptors",
                "Lysosphingolipid Receptors",
                "MT1 Melatonin Receptor",
                "MT2 Melatonin Receptor",
                "Melatonin Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "Opioid Receptors",
                "Oxytocin Receptors",
                "PAR-1 Receptor",
                "Prostaglandin E Receptors",
                "Prostaglandin Receptors",
                "Somatostatin Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Taste Receptors",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "alpha Adrenergic Receptors",
                "alpha-1 Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "delta Opioid Receptors",
                "kappa Opioid Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Beta-2 adrenergic receptor (ADRB2)",
            "Alpha-1 adrenergic receptor (ADRA1)",
            "Dopamine receptor D2 (DRD2)",
            "Serotonin 5-HT1A receptor (HTR1A)",
            "Histamine H1 receptor (HRH1)",
            "Muscarinic acetylcholine receptor M2 (CHRM2)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Cannabinoid receptor type 1 (CNR1)",
            "Vasopressin V1a receptor (AVPR1A)",
            "Opioid receptor mu 1 (OPRM1)",
            "Glucagon receptor (GCGR)",
            "Rhodopsin (RHO)",
            "Chemokine receptor type 4 (CXCR4)",
            "Frizzled class receptor 1 (FZD1)",
            "Metabotropic glutamate receptor 1 (GRM1)",
            "Prostaglandin E2 receptor EP3 subtype (PTGER3)",
            "Lysophosphatidic acid receptor 1 (LPAR1)",
            "Neuropeptide Y receptor Y1 (NPY1R)",
            "Endothelin receptor type A (EDNRA)",
            "Bradykinin receptor B2 (BDKRB2)",
            "Purinergic receptor P2Y12 (P2RY12)",
            "Melanocortin 4 receptor (MC4R)",
            "Somatostatin receptor 2 (SSTR2)",
            "Free fatty acid receptor 1 (FFAR1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "beta-2 Adrenergic Receptors",
                "alpha-1 Adrenergic Receptors",
                "Dopamine D2 Receptors",
                "5-HT1A Serotonin Receptor",
                "Histamine H1 Receptors",
                "Muscarinic M2 Receptor",
                "Type 1 Angiotensin Receptor",
                "CB1 Cannabinoid Receptor",
                "Vasopressin Receptors",
                "mu Opioid Receptors",
                "Glucagon Receptors",
                "Rhodopsin",
                "CXCR4 Receptors",
                "Frizzled Receptors",
                "Metabotropic Glutamate Receptors",
                "EP3 Subtype Prostaglandin E Receptors",
                "Lysophosphatidic Acid Receptors",
                "Neuropeptide Y Receptors",
                "Endothelin A Receptor",
                "Bradykinin B2 Receptor",
                "Purinergic P2Y12 Receptors",
                "Type 4 Melanocortin Receptor",
                "Somatostatin Receptors"
            ],
            "mismatches": [
                "Vasopressin V1a receptor (AVPR1A)",
                "Frizzled class receptor 1 (FZD1)",
                "Metabotropic glutamate receptor 1 (GRM1)",
                "Neuropeptide Y receptor Y1 (NPY1R)",
                "Somatostatin receptor 2 (SSTR2)",
                "Free fatty acid receptor 1 (FFAR1)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "Angiotensin Receptors",
                "Bradykinin B1 Receptor",
                "Bradykinin B2 Receptor",
                "Bradykinin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "CX3C Chemokine Receptor 1",
                "CXCR4 Receptors",
                "Cannabinoid Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "EP3 Subtype Prostaglandin E Receptors",
                "Endothelin A Receptor",
                "Endothelin B Receptor",
                "Endothelin Receptors",
                "FSH Receptors",
                "Frizzled Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "Lysophosphatidic Acid Receptors",
                "Lysophospholipid Receptors",
                "Melanocortin Receptors",
                "Metabotropic Glutamate 5 Receptor",
                "Metabotropic Glutamate Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M2 Receptor",
                "Muscarinic Receptors",
                "Neuropeptide Y Receptors",
                "Opioid Receptors",
                "PAR-1 Receptor",
                "Purinergic P2Y Receptors",
                "Purinergic P2Y1 Receptors",
                "Purinergic P2Y12 Receptors",
                "Purinergic P2Y2 Receptors",
                "Rhodopsin",
                "Smoothened Receptor",
                "Somatostatin Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 4 Melanocortin Receptor",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "alpha Adrenergic Receptors",
                "alpha-1 Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 23,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Beta-adrenergic receptor (ADRB1)",
            "Dopamine receptor D1 (DRD1)",
            "Serotonin receptor 5-HT1A (HTR1A)",
            "Histamine H1 receptor (HRH1)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "Opioid receptor mu (OPRM1)",
            "Vasopressin receptor V1A (AVPR1A)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Neurokinin 1 receptor (NK1R)",
            "Corticotropin-releasing hormone receptor 1 (CRHR1)",
            "Chemokine receptor CCR5 (CCR5)",
            "Thyrotropin-releasing hormone receptor (TRHR)",
            "Prostaglandin E receptor 2 (PTGER2)",
            "Endothelin receptor type A (EDNRA)",
            "Bradykinin B2 receptor (BDKRB2)",
            "Sphingosine-1-phosphate receptor 1 (S1PR1)",
            "Cannabinoid receptor 1 (CNR1)",
            "Platelet-activating factor receptor (PTAFR)",
            "Melanocortin receptor 4 (MC4R)",
            "Parathyroid hormone receptor 1 (PTH1R)",
            "Glucagon receptor (GCGR)",
            "Leptin receptor (LEPR)",
            "Ghrelin receptor (GHSR)",
            "Adrenomedullin receptor (ADMR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dopamine Receptors",
                "5-HT1A Serotonin Receptor",
                "Histamine H1 Receptors",
                "Muscarinic M1 Receptor",
                "mu Opioid Receptors",
                "Type 1 Angiotensin Receptor",
                "Neurokinin-1 Receptors",
                "Type 1 CRF Receptor",
                "CCR5 Receptors",
                "Prostaglandin E Receptors",
                "Endothelin A Receptor",
                "Bradykinin B2 Receptor",
                "Sphingosine-1-Phosphate Receptors",
                "CB1 Cannabinoid Receptor",
                "Type 4 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Glucagon Receptors",
                "Ghrelin Receptors",
                "Adrenomedullin Receptors"
            ],
            "mismatches": [
                "Beta-adrenergic receptor (ADRB1)",
                "Vasopressin receptor V1A (AVPR1A)",
                "Thyrotropin-releasing hormone receptor (TRHR)",
                "Platelet-activating factor receptor (PTAFR)",
                "Leptin receptor (LEPR)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Adrenergic Receptors",
                "Adrenomedullin Receptors",
                "Angiotensin Receptors",
                "Bradykinin B1 Receptor",
                "Bradykinin B2 Receptor",
                "Bradykinin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR Receptors",
                "CCR1 Receptors",
                "CCR5 Receptors",
                "Cannabinoid Receptors",
                "Corticotropin-Releasing Hormone Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "Endothelin A Receptor",
                "Endothelin B Receptor",
                "Endothelin Receptors",
                "Ghrelin Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "LHRH Receptors",
                "Lysosphingolipid Receptors",
                "Melanocortin Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "Neurokinin-1 Receptors",
                "Neurokinin-2 Receptors",
                "Neurokinin-3 Receptors",
                "Opioid Receptors",
                "PAR-1 Receptor",
                "PAR-2 Receptor",
                "Parathyroid Hormone Receptors",
                "Prostaglandin E Receptors",
                "Prostaglandin Receptors",
                "Somatostatin Receptors",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Thromboxane Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 CRF Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 4 Melanocortin Receptor",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "alpha Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Rhodopsin (RHO)",
            "Beta-2 adrenergic receptor (ADRB2)",
            "Alpha-1A adrenergic receptor (ADRA1A)",
            "Alpha-1B adrenergic receptor (ADRA1B)",
            "Alpha-1D adrenergic receptor (ADRA1D)",
            "Alpha-2A adrenergic receptor (ADRA2A)",
            "Alpha-2B adrenergic receptor (ADRA2B)",
            "Alpha-2C adrenergic receptor (ADRA2C)",
            "Beta-1 adrenergic receptor (ADRB1)",
            "Beta-3 adrenergic receptor (ADRB3)",
            "Dopamine receptor D1 (DRD1)",
            "Dopamine receptor D2 (DRD2)",
            "Dopamine receptor D3 (DRD3)",
            "Dopamine receptor D4 (DRD4)",
            "Dopamine receptor D5 (DRD5)",
            "Serotonin receptor 1A (HTR1A)",
            "Serotonin receptor 1B (HTR1B)",
            "Serotonin receptor 2A (HTR2A)",
            "Serotonin receptor 2B (HTR2B)",
            "Serotonin receptor 2C (HTR2C)",
            "Serotonin receptor 3A (HTR3A)",
            "Serotonin receptor 3B (HTR3B)",
            "Serotonin receptor 4 (HTR4)",
            "Serotonin receptor 5A (HTR5A)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin (RHO)",
                "Beta-2 adrenergic receptor (ADRB2)",
                "Beta-1 adrenergic receptor (ADRB1)",
                "Beta-3 adrenergic receptor (ADRB3)",
                "Dopamine receptor D1 (DRD1)",
                "Dopamine receptor D2 (DRD2)",
                "Dopamine receptor D3 (DRD3)",
                "Dopamine receptor D4 (DRD4)",
                "Dopamine receptor D5 (DRD5)",
                "Serotonin receptor 1A (HTR1A)",
                "Serotonin receptor 1B (HTR1B)",
                "Serotonin receptor 2A (HTR2A)",
                "Serotonin receptor 2B (HTR2B)",
                "Serotonin receptor 2C (HTR2C)",
                "Serotonin receptor 4 (HTR4)"
            ],
            "mismatches": [
                "Alpha-1A adrenergic receptor (ADRA1A)",
                "Alpha-1B adrenergic receptor (ADRA1B)",
                "Alpha-1D adrenergic receptor (ADRA1D)",
                "Alpha-2A adrenergic receptor (ADRA2A)",
                "Alpha-2B adrenergic receptor (ADRA2B)",
                "Alpha-2C adrenergic receptor (ADRA2C)",
                "Serotonin receptor 3A (HTR3A)",
                "Serotonin receptor 3B (HTR3B)",
                "Serotonin receptor 5A (HTR5A)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1B Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "5-HT2A Serotonin Receptor",
                "5-HT2B Serotonin Receptor",
                "5-HT2C Serotonin Receptor",
                "5-HT4 Serotonin Receptors",
                "Adrenergic Receptors",
                "CB1 Cannabinoid Receptor",
                "Dopamine D1 Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D3 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine D5 Receptors",
                "Dopamine Receptors",
                "Rhodopsin",
                "Serotonin Receptors",
                "alpha Adrenergic Receptors",
                "alpha-1 Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "beta-3 Adrenergic Receptors"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Beta-2 adrenergic receptor (ADRB2)",
            "Dopamine D2 receptor (DRD2)",
            "Serotonin 5-HT1A receptor (HTR1A)",
            "Histamine H1 receptor (HRH1)",
            "Glucagon receptor (GCGR)",
            "Adenosine A2A receptor (ADORA2A)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Cannabinoid receptor type 1 (CNR1)",
            "Mu-opioid receptor (OPRM1)",
            "Epinephrine receptor (ADRA1B)",
            "Melatonin receptor type 1A (MTNR1A)",
            "Prostaglandin E2 receptor EP3 subtype (PTGER3)",
            "Neurotensin receptor 1 (NTSR1)",
            "Oxytocin receptor (OXTR)",
            "Corticotropin-releasing factor receptor 1 (CRHR1)",
            "Sphingosine 1-phosphate receptor 1 (S1PR1)",
            "Vasopressin V2 receptor (AVPR2)",
            "Leukotriene B4 receptor (LTB4R)",
            "Thromboxane A2 receptor (TBXA2R)",
            "Cholecystokinin receptor type A (CCKAR)",
            "Neuropeptide Y receptor type 1 (NPY1R)",
            "Ghrelin receptor (GHSR)",
            "Frizzled class receptor 4 (FZD4)",
            "Neurokinin 1 receptor (TACR1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dopamine D2 receptor (DRD2)",
                "Serotonin 5-HT1A receptor (HTR1A)",
                "Histamine H1 receptor (HRH1)",
                "Glucagon receptor (GCGR)",
                "Adenosine A2A receptor (ADORA2A)",
                "Cannabinoid receptor type 1 (CNR1)",
                "Mu-opioid receptor (OPRM1)",
                "Melatonin receptor type 1A (MTNR1A)",
                "Prostaglandin E2 receptor EP3 subtype (PTGER3)",
                "Oxytocin receptor (OXTR)",
                "Corticotropin-releasing factor receptor 1 (CRHR1)",
                "Sphingosine 1-phosphate receptor 1 (S1PR1)",
                "Vasopressin V2 receptor (AVPR2)",
                "Leukotriene B4 receptor (LTB4R)",
                "Thromboxane A2 receptor (TBXA2R)",
                "Cholecystokinin receptor type A (CCKAR)",
                "Neuropeptide Y receptor type 1 (NPY1R)",
                "Ghrelin receptor (GHSR)",
                "Frizzled class receptor 4 (FZD4)",
                "Neurokinin 1 receptor (TACR1)"
            ],
            "mismatches": [
                "Beta-2 adrenergic receptor (ADRB2)",
                "Angiotensin II receptor type 1 (AGTR1)",
                "Epinephrine receptor (ADRA1B)",
                "Neurotensin receptor 1 (NTSR1)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Adenosine A2 Receptors",
                "Adenosine A2A Receptor",
                "Adenosine A2B Receptor",
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "Cannabinoid Receptors",
                "Cholecystokinin A Receptor",
                "Cholecystokinin B Receptor",
                "Cholecystokinin Receptors",
                "Corticotropin-Releasing Hormone Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "EP3 Subtype Prostaglandin E Receptors",
                "Eicosanoid Receptors",
                "Frizzled Receptors",
                "Ghrelin Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "Leukotriene B4 Receptors",
                "Leukotriene Receptors",
                "Lysosphingolipid Receptors",
                "MT1 Melatonin Receptor",
                "MT2 Melatonin Receptor",
                "Melatonin Receptors",
                "Neurokinin-1 Receptors",
                "Neurokinin-2 Receptors",
                "Neurokinin-3 Receptors",
                "Neuropeptide Y Receptors",
                "Neurotensin Receptors",
                "Opioid Receptors",
                "Oxytocin Receptors",
                "Prostaglandin H2 Thromboxane A2 Receptors",
                "Purinergic P2Y1 Receptors",
                "Purinergic P2Y2 Receptors",
                "Smoothened Receptor",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Thromboxane Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 CRF Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 2 Angiotensin Receptor",
                "Type II Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "kappa Opioid Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Beta-adrenergic receptor (\u03b2-AR)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "Dopamine receptor D2 (DRD2)",
            "Serotonin receptor 5-HT1A (HTR1A)",
            "Opioid receptor mu (OPRM1)",
            "Histamine receptor H1 (HRH1)",
            "Rhodopsin (RHO)",
            "Glutamate receptor mGluR5 (GRM5)",
            "Frizzled receptor (FZD)",
            "Chemokine receptor CXCR4",
            "Parathyroid hormone receptor (PTH1R)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Calcitonin receptor (CALCR)",
            "Cannabinoid receptor CB1 (CNR1)",
            "Taste receptor T1R3 (TAS1R3)",
            "Melatonin receptor MT1 (MTNR1A)",
            "Somatostatin receptor subtype 2 (SSTR2)",
            "Vasopressin receptor V1A (AVPR1A)",
            "Neuropeptide Y receptor Y1 (NPY1R)",
            "Prostaglandin E receptor EP2 (PTGER2)",
            "Sphingosine-1-phosphate receptor 1 (S1PR1)",
            "Relaxin receptor RXFP1",
            "Bombesin receptor subtype 3 (BRS3)",
            "Leukotriene B4 receptor 1 (BLT1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "beta Adrenergic Receptors",
                "Muscarinic M1 Receptor",
                "Dopamine D2 Receptors",
                "5-HT1A Serotonin Receptor",
                "mu Opioid Receptors",
                "Histamine H1 Receptors",
                "Rhodopsin",
                "Metabotropic Glutamate 5 Receptor",
                "Frizzled Receptors",
                "CXCR4 Receptors",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 1 Angiotensin Receptor",
                "Calcitonin Receptors",
                "CB1 Cannabinoid Receptor",
                "MT1 Melatonin Receptor",
                "Somatostatin Receptors",
                "Vasopressin Receptors",
                "Neuropeptide Y Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Bombesin Receptors",
                "Leukotriene B4 Receptors"
            ],
            "mismatches": [
                "Taste receptor T1R3 (TAS1R3)",
                "Relaxin receptor RXFP1"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "5-HT1F Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "Adenosine A3 Receptor",
                "Angiotensin Receptors",
                "Bombesin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR3 Receptors",
                "CCR4 Receptors",
                "CXCR4 Receptors",
                "Calcitonin Gene-Related Peptide Receptors",
                "Calcitonin Receptor-Like Protein",
                "Calcitonin Receptors",
                "Cannabinoid Receptors",
                "Chemokine Receptors",
                "Cholecystokinin B Receptor",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "Eicosanoid Receptors",
                "FSH Receptors",
                "Frizzled Receptors",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "Leukotriene B4 Receptors",
                "Leukotriene Receptors",
                "Lysosphingolipid Receptors",
                "MT1 Melatonin Receptor",
                "MT2 Melatonin Receptor",
                "Melatonin Receptors",
                "Metabotropic Glutamate 5 Receptor",
                "Metabotropic Glutamate Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic M5 Receptor",
                "Muscarinic Receptors",
                "Neurokinin-3 Receptors",
                "Neuropeptide Y Receptors",
                "Opioid Receptors",
                "PAR-1 Receptor",
                "Parathyroid Hormone Receptors",
                "Prostaglandin E Receptors",
                "Purinergic P2Y1 Receptors",
                "Purinergic P2Y2 Receptors",
                "Rhodopsin",
                "Smoothened Receptor",
                "Somatostatin Receptors",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 CRF Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 2 Taste Receptors",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Beta-2 adrenergic receptor (ADRB2)",
            "Dopamine D2 receptor (DRD2)",
            "Mu-opioid receptor (OPRM1)",
            "Serotonin 5-HT1A receptor (HTR1A)",
            "Cannabinoid receptor 1 (CNR1)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Glucagon-like peptide-1 receptor (GLP1R)",
            "Vasopressin V2 receptor (AVPR2)",
            "C-X-C chemokine receptor type 4 (CXCR4)",
            "Rhodopsin (RHO)",
            "Glucagon receptor (GCGR)",
            "Adenosine A2A receptor (ADORA2A)",
            "Histamine H1 receptor (HRH1)",
            "Gonadotropin-releasing hormone receptor (GNRHR)",
            "Melanocortin 4 receptor (MC4R)",
            "Calcitonin receptor (CALCR)",
            "Parathyroid hormone 1 receptor (PTH1R)",
            "Thyrotropin receptor (TSHR)",
            "Luteinizing hormone/choriogonadotropin receptor (LHCGR)",
            "Follicle-stimulating hormone receptor (FSHR)",
            "Metabotropic glutamate receptor 1 (GRM1)",
            "Prostaglandin E2 receptor EP4 subtype (PTGER4)",
            "Sphingosine-1-phosphate receptor 1 (S1PR1)",
            "Corticotropin-releasing hormone receptor 1 (CRHR1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Beta-2 adrenergic receptor (ADRB2)",
                "Dopamine D2 receptor (DRD2)",
                "Mu-opioid receptor (OPRM1)",
                "Serotonin 5-HT1A receptor (HTR1A)",
                "Cannabinoid receptor 1 (CNR1)",
                "Angiotensin II receptor type 1 (AGTR1)",
                "Glucagon-like peptide-1 receptor (GLP1R)",
                "Vasopressin V2 receptor (AVPR2)",
                "C-X-C chemokine receptor type 4 (CXCR4)",
                "Rhodopsin (RHO)",
                "Glucagon receptor (GCGR)",
                "Adenosine A2A receptor (ADORA2A)",
                "Histamine H1 receptor (HRH1)",
                "Calcitonin receptor (CALCR)",
                "Parathyroid hormone 1 receptor (PTH1R)",
                "Follicle-stimulating hormone receptor (FSHR)",
                "Prostaglandin E2 receptor EP4 subtype (PTGER4)",
                "Sphingosine-1-phosphate receptor 1 (S1PR1)",
                "Corticotropin-releasing hormone receptor 1 (CRHR1)"
            ],
            "mismatches": [
                "Gonadotropin-releasing hormone receptor (GNRHR)",
                "Melanocortin 4 receptor (MC4R)",
                "Thyrotropin receptor (TSHR)",
                "Luteinizing hormone/choriogonadotropin receptor (LHCGR)",
                "Metabotropic glutamate receptor 1 (GRM1)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Adenosine A2 Receptors",
                "Adenosine A2A Receptor",
                "Adenosine A2B Receptor",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "CX3C Chemokine Receptor 1",
                "CXCR4 Receptors",
                "Calcitonin Gene-Related Peptide Receptors",
                "Calcitonin Receptor-Like Protein",
                "Calcitonin Receptors",
                "Cannabinoid Receptors",
                "Corticotropin-Releasing Hormone Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "EP4 Subtype Prostaglandin E Receptors",
                "FSH Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "LHRH Receptors",
                "Lysosphingolipid Receptors",
                "Melanocortin Receptors",
                "Metabotropic Glutamate 5 Receptor",
                "Metabotropic Glutamate Receptors",
                "Opioid Receptors",
                "Parathyroid Hormone Receptors",
                "Rhodopsin",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 CRF Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 4 Melanocortin Receptor",
                "Type II Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "kappa Opioid Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Rhodopsin (Rho)",
            "Beta-2 adrenergic receptor (ADRB2)",
            "Dopamine D2 receptor (DRD2)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Vasopressin V1a receptor (AVPR1A)",
            "Serotonin 5-HT1A receptor (HTR1A)",
            "Cannabinoid receptor 1 (CNR1)",
            "Chemokine receptor CXCR4",
            "Adenosine A2A receptor (ADORA2A)",
            "Histamine H1 receptor (HRH1)",
            "Glucagon-like peptide-1 receptor (GLP1R)",
            "Parathyroid hormone receptor 1 (PTH1R)",
            "Sphingosine 1-phosphate receptor 1 (S1PR1)",
            "Melanocortin-4 receptor (MC4R)",
            "Prostaglandin E2 receptor EP2 subtype (PTGER2)",
            "Thyrotropin receptor (TSHR)",
            "Oxytocin receptor (OXTR)",
            "Endothelin receptor type A (EDNRA)",
            "Neuropeptide Y receptor Y1 (NPY1R)",
            "Opioid receptor mu 1 (OPRM1)",
            "Relaxin/insulin-like family peptide receptor 1 (RXFP1)",
            "Cholecystokinin receptor type A (CCKAR)",
            "Platelet-activating factor receptor (PTAFR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin",
                "beta-2 Adrenergic Receptors",
                "Dopamine D2 Receptors",
                "Muscarinic M1 Receptor",
                "Type 1 Angiotensin Receptor",
                "Vasopressin Receptors",
                "5-HT1A Serotonin Receptor",
                "CB1 Cannabinoid Receptor",
                "CXCR4 Receptors",
                "Adenosine A2A Receptor",
                "Histamine H1 Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Sphingosine-1-Phosphate Receptors",
                "Type 4 Melanocortin Receptor",
                "EP2 Subtype Prostaglandin E Receptors",
                "Oxytocin Receptors",
                "Endothelin A Receptor",
                "Neuropeptide Y Receptors",
                "mu Opioid Receptors",
                "Cholecystokinin A Receptor"
            ],
            "mismatches": [
                "Thyrotropin receptor (TSHR)",
                "Relaxin/insulin-like family peptide receptor 1 (RXFP1)",
                "Platelet-activating factor receptor (PTAFR)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Adenosine A2 Receptors",
                "Adenosine A2A Receptor",
                "Adenosine A2B Receptor",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "CXCR4 Receptors",
                "Cannabinoid Receptors",
                "Chemokine Receptors",
                "Cholecystokinin A Receptor",
                "Cholecystokinin B Receptor",
                "Cholecystokinin Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "EP3 Subtype Prostaglandin E Receptors",
                "Endothelin A Receptor",
                "Endothelin B Receptor",
                "Endothelin Receptors",
                "FSH Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "LHRH Receptors",
                "Lysosphingolipid Receptors",
                "Melanocortin Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "Neuropeptide Y Receptors",
                "Opioid Receptors",
                "Oxytocin Receptors",
                "PAR-1 Receptor",
                "PAR-2 Receptor",
                "Parathyroid Hormone Receptors",
                "Purinergic P2Y1 Receptors",
                "Purinergic P2Y2 Receptors",
                "Rhodopsin",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Thromboxane Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 CRF Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 4 Melanocortin Receptor",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Rhodopsin (OPN1SW)",
            "\u03b22-adrenergic receptor (ADRB2)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "Dopamine receptor D2 (DRD2)",
            "Serotonin receptor 1A (HTR1A)",
            "Chemokine receptor CXCR4 (CXCR4)",
            "Endothelin receptor type A (EDNRA)",
            "Histamine H1 receptor (HRH1)",
            "Melanocortin receptor 4 (MC4R)",
            "Parathyroid hormone receptor 1 (PTH1R)",
            "Protease-activated receptor 1 (F2R)",
            "Sphingosine 1-phosphate receptor 1 (S1PR1)",
            "Thromboxane A2 receptor (TBXA2R)",
            "Vasopressin V2 receptor (AVPR2)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Cannabinoid receptor 1 (CNR1)",
            "Glucagon receptor (GCGR)",
            "Oxytocin receptor (OXTR)",
            "Prostaglandin E2 receptor EP4 subtype (PTGER4)",
            "Thyrotropin-releasing hormone receptor (TRHR)",
            "Urotensin II receptor (UTS2R)",
            "Vasoactive intestinal polypeptide receptor 1 (VIPR1)",
            "Gonadotropin-releasing hormone receptor (GNRHR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin",
                "beta-2 Adrenergic Receptors",
                "Muscarinic M1 Receptor",
                "Dopamine D2 Receptors",
                "5-HT1A Serotonin Receptor",
                "CXCR4 Receptors",
                "Endothelin A Receptor",
                "Histamine H1 Receptors",
                "Type 4 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "PAR-1 Receptor",
                "Sphingosine-1-Phosphate Receptors",
                "Prostaglandin H2 Thromboxane A2 Receptors",
                "Vasopressin Receptors",
                "Type 1 Angiotensin Receptor",
                "CB1 Cannabinoid Receptor",
                "Glucagon Receptors",
                "Oxytocin Receptors",
                "EP4 Subtype Prostaglandin E Receptors",
                "Vasoactive Intestinal Polypeptide Receptors",
                "LHRH Receptors"
            ],
            "mismatches": [
                "Thyrotropin-releasing hormone receptor (TRHR)",
                "Urotensin II receptor (UTS2R)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "CXCR4 Receptors",
                "Cannabinoid Receptors",
                "Chemokine Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "EP4 Subtype Prostaglandin E Receptors",
                "Endothelin A Receptor",
                "Endothelin B Receptor",
                "Endothelin Receptors",
                "FSH Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "LHRH Receptors",
                "Lysosphingolipid Receptors",
                "Melanocortin Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "Oxytocin Receptors",
                "PAR-1 Receptor",
                "PAR-2 Receptor",
                "Parathyroid Hormone Receptors",
                "Prostaglandin H2 Thromboxane A2 Receptors",
                "Purinergic P2X2 Receptors",
                "Rhodopsin",
                "Somatostatin Receptors",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Thromboxane Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 4 Melanocortin Receptor",
                "Type I Vasoactive Intestinal Polypeptide Receptors",
                "Type II Vasoactive Intestinal Peptide Receptors",
                "Vasoactive Intestinal Peptide Receptors",
                "Vasopressin Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors"
            ],
            "TP": 21,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Rhodopsin (RHO)",
            "Adrenergic Receptor Beta 2 (ADRB2)",
            "Muscarinic Acetylcholine Receptor M1 (CHRM1)",
            "Serotonin Receptor 1A (HTR1A)",
            "Dopamine Receptor D1 (DRD1)",
            "Histamine Receptor H1 (HRH1)",
            "Angiotensin II Receptor Type 1 (AGTR1)",
            "Cannabinoid Receptor 1 (CNR1)",
            "Luteinizing Hormone Receptor (LHCGR)",
            "Follicle-Stimulating Hormone Receptor (FSHR)",
            "Thyroid-Stimulating Hormone Receptor (TSHR)",
            "Prostaglandin E2 Receptor EP1 (PTGER1)",
            "Leukotriene B4 Receptor (LTB4R)",
            "Chemokine Receptor Type 4 (CXCR4)",
            "Lysophosphatidic Acid Receptor 1 (LPAR1)",
            "Sphingosine 1-Phosphate Receptor 1 (S1PR1)",
            "Protease-Activated Receptor 1 (F2R)",
            "Melatonin Receptor Type 1A (MTNR1A)",
            "Neuropeptide Y Receptor Type 1 (NPY1R)",
            "Opioid Receptor Mu 1 (OPRM1)",
            "Glucagon Receptor (GCGR)",
            "Adenosine A2A Receptor (ADORA2A)",
            "Metabotropic Glutamate Receptor 1 (GRM1)",
            "Frizzled Class Receptor 4 (FZD4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin",
                "beta-2 Adrenergic Receptors",
                "Muscarinic M1 Receptor",
                "5-HT1A Serotonin Receptor",
                "Dopamine D1 Receptors",
                "Histamine H1 Receptors",
                "Type 1 Angiotensin Receptor",
                "CB1 Cannabinoid Receptor",
                "LH Receptors",
                "FSH Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "Leukotriene B4 Receptors",
                "CXCR4 Receptors",
                "Lysophosphatidic Acid Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "PAR-1 Receptor",
                "MT1 Melatonin Receptor",
                "Neuropeptide Y Receptors",
                "mu Opioid Receptors",
                "Glucagon Receptors",
                "Adenosine A2A Receptor",
                "Metabotropic Glutamate Receptors",
                "Frizzled Receptors"
            ],
            "mismatches": [
                "Thyroid-Stimulating Hormone Receptor (TSHR)"
            ],
            "true_referents": [
                "5-HT1 Serotonin Receptors",
                "5-HT1A Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "Adenosine A2 Receptors",
                "Adenosine A2A Receptor",
                "Adenosine A2B Receptor",
                "Angiotensin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "CX3C Chemokine Receptor 1",
                "CXCR4 Receptors",
                "Cannabinoid Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "Eicosanoid Receptors",
                "FSH Receptors",
                "Frizzled Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "LHRH Receptors",
                "Leukotriene B4 Receptors",
                "Leukotriene Receptors",
                "Lysophosphatidic Acid Receptors",
                "Lysophospholipid Receptors",
                "Lysosphingolipid Receptors",
                "MT1 Melatonin Receptor",
                "MT2 Melatonin Receptor",
                "Melatonin Receptors",
                "Metabotropic Glutamate 5 Receptor",
                "Metabotropic Glutamate Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "Neuropeptide Y Receptors",
                "Opioid Receptors",
                "PAR-1 Receptor",
                "PAR-2 Receptor",
                "Prostaglandin E Receptors",
                "Purinergic P2Y1 Receptors",
                "Purinergic P2Y2 Receptors",
                "Rhodopsin",
                "Smoothened Receptor",
                "Sphingosine Phosphorylcholine Receptors",
                "Sphingosine-1-Phosphate Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "alpha-2 Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "mu Opioid Receptors"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Adenosine receptor (A1R)",
            "Adrenergic receptor (\u03b22AR)",
            "Angiotensin receptor (AT1R)",
            "Bombesin receptor (BRS-3)",
            "Calcitonin receptor (CTR)",
            "Cholecystokinin receptor (CCK1R)",
            "Dopamine receptor (D1R)",
            "Endothelin receptor (ETAR)",
            "Estrogen receptor (ER\u03b1)",
            "Fibroblast growth factor receptor (FGFR1)",
            "Formyl peptide receptor (FPR1)",
            "Galanin receptor (GALR1)",
            "Glucagon receptor (GCGR)",
            "Histamine receptor (H1R)",
            "Leukotriene receptor (BLT1)",
            "Melatonin receptor (MT1R)",
            "Neurokinin receptor (NK1R)",
            "Norepinephrine receptor (\u03b12AR)",
            "Oxytocin receptor (OXTR)",
            "Parathyroid hormone receptor (PTH1R)",
            "Prolactin receptor (PRLR)",
            "Prostaglandin receptor (PGD2R)",
            "Somatostatin receptor (SSTR2)",
            "Thyrotropin receptor (TSHR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adenosine A1 Receptor",
                "Adrenergic Receptors",
                "Type 1 Angiotensin Receptor",
                "Bombesin Receptors",
                "Calcitonin Receptors",
                "Cholecystokinin A Receptor",
                "Dopamine D1 Receptors",
                "Endothelin A Receptor",
                "Formyl Peptide Receptors",
                "Type 1 Galanin Receptor",
                "Glucagon Receptors",
                "Histamine H1 Receptors",
                "Leukotriene B4 Receptors",
                "MT1 Melatonin Receptor",
                "Neurokinin-1 Receptors",
                "Oxytocin Receptors",
                "Type 1 Parathyroid Hormone Receptor",
                "Prostaglandin Receptors",
                "Somatostatin Receptors"
            ],
            "mismatches": [
                "Estrogen receptor (ER\u03b1)",
                "Fibroblast growth factor receptor (FGFR1)",
                "Norepinephrine receptor (\u03b12AR)",
                "Prolactin receptor (PRLR)",
                "Thyrotropin receptor (TSHR)"
            ],
            "true_referents": [
                "5-HT1D Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "Adenosine A1 Receptor",
                "Adenosine A2A Receptor",
                "Adenosine A3 Receptor",
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "Bombesin Receptors",
                "Calcitonin Gene-Related Peptide Receptors",
                "Calcitonin Receptor-Like Protein",
                "Calcitonin Receptors",
                "Cholecystokinin A Receptor",
                "Cholecystokinin B Receptor",
                "Cholecystokinin Receptors",
                "Dopamine D1 Receptors",
                "Dopamine Receptors",
                "Eicosanoid Receptors",
                "Endothelin A Receptor",
                "Endothelin B Receptor",
                "Endothelin Receptors",
                "FSH Receptors",
                "Formyl Peptide Receptors",
                "Galanin Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "LH Receptors",
                "LHRH Receptors",
                "Leukotriene B4 Receptors",
                "Leukotriene Receptors",
                "MT1 Melatonin Receptor",
                "MT2 Melatonin Receptor",
                "Melatonin Receptors",
                "Neurokinin-1 Receptors",
                "Neurokinin-2 Receptors",
                "Neurokinin-3 Receptors",
                "Oxytocin Receptors",
                "PAR-1 Receptor",
                "Parathyroid Hormone Receptors",
                "Prostaglandin E Receptors",
                "Prostaglandin Receptors",
                "Smoothened Receptor",
                "Somatostatin Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Galanin Receptor",
                "Type 1 Parathyroid Hormone Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 2 Parathyroid Hormone Receptor",
                "Type 3 Galanin Receptor",
                "Vasopressin Receptors",
                "alpha Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": [
            "Adrenergic receptor alpha 1 (ADRA1A)",
            "Adrenergic receptor alpha 2 (ADRA2A)",
            "Adrenergic receptor beta 1 (ADRB1)",
            "Adrenergic receptor beta 2 (ADRB2)",
            "Angiotensin II receptor type 1 (AGTR1)",
            "Angiotensin II receptor type 2 (AGTR2)",
            "B2 bradykinin receptor (BDKRB2)",
            "Calcitonin receptor (CALCR)",
            "Chemokine receptor 4 (CXCR4)",
            "Chemokine receptor 5 (CXCR5)",
            "Dopamine receptor D1 (DRD1)",
            "Dopamine receptor D2 (DRD2)",
            "GABA B receptor 1 (GABBR1)",
            "GABA B receptor 2 (GABBR2)",
            "Glucagon receptor (GCGR)",
            "Glutamate receptor 1 (GRM1)",
            "Glutamate receptor 2 (GRM2)",
            "Glutamate receptor 3 (GRM3)",
            "Glutamate receptor 4 (GRM4)",
            "Histamine receptor H1 (HRH1)",
            "Histamine receptor H2 (HRH2)",
            "Melanocortin 1 receptor (MC1R)",
            "Melanocortin 4 receptor (MC4R)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "Muscarinic acetylcholine receptor M2 (CHRM2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "alpha-1 Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 2 Angiotensin Receptor",
                "Bradykinin B2 Receptor",
                "Calcitonin Receptors",
                "CXCR4 Receptors",
                "CXCR5 Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D2 Receptors",
                "GABA-B Receptors",
                "Glucagon Receptors",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Type 1 Melanocortin Receptor",
                "Type 4 Melanocortin Receptor",
                "Muscarinic M1 Receptor"
            ],
            "mismatches": [
                "GABA B receptor 1 (GABBR1)",
                "GABA B receptor 2 (GABBR2)",
                "Glutamate receptor 1 (GRM1)",
                "Glutamate receptor 2 (GRM2)",
                "Glutamate receptor 3 (GRM3)",
                "Glutamate receptor 4 (GRM4)",
                "Muscarinic acetylcholine receptor M2 (CHRM2)"
            ],
            "true_referents": [
                "5-HT1B Serotonin Receptor",
                "5-HT1D Serotonin Receptor",
                "5-HT2 Serotonin Receptors",
                "5-HT2B Serotonin Receptor",
                "5-HT4 Serotonin Receptors",
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "Bradykinin B1 Receptor",
                "Bradykinin B2 Receptor",
                "Bradykinin Receptors",
                "CB1 Cannabinoid Receptor",
                "CB2 Cannabinoid Receptor",
                "CCR4 Receptors",
                "CCR5 Receptors",
                "CX3C Chemokine Receptor 1",
                "CXCR4 Receptors",
                "CXCR5 Receptors",
                "Calcitonin Gene-Related Peptide Receptors",
                "Calcitonin Receptor-Like Protein",
                "Calcitonin Receptors",
                "Dopamine D1 Receptors",
                "Dopamine D2 Receptors",
                "Dopamine D4 Receptors",
                "Dopamine Receptors",
                "GABA-B Receptors",
                "Glucagon Receptors",
                "Glucagon-Like Peptide Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Histamine H1 Receptors",
                "Histamine H2 Receptors",
                "Histamine H4 Receptors",
                "Melanocortin Receptors",
                "Metabotropic Glutamate 5 Receptor",
                "Metabotropic Glutamate Receptors",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "Neurokinin-2 Receptors",
                "Neurokinin-3 Receptors",
                "Type 1 Angiotensin Receptor",
                "Type 1 Melanocortin Receptor",
                "Type 2 Angiotensin Receptor",
                "Type 3 Galanin Receptor",
                "Type 3 Melanocortin Receptor",
                "Type 4 Melanocortin Receptor",
                "alpha Adrenergic Receptors",
                "alpha-1 Adrenergic Receptors",
                "alpha-2 Adrenergic Receptors",
                "beta Adrenergic Receptors",
                "beta-1 Adrenergic Receptors",
                "beta-2 Adrenergic Receptors"
            ],
            "TP": 19,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "g-protein coupled receptor",
        "domain": "biology",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]