[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Annexin A1 (ANXA1)",
            "Annexin A2 (ANXA2)",
            "Annexin A5 (ANXA5)",
            "Annexin A6 (ANXA6)",
            "Annexin A7 (ANXA7)",
            "Annexin A11 (ANXA11)",
            "Bacteriorhodopsin (BR)",
            "Beta-amyloid precursor protein (APP)",
            "Claudin-1 (CLDN1)",
            "Connexin 43 (GJA1)",
            "Dysferlin (DYSF)",
            "Epidermal growth factor receptor (EGFR)",
            "Inward rectifier potassium channel (Kir)",
            "Lipid phosphate phosphatase 3 (LPP3)",
            "Major histocompatibility complex class I (MHC I)",
            "Niemann-Pick C1 (NPC1)",
            "Pannexin 1 (PANX1)",
            "Peroxisomal membrane protein 70 (PEX70)",
            "Peroxisomal membrane protein 11 (PEX11)",
            "Peroxisomal membrane protein 14 (PEX14)",
            "Peroxisomal membrane protein 34 (PEX34)",
            "Peroxisomal membrane protein 36 (PEX36)",
            "Peroxisomal membrane protein 46 (PEX46)",
            "Sodium-hydrogen exchanger (NHE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bacteriorhodopsin (BR)",
                "Claudin-1 (CLDN1)",
                "Connexin 43 (GJA1)",
                "Dysferlin (DYSF)",
                "Niemann-Pick C1 (NPC1)"
            ],
            "mismatches": [
                "Annexin A1 (ANXA1)",
                "Annexin A2 (ANXA2)",
                "Annexin A5 (ANXA5)",
                "Annexin A6 (ANXA6)",
                "Annexin A7 (ANXA7)",
                "Annexin A11 (ANXA11)",
                "Beta-amyloid precursor protein (APP)",
                "Epidermal growth factor receptor (EGFR)",
                "Inward rectifier potassium channel (Kir)",
                "Lipid phosphate phosphatase 3 (LPP3)",
                "Major histocompatibility complex class I (MHC I)",
                "Pannexin 1 (PANX1)",
                "Peroxisomal membrane protein 70 (PEX70)",
                "Peroxisomal membrane protein 11 (PEX11)",
                "Peroxisomal membrane protein 14 (PEX14)",
                "Peroxisomal membrane protein 34 (PEX34)",
                "Peroxisomal membrane protein 36 (PEX36)",
                "Peroxisomal membrane protein 46 (PEX46)",
                "Sodium-hydrogen exchanger (NHE)"
            ],
            "true_referents": [
                "Amyloid beta-Protein Precursor",
                "Anoctamin-1",
                "Aquaporin 6",
                "Bacteriorhodopsins",
                "Caveolin 3",
                "Class III Phosphatidylinositol 3-Kinases",
                "Claudin-1",
                "Claudin-3",
                "Claudin-5",
                "Connexin 26",
                "Connexin 43",
                "Connexins",
                "Dysbindin",
                "Dysferlin",
                "Ephrin-A5",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "Fatty Acid Transport Proteins",
                "G Protein-Coupled Inwardly-Rectifying Potassium Channels",
                "HLA-A1 Antigen",
                "HLA-A11 Antigen",
                "Halorhodopsins",
                "Histocompatibility Antigens Class I",
                "Histocompatibility Antigens Class II",
                "Integrin alpha1",
                "Integrin alpha2",
                "Integrin alpha5",
                "Integrin alpha6",
                "Inwardly Rectifying Potassium Channels",
                "Lysosomal-Associated Membrane Protein 3",
                "Member 11 Subfamily B ATP Binding Cassette Transporter",
                "Membrane Cofactor Protein",
                "Niemann-Pick C1 Protein",
                "Peroxisomal Biogenesis Factor 2",
                "Presenilin-1",
                "Presenilin-2",
                "Rhodopsin",
                "SLC31 Proteins",
                "Sodium-Hydrogen Exchanger 1",
                "Voltage-Dependent Anion Channel 2",
                "alpha7 Nicotinic Acetylcholine Receptor"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Adenylate cyclase (AC)",
            "Aquaporin (AQP)",
            "Bacteriorhodopsin",
            "Calmodulin",
            "Calsequestrin",
            "Clathrin",
            "Connexin",
            "Cytochrome c oxidase (Complex IV)",
            "Ferredoxin-NADP+ reductase",
            "Glycerol-3-phosphate dehydrogenase",
            "Glucose transporter (GLUT)",
            "Glycophorin",
            "Hemoglobin (intracellular in erythrocytes)",
            "Heterotrimeric G protein",
            "Integrin",
            "Insulin receptor",
            "Ion channel (various types, e.g., voltage-gated potassium channels)",
            "Lactose permease",
            "Lipid-anchored protein",
            "Na+/K+-ATPase",
            "Nicotinic acetylcholine receptor",
            "NMDA receptor",
            "Phospholamban",
            "Protein kinase C (PKC)",
            "Ryanodine receptor"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bacteriorhodopsin",
                "Clathrin",
                "Connexin",
                "Insulin receptor",
                "Na+/K+-ATPase",
                "Nicotinic acetylcholine receptor",
                "NMDA receptor"
            ],
            "mismatches": [
                "Adenylate cyclase (AC)",
                "Aquaporin (AQP)",
                "Calmodulin",
                "Calsequestrin",
                "Cytochrome c oxidase (Complex IV)",
                "Ferredoxin-NADP+ reductase",
                "Glycerol-3-phosphate dehydrogenase",
                "Glucose transporter (GLUT)",
                "Glycophorin",
                "Hemoglobin (intracellular in erythrocytes)",
                "Heterotrimeric G protein",
                "Integrin",
                "Ion channel (various types, e.g., voltage-gated potassium channels)",
                "Lactose permease",
                "Lipid-anchored protein",
                "Phospholamban",
                "Protein kinase C (PKC)",
                "Ryanodine receptor"
            ],
            "true_referents": [
                "Amino Acid Transport System L",
                "Aquaporin 1",
                "Aquaporins",
                "Bacteriorhodopsins",
                "Calcium Channels",
                "Calnexin",
                "Chloride-Bicarbonate Antiporters",
                "Class III Phosphatidylinositol 3-Kinases",
                "Clathrin",
                "Clathrin Heavy Chains",
                "Clathrin Light Chains",
                "Connexin 30",
                "Connexin 43",
                "Connexins",
                "Cyclic AMP Receptors",
                "Electron Transport Complex I",
                "Electron Transport Complex IV",
                "Erythrocyte Anion Exchange Protein 1",
                "G-Protein-Coupled Receptors",
                "Gi-Go GTP-Binding Protein alpha Subunits",
                "Glucose Transporter Type 1",
                "Glucose Transporter Type 3",
                "Glucose Transporter Type 5",
                "Halorhodopsins",
                "Heterotrimeric GTP-Binding Proteins",
                "Hyperpolarization-Activated Cyclic Nucleotide-Gated Channels",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Ion Channels",
                "LDL-Receptor Related Protein-Associated Protein",
                "Lipid-Linked Proteins",
                "Lysosomal-Associated Membrane Protein 1",
                "Membrane Glycoproteins",
                "N-Methyl-D-Aspartate Receptors",
                "Nicotinic Receptors",
                "P-Type Calcium Channels",
                "Phospholipase A2 Receptors",
                "Plastoquinol-Plastocyanin Reductase",
                "Potassium Channels",
                "Rhodopsin",
                "Sarcoglycans",
                "Sarcoplasmic Reticulum Calcium-Transporting ATPases",
                "Sodium-Potassium-Exchanging ATPase",
                "Succinate Dehydrogenase",
                "trkC Receptor"
            ],
            "TP": 7,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Aquaporin (AQP)",
            "Cytochrome P450",
            "Glycophorin",
            "Band 3 protein",
            "Glucagon-like peptide-1 receptor (GLP-1R)",
            "G-protein-coupled receptor (GPCR)",
            "Ion channel (e.g., voltage-gated sodium channel)",
            "Insulin receptor",
            "Integrin",
            "Epidermal growth factor receptor (EGFR)",
            "Transferrin receptor",
            "Low-density lipoprotein receptor (LDLR)",
            "Fibroblast growth factor receptor (FGFR)",
            "Platelet-derived growth factor receptor (PDGFR)",
            "Vascular endothelial growth factor receptor (VEGFR)",
            "Nerve growth factor receptor (NGFR)",
            "Transforming growth factor beta receptor (TGFBR)",
            "Erythropoietin receptor (EPOR)",
            "Protein kinase C (PKC)",
            "Adenylyl cyclase",
            "Rhodopsin",
            "Opsin",
            "Chloride channel",
            "Potassium channel"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucagon-like peptide-1 receptor (GLP-1R)",
                "G-protein-coupled receptor (GPCR)",
                "Insulin receptor",
                "Integrin",
                "Transferrin receptor",
                "Rhodopsin",
                "Chloride channel",
                "Potassium channel",
                "Erythropoietin receptor (EPOR)"
            ],
            "mismatches": [
                "Aquaporin (AQP)",
                "Cytochrome P450",
                "Glycophorin",
                "Band 3 protein",
                "Ion channel (e.g., voltage-gated sodium channel)",
                "Epidermal growth factor receptor (EGFR)",
                "Low-density lipoprotein receptor (LDLR)",
                "Fibroblast growth factor receptor (FGFR)",
                "Platelet-derived growth factor receptor (PDGFR)",
                "Vascular endothelial growth factor receptor (VEGFR)",
                "Nerve growth factor receptor (NGFR)",
                "Transforming growth factor beta receptor (TGFBR)",
                "Protein kinase C (PKC)",
                "Adenylyl cyclase",
                "Opsin"
            ],
            "true_referents": [
                "Aquaporin 1",
                "Aquaporins",
                "Bacterial Transferrin Receptor Complex",
                "CLC-2 Chloride Channels",
                "Channelrhodopsins",
                "Chloride Channels",
                "Class III Phosphatidylinositol 3-Kinases",
                "Clathrin",
                "Cyclic AMP Receptors",
                "Cyclic Nucleotide-Gated Cation Channels",
                "Dual Oxidases",
                "Edar Receptor",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "Erythropoietin Receptors",
                "G-Protein-Coupled Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Halorhodopsins",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Ion Channels",
                "LDL Receptors",
                "LDL-Receptor Related Proteins",
                "Low Density Lipoprotein Receptor-Related Protein-1",
                "Member 3 Subfamily B ATP Binding Cassette Transporter",
                "Membrane Glycoproteins",
                "NADPH Oxidase 1",
                "NADPH Oxidases",
                "Nerve Growth Factor Receptor",
                "Nerve Growth Factor Receptors",
                "Neuropeptide Receptors",
                "Platelet-Derived Growth Factor Receptors",
                "Platelet-Derived Growth Factor alpha Receptor",
                "Potassium Channels",
                "Rhodopsin",
                "Sarcoglycans",
                "Sodium Channels",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Transforming Growth Factor-beta Type I Receptor",
                "Transforming Growth Factor-beta Type II Receptor",
                "Type 1 Fibroblast Growth Factor Receptor",
                "Type 5 Fibroblast Growth Factor Receptor",
                "Vascular Endothelial Growth Factor Receptor-1",
                "Vascular Endothelial Growth Factor Receptor-2",
                "beta-Arrestin 1",
                "trkA Receptor",
                "trkC Receptor"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Bacteriorhodopsin (BR)",
            "Aquaporin-4 (AQP4)",
            "Sodium-Potassium ATPase (Na+/K+ ATPase)",
            "Glucose Transporter 1 (GLUT1)",
            "Ryanodine Receptor (RyR)",
            "Inositol Trisphosphate Receptor (IP3R)",
            "G-Protein Coupled Receptor (GPCR)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Integrin \u03b15\u03b21",
            "CD4 (CD4)",
            "Major Histocompatibility Complex Class I (MHC-I)",
            "Major Histocompatibility Complex Class II (MHC-II)",
            "Programmed cell death protein 1 (PD-1)",
            "Cytotoxic T-lymphocyte-associated protein 4 (CTLA-4)",
            "Voltage-Dependent Anion Channel 1 (VDAC1)",
            "Mitochondrial Phosphate Carrier (MPC)",
            "SERCA (SERCA)",
            "Plasma Membrane Calcium ATPase (PMCA)",
            "Fas Receptor (Fas)",
            "Transferrin Receptor (TfR)",
            "Low-Density Lipoprotein Receptor (LDLR)",
            "Amyloid Precursor Protein (APP)",
            "Dystrophin (DMD)",
            "Connexin 43 (Cx43)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aquaporin-4 (AQP4)",
                "Bacteriorhodopsin (BR)",
                "CD4 (CD4)",
                "Cytotoxic T-lymphocyte-associated protein 4 (CTLA-4)",
                "Glucose Transporter 1 (GLUT1)",
                "G-Protein Coupled Receptor (GPCR)",
                "Inositol Trisphosphate Receptor (IP3R)",
                "Integrin \u03b15\u03b21",
                "Low-Density Lipoprotein Receptor (LDLR)",
                "Programmed cell death protein 1 (PD-1)",
                "Ryanodine Receptor (RyR)",
                "Voltage-Dependent Anion Channel 1 (VDAC1)",
                "Fas Receptor (Fas)",
                "Transferrin Receptor (TfR)",
                "Amyloid Precursor Protein (APP)",
                "Dystrophin (DMD)",
                "Connexin 43 (Cx43)"
            ],
            "mismatches": [
                "Sodium-Potassium ATPase (Na+/K+ ATPase)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "Major Histocompatibility Complex Class I (MHC-I)",
                "Major Histocompatibility Complex Class II (MHC-II)",
                "Mitochondrial Phosphate Carrier (MPC)",
                "SERCA (SERCA)",
                "Plasma Membrane Calcium ATPase (PMCA)"
            ],
            "true_referents": [
                "5-HT1A Serotonin Receptor",
                "Amyloid beta-Protein Precursor",
                "Aquaporin 1",
                "Aquaporin 4",
                "Bacterial Transferrin Receptor Complex",
                "Bacteriorhodopsins",
                "CD4 Antigens",
                "CD4 Immunoadhesins",
                "CTLA-4 Antigen",
                "Calcium-Transporting ATPases",
                "Class III Phosphatidylinositol 3-Kinases",
                "Connexin 26",
                "Connexin 43",
                "Connexins",
                "Dystroglycans",
                "Dystrophin",
                "Dystrophin-Associated Proteins",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "Fas Ligand Protein",
                "G-Protein-Coupled Receptors",
                "Glucose Transporter Type 1",
                "HLA-A1 Antigen",
                "HLA-A2 Antigen",
                "HLA-B7 Antigen",
                "Halorhodopsins",
                "Histocompatibility Antigens Class I",
                "Histocompatibility Antigens Class II",
                "Inositol 1,4,5-Trisphosphate Receptors",
                "Integrin alpha5beta1",
                "LDL Receptors",
                "LDL-Receptor Related Proteins",
                "Low Density Lipoprotein Receptor-Related Protein-1",
                "Mitochondrial Membrane Transport Proteins",
                "Neuropeptide Receptors",
                "Plasma Membrane Calcium-Transporting ATPases",
                "Presenilin-1",
                "Presenilin-2",
                "Programmed Cell Death 1 Ligand 2 Protein",
                "Programmed Cell Death 1 Receptor",
                "Proton-Phosphate Symporters",
                "R-Type Calcium Channels",
                "Rhodopsin",
                "Ryanodine Receptor Calcium Release Channel",
                "Sodium-Glucose Transporter 1",
                "Sodium-Potassium-Exchanging ATPase",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Voltage-Dependent Anion Channel 1",
                "beta-Arrestin 1",
                "fas Receptor"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Aquaporin (AQP)",
            "ATP synthase (Complex V)",
            "Cytochrome c oxidase (Complex IV)",
            "Glucose transporter 1 (GLUT1)",
            "Sodium-potassium pump (Na+/K+ ATPase)",
            "Calcium pump (Ca2+ ATPase)",
            "Voltage-gated sodium channel (Nav)",
            "Voltage-gated potassium channel (Kv)",
            "Voltage-gated calcium channel (Cav)",
            "Rhodopsin",
            "G-protein coupled receptor (GPCR)",
            "Epidermal growth factor receptor (EGFR)",
            "Insulin receptor",
            "Transferrin receptor",
            "Nicotinic acetylcholine receptor (nAChR)",
            "Serotonin receptor",
            "Dopamine receptor",
            "Histamine receptor",
            "Beta-adrenergic receptor",
            "Integrin",
            "Cadherin",
            "Connexin",
            "Claudin",
            "Occludin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aquaporin 1",
                "Glucose Transporter Type 1",
                "Sodium-Potassium-Exchanging ATPase",
                "Calcium-Transporting ATPases",
                "Voltage-Gated Potassium Channels",
                "Rhodopsin",
                "G-Protein-Coupled Receptors",
                "Insulin Receptor",
                "Transferrin Receptors",
                "Nicotinic Receptors",
                "Serotonin Receptors",
                "Dopamine Receptors",
                "Histamine Receptors",
                "Integrins",
                "Cadherins",
                "Connexins",
                "Claudins",
                "Occludin"
            ],
            "mismatches": [
                "ATP synthase (Complex V)",
                "Cytochrome c oxidase (Complex IV)",
                "Voltage-gated sodium channel (Nav)",
                "Voltage-gated calcium channel (Cav)",
                "Epidermal growth factor receptor (EGFR)",
                "Beta-adrenergic receptor"
            ],
            "true_referents": [
                "Aquaporin 1",
                "Aquaporins",
                "Bacterial Transferrin Receptor Complex",
                "Cadherin Related Proteins",
                "Cadherins",
                "Calcium Channels",
                "Calcium-Transporting ATPases",
                "Channelrhodopsins",
                "Claudin-1",
                "Claudin-5",
                "Claudins",
                "Connexin 30",
                "Connexin 43",
                "Connexins",
                "Dopamine Receptors",
                "Electron Transport Complex I",
                "Electron Transport Complex IV",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "Glucose Transporter Type 1",
                "Halorhodopsins",
                "Histamine H2 Receptors",
                "Histamine Receptors",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Kv1.1 Potassium Channel",
                "NAV1.1 Voltage-Gated Sodium Channel",
                "NAV1.2 Voltage-Gated Sodium Channel",
                "Neuropeptide Receptors",
                "Nicotinic Receptors",
                "Occludin",
                "Plasma Membrane Calcium-Transporting ATPases",
                "Rhodopsin",
                "Serotonin Receptors",
                "Sodium-Glucose Transporter 1",
                "Sodium-Potassium-Exchanging ATPase",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Voltage-Gated Potassium Channels",
                "beta-1 Adrenergic Receptors",
                "beta-Arrestin 1"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Sodium-Potassium Pump (Na+/K+ ATPase)",
            "Lipid Bilayer Protein (LBP)",
            "Ion Channel Protein (ICP)",
            "Integrin (ITG)",
            "G-Protein Coupled Receptor (GPCR)",
            "Aquaporin (AQP)",
            "Caveolin (CAV)",
            "Clathrin (CLT)",
            "Transferrin Receptor (TfR)",
            "Glucose Transporter (GLUT)",
            "Nicotinic Acetylcholine Receptor (nAChR)",
            "Voltage-Gated Sodium Channel (Nav)",
            "Lipid Raft Protein (LRP)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Tetraspanin (TSPAN)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Dipeptidyl Peptidase IV (DPPIV)",
            "P-glycoprotein (P-gp)",
            "CD4 Protein (CD4)",
            "Sodium-Glucose Transporter (SGLT)",
            "Insulin Receptor (INSR)",
            "Neurotransmitter Transporter (NTT)",
            "Vesicular Transport Protein (VTP)",
            "Permease (PERM)",
            "Translocase of the Outer Membrane (TOM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "G-Protein Coupled Receptor (GPCR)",
                "Aquaporin (AQP)",
                "Caveolin (CAV)",
                "Clathrin (CLT)",
                "Transferrin Receptor (TfR)",
                "Glucose Transporter (GLUT)",
                "Nicotinic Acetylcholine Receptor (nAChR)",
                "Voltage-Gated Sodium Channel (Nav)",
                "Tetraspanin (TSPAN)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "CD4 Protein (CD4)",
                "Sodium-Glucose Transporter (SGLT)",
                "Insulin Receptor (INSR)",
                "Neurotransmitter Transporter (NTT)",
                "Vesicular Transport Protein (VTP)"
            ],
            "mismatches": [
                "Sodium-Potassium Pump (Na+/K+ ATPase)",
                "Lipid Bilayer Protein (LBP)",
                "Ion Channel Protein (ICP)",
                "Lipid Raft Protein (LRP)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "Dipeptidyl Peptidase IV (DPPIV)",
                "P-glycoprotein (P-gp)",
                "Permease (PERM)",
                "Translocase of the Outer Membrane (TOM)"
            ],
            "true_referents": [
                "ATP Binding Cassette Transporter 1",
                "Aquaporin 1",
                "Aquaporins",
                "Bacterial Transferrin Receptor Complex",
                "CD4 Antigens",
                "CD4 Immunoadhesins",
                "Caveolin 1",
                "Caveolin 2",
                "Caveolins",
                "Clathrin",
                "Clathrin Heavy Chains",
                "Clathrin Light Chains",
                "Cystic Fibrosis Transmembrane Conductance Regulator",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "Glucagon-Like Peptide-2 Receptor",
                "Glucose Transporter Type 1",
                "Glucose Transporter Type 5",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin beta1",
                "Integrin beta3",
                "Integrins",
                "Ion Channels",
                "LDL-Receptor Related Protein-Associated Protein",
                "Lipid-Linked Proteins",
                "Low Density Lipoprotein Receptor-Related Protein-1",
                "Low Density Lipoprotein Receptor-Related Protein-5",
                "Member 1 Subfamily G ATP Binding Cassette Transporter",
                "Myelin and Lymphocyte-Associated Proteolipid Proteins",
                "NAV1.1 Voltage-Gated Sodium Channel",
                "NAV1.2 Voltage-Gated Sodium Channel",
                "Neuropeptide Receptors",
                "Neurotransmitter Transport Proteins",
                "Nicotinic Receptors",
                "Organic Cation Transport Proteins",
                "Phospholipid Transfer Proteins",
                "Plasma Membrane Neurotransmitter Transport Proteins",
                "Potassium Channels",
                "Sodium-Glucose Transporter 1",
                "Sodium-Independent Organic Anion Transporters",
                "Sodium-Potassium-Exchanging ATPase",
                "Tetraspanin 24",
                "Tetraspanin 25",
                "Tetraspanins",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Vesicular Neurotransmitter Transport Proteins",
                "Vesicular Transport Adaptor Proteins",
                "Vesicular Transport Proteins",
                "beta-Arrestin 1"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Insulin Receptor (IR)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "G Protein-Coupled Receptors (GPCRs)",
            "Glucose Transporter Type 4 (GLUT4)",
            "Voltage-Gated Sodium Channels (Nav)",
            "Voltage-Gated Potassium Channels (Kv)",
            "Voltage-Gated Calcium Channels (Cav)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Vesicular Monoamine Transporter 2 (VMAT2)",
            "N-methyl-D-aspartate Receptor (NMDAR)",
            "Alpha-amino-3-hydroxy-5-methyl-4-isoxazolepropionic Acid Receptor (AMPAR)",
            "Adenosine Triphosphate Synthase (ATP Synthase)",
            "Translocator Protein (TSPO)",
            "Nicotinic Acetylcholine Receptor (nAChR)",
            "Muscarinic Acetylcholine Receptor (mAChR)",
            "Gamma-aminobutyric Acid Receptor (GABA Receptor)",
            "Serotonin Receptor (5-HT Receptor)",
            "Dopamine Receptor (D Receptor)",
            "Adrenergic Receptor (AR)",
            "Opioid Receptor (OR)",
            "Endothelin Receptor (ETR)",
            "Angiotensin II Receptor (ATR)",
            "Prostaglandin E2 Receptor (EP)",
            "Leukotriene B4 Receptor (BLT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin Receptor",
                "Glucose Transporter Type 4",
                "Voltage-Gated Sodium Channels",
                "Voltage-Gated Potassium Channels",
                "Cystic Fibrosis Transmembrane Conductance Regulator",
                "N-Methyl-D-Aspartate Receptors",
                "AMPA Receptors",
                "Nicotinic Receptors",
                "Muscarinic Receptors",
                "GABA-A Receptors",
                "Dopamine Receptors",
                "Adrenergic Receptors",
                "Opioid Receptors",
                "Endothelin Receptors",
                "Angiotensin Receptors",
                "Prostaglandin E Receptors",
                "Leukotriene B4 Receptors"
            ],
            "mismatches": [
                "Epidermal Growth Factor Receptor (EGFR)",
                "G Protein-Coupled Receptors (GPCRs)",
                "Voltage-Gated Calcium Channels (Cav)",
                "Vesicular Monoamine Transporter 2 (VMAT2)",
                "Adenosine Triphosphate Synthase (ATP Synthase)",
                "Translocator Protein (TSPO)",
                "Serotonin Receptor (5-HT Receptor)"
            ],
            "true_referents": [
                "5-HT1D Serotonin Receptor",
                "AMPA Receptors",
                "Adenine Nucleotide Translocator 1",
                "Adrenergic Receptors",
                "Angiotensin Receptors",
                "Calcium Channels",
                "Cystic Fibrosis Transmembrane Conductance Regulator",
                "Dopamine Receptors",
                "EP1 Subtype Prostaglandin E Receptors",
                "EP2 Subtype Prostaglandin E Receptors",
                "Eicosanoid Receptors",
                "Endothelin A Receptor",
                "Endothelin Receptors",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "GABA-A Receptors",
                "Glucose Transporter Type 1",
                "Glucose Transporter Type 4",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Kv1.1 Potassium Channel",
                "Leukotriene B4 Receptors",
                "Leukotriene Receptors",
                "Mitochondrial Proton-Translocating ATPases",
                "Muscarinic M4 Receptor",
                "Muscarinic Receptors",
                "N-Methyl-D-Aspartate Receptors",
                "NAV1.1 Voltage-Gated Sodium Channel",
                "Neuropeptide Receptors",
                "Nicotinic Receptors",
                "Opioid Receptors",
                "P-Type Calcium Channels",
                "Prostaglandin E Receptors",
                "Proton Pumps",
                "Type 2 Angiotensin Receptor",
                "Vesicular Glutamate Transport Protein 2",
                "Vesicular Monoamine Transport Proteins",
                "Voltage-Gated Potassium Channels",
                "Voltage-Gated Sodium Channels"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "G protein-coupled receptor (GPCR)",
            "ATP synthase",
            "Na+/K+ ATPase",
            "Sodium channel",
            "Potassium channel",
            "Calcium channel",
            "Aquaporin",
            "NADH dehydrogenase",
            "Cytochrome c oxidase",
            "Adenylate cyclase",
            "Phospholipase C",
            "Glycophorin",
            "Integrin",
            "Cadherin",
            "Toll-like receptor",
            "Insulin receptor",
            "Epidermal growth factor receptor (EGFR)",
            "Glucose transporter",
            "Sodium-glucose cotransporter",
            "Chloride channel",
            "Protein kinase C",
            "Protein kinase A",
            "Adenosine triphosphatase (ATPase)",
            "Proton pump"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "G protein-coupled receptor (GPCR)",
                "Na+/K+ ATPase",
                "Sodium channel",
                "Potassium channel",
                "Calcium channel",
                "Aquaporin",
                "Integrin",
                "Cadherin",
                "Toll-like receptor",
                "Insulin receptor",
                "Glucose transporter",
                "Sodium-glucose cotransporter",
                "Chloride channel",
                "Proton pump"
            ],
            "mismatches": [
                "ATP synthase",
                "NADH dehydrogenase",
                "Cytochrome c oxidase",
                "Adenylate cyclase",
                "Phospholipase C",
                "Glycophorin",
                "Epidermal growth factor receptor (EGFR)",
                "Protein kinase C",
                "Protein kinase A",
                "Adenosine triphosphatase (ATPase)"
            ],
            "true_referents": [
                "Aquaporin 1",
                "Aquaporins",
                "CLC-2 Chloride Channels",
                "Cadherin Related Proteins",
                "Cadherins",
                "Calcium Channels",
                "Chloride Channels",
                "Class III Phosphatidylinositol 3-Kinases",
                "Clathrin",
                "Claudin-1",
                "Cyclic AMP Receptors",
                "Cyclophilin C",
                "Dual Oxidases",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "Glucose Transporter Type 1",
                "Glucose Transporter Type 5",
                "H(+)-K(+)-Exchanging ATPase",
                "Hyperpolarization-Activated Cyclic Nucleotide-Gated Channels",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Ion Channels",
                "Ion Pumps",
                "Membrane Glycoproteins",
                "Mitochondrial Proton-Translocating ATPases",
                "NADPH Oxidase 1",
                "Neuropeptide Receptors",
                "P-Type Calcium Channels",
                "P-type ATPases",
                "Phospholipase A2 Receptors",
                "Phospholipid Transfer Proteins",
                "Potassium Channels",
                "Proton Pumps",
                "Sarcoglycans",
                "Sodium Channels",
                "Sodium-Glucose Transporter 1",
                "Sodium-Potassium-Exchanging ATPase",
                "Succinate Cytochrome c Oxidoreductase",
                "Succinate Dehydrogenase",
                "Toll-Like Receptor 1",
                "Toll-Like Receptor 3",
                "Toll-Like Receptors",
                "beta-Arrestin 1",
                "trkA Receptor",
                "trkC Receptor"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Aquaporin 1 (AQP1)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Sodium-Potassium Pump (Na+/K+ ATPase)",
            "Rhodopsin",
            "Insulin Receptor (IR)",
            "Integrin \u03b1V\u03b23",
            "Clathrin",
            "Caveolin-1 (CAV1)",
            "SNARE Protein",
            "Flotillin-1",
            "Transferrin Receptor (TfR)",
            "Low-Density Lipoprotein Receptor (LDLR)",
            "Connexin 43 (Cx43)",
            "Phospholipase C (PLC)",
            "Dynamin",
            "Rab5",
            "Tetraspanin-4 (TSPAN4)",
            "\u03b2-Catenin",
            "Cytochrome c Oxidase",
            "ATP Synthase",
            "Ras Protein (H-Ras)",
            "Bcl-2",
            "Phospholemman",
            "P4-ATPase (Flippase)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aquaporin 1",
                "Rhodopsin",
                "Insulin Receptor",
                "Integrin alphaVbeta3",
                "Clathrin",
                "Caveolin 1",
                "SNARE Proteins",
                "Transferrin Receptors",
                "Connexin 43",
                "Dynamins"
            ],
            "mismatches": [
                "Epidermal Growth Factor Receptor (EGFR)",
                "Sodium-Potassium Pump (Na+/K+ ATPase)",
                "Flotillin-1",
                "Phospholipase C (PLC)",
                "Rab5",
                "Tetraspanin-4 (TSPAN4)",
                "\u03b2-Catenin",
                "Cytochrome c Oxidase",
                "ATP Synthase",
                "Ras Protein (H-Ras)",
                "Bcl-2",
                "Phospholemman",
                "P4-ATPase (Flippase)"
            ],
            "true_referents": [
                "Aquaporin 1",
                "Aquaporins",
                "Bacterial Transferrin Receptor Complex",
                "Bcl-2-Like Protein 11",
                "Caveolin 1",
                "Caveolin 2",
                "Caveolin 3",
                "Cellular Apoptosis Susceptibility Protein",
                "Channelrhodopsins",
                "Chloride Channels",
                "Clathrin",
                "Clathrin Heavy Chains",
                "Clathrin Light Chains",
                "Claudin-1",
                "Connexin 26",
                "Connexin 43",
                "Connexins",
                "Dual Oxidases",
                "Dynamin I",
                "Dynamin II",
                "Dynamins",
                "Ephrin-A5",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "Halorhodopsins",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin alphaVbeta3",
                "Integrin beta3",
                "LDL Receptors",
                "LDL-Receptor Related Proteins",
                "Low Density Lipoprotein Receptor-Related Protein-1",
                "Mitochondrial Proton-Translocating ATPases",
                "NADPH Oxidase 1",
                "NADPH Oxidase 2",
                "Neuropilin-1",
                "P-type ATPases",
                "Phospholipase A2 Receptors",
                "Phospholipid Transfer Proteins",
                "Proto-Oncogene Mas",
                "Proto-Oncogene Proteins c-kit",
                "Proton Pumps",
                "R-SNARE Proteins",
                "Rabphilin-3A",
                "Rhodopsin",
                "SNARE Proteins",
                "Sodium-Potassium-Exchanging ATPase",
                "Succinate Cytochrome c Oxidoreductase",
                "Tetraspanin 24",
                "Tetraspanin 25",
                "Tetraspanins",
                "Thrombospondin 1",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Transforming Growth Factor-beta Type I Receptor",
                "Vacuolar Proton-Translocating ATPases",
                "Wnt Receptors"
            ],
            "TP": 10,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Sodium-potassium pump (Na+/K+-ATPase)",
            "Glucose transporter 4 (GLUT4)",
            "Insulin receptor",
            "Epidermal growth factor receptor (EGFR)",
            "Voltage-gated sodium channel",
            "G protein-coupled receptor (GPCR)",
            "Aquaporin",
            "ATP-binding cassette transporter (ABC transporter)",
            "Sarcoplasmic/endoplasmic reticulum calcium ATPase (SERCA)",
            "Proton pump (H+-ATPase)",
            "Cystic fibrosis transmembrane conductance regulator (CFTR)",
            "Inositol 1,4,5-trisphosphate receptor (IP3R)",
            "Ryanodine receptor (RyR)",
            "Connexin",
            "Integrin",
            "Transferrin receptor",
            "Acetylcholine receptor",
            "GABA receptor",
            "Glycine receptor",
            "Toll-like receptor (TLR)",
            "Major histocompatibility complex (MHC)",
            "Cytochrome c oxidase",
            "Bacteriorhodopsin",
            "Photosystem II"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium-potassium pump (Na+/K+-ATPase)",
                "Glucose transporter 4 (GLUT4)",
                "Insulin receptor",
                "Voltage-gated sodium channel",
                "G protein-coupled receptor (GPCR)",
                "Aquaporin",
                "ATP-binding cassette transporter (ABC transporter)",
                "Sarcoplasmic/endoplasmic reticulum calcium ATPase (SERCA)",
                "Proton pump (H+-ATPase)",
                "Cystic fibrosis transmembrane conductance regulator (CFTR)",
                "Inositol 1,4,5-trisphosphate receptor (IP3R)",
                "Ryanodine receptor (RyR)",
                "Connexin",
                "Integrin",
                "Transferrin receptor",
                "Glycine receptor",
                "Toll-like receptor (TLR)",
                "Bacteriorhodopsin",
                "Photosystem II"
            ],
            "mismatches": [
                "Epidermal growth factor receptor (EGFR)",
                "Acetylcholine receptor",
                "GABA receptor",
                "Major histocompatibility complex (MHC)",
                "Cytochrome c oxidase"
            ],
            "true_referents": [
                "ATP Binding Cassette Transporter 1",
                "Aquaporin 1",
                "Aquaporins",
                "Bacterial Transferrin Receptor Complex",
                "Bacteriorhodopsins",
                "Calcium-Transporting ATPases",
                "Cholinergic Receptors",
                "Class III Phosphatidylinositol 3-Kinases",
                "Connexin 30",
                "Connexin 43",
                "Connexins",
                "Cystic Fibrosis Transmembrane Conductance Regulator",
                "Dual Oxidases",
                "Electron Transport Complex II",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "GABA Receptors",
                "GABA-A Receptors",
                "Glucose Transporter Type 1",
                "Glucose Transporter Type 4",
                "Glycine Receptors",
                "H(+)-K(+)-Exchanging ATPase",
                "HLA-B7 Antigen",
                "Halorhodopsins",
                "Histocompatibility Antigens Class I",
                "Histocompatibility Antigens Class II",
                "IGF Type 1 Receptor",
                "Inositol 1,4,5-Trisphosphate Receptors",
                "Insulin Receptor",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Member 1 Subfamily B ATP Binding Cassette Transporter",
                "NADPH Oxidase 1",
                "NAV1.1 Voltage-Gated Sodium Channel",
                "Neuropeptide Receptors",
                "Nicotinic Receptors",
                "Photosystem II Protein Complex",
                "Proton Pumps",
                "R-Type Calcium Channels",
                "Rhodopsin",
                "Ryanodine Receptor Calcium Release Channel",
                "Sarcoplasmic Reticulum Calcium-Transporting ATPases",
                "Sodium-Potassium-Exchanging ATPase",
                "Succinate Cytochrome c Oxidoreductase",
                "Toll-Like Receptor 1",
                "Toll-Like Receptor 3",
                "Toll-Like Receptors",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Voltage-Gated Sodium Channels",
                "beta-Arrestin 1"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Receptor tyrosine kinases (RTKs)",
            "G protein-coupled receptors (GPCRs)",
            "Ion channels",
            "Integrins",
            "Cadherins",
            "Selectins",
            "Occludins",
            "Connexins",
            "Aquaporins",
            "Niemann-Pick C1 (NPC1)",
            "Scavenger receptor class B type 1 (SR-B1)",
            "ATP-binding cassette (ABC) transporters",
            "Solute carrier (SLC) transporters",
            "Transient receptor potential (TRP) channels",
            "Voltage-gated calcium channels (VGCCs)",
            "Voltage-gated sodium channels (VGSCs)",
            "Voltage-gated potassium channels (VGKCs)",
            "Chloride intracellular channels (CLICs)",
            "Synaptotagmins",
            "Synaptophysins",
            "Vesicle-associated membrane proteins (VAMPs)",
            "Syntaxins",
            "Synaptosome-associated protein (SNAP) receptors (SNAREs)",
            "Mannose-6-phosphate receptors (MPRs)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "G protein-coupled receptors (GPCRs)",
                "Ion channels",
                "Integrins",
                "Cadherins",
                "Selectins",
                "Connexins",
                "Aquaporins",
                "ATP-binding cassette (ABC) transporters",
                "Solute carrier (SLC) transporters",
                "Transient receptor potential (TRP) channels",
                "Voltage-gated sodium channels (VGSCs)",
                "Voltage-gated potassium channels (VGKCs)",
                "Synaptotagmins",
                "Synaptophysins",
                "Vesicle-associated membrane proteins (VAMPs)",
                "Syntaxins",
                "SNAREs"
            ],
            "mismatches": [
                "Receptor tyrosine kinases (RTKs)",
                "Occludins",
                "Niemann-Pick C1 (NPC1)",
                "Scavenger receptor class B type 1 (SR-B1)",
                "Voltage-gated calcium channels (VGCCs)",
                "Chloride intracellular channels (CLICs)",
                "Mannose-6-phosphate receptors (MPRs)"
            ],
            "true_referents": [
                "ATP Binding Cassette Transporter 1",
                "ATP-Binding Cassette Transporters",
                "Aquaporin 1",
                "Aquaporins",
                "CLC-2 Chloride Channels",
                "Cadherin Related Proteins",
                "Cadherins",
                "Calcium Channels",
                "Chloride Channels",
                "Class A Scavenger Receptors",
                "Class B Scavenger Receptors",
                "Claudins",
                "Connexin 26",
                "Connexin 43",
                "Connexins",
                "Desmosomal Cadherins",
                "E-Selectin",
                "G-Protein-Coupled Receptors",
                "Growth Factor Receptors",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Ion Channels",
                "L-Selectin",
                "Lipopolysaccharide Receptors",
                "Mannose Receptor",
                "NAV1.1 Voltage-Gated Sodium Channel",
                "Neuropeptide Receptors",
                "Niemann-Pick C1 Protein",
                "Occludin",
                "Potassium Channels",
                "R-SNARE Proteins",
                "Receptor Protein-Tyrosine Kinases",
                "Receptor Tyrosine Kinase-like Orphan Receptors",
                "SNARE Proteins",
                "Selectins",
                "Solute Carrier Family 12",
                "Solute Carrier Proteins",
                "Synaptogyrins",
                "Synaptophysin",
                "Synaptotagmin I",
                "Synaptotagmin II",
                "Synaptotagmins",
                "Syntaxin 1",
                "Syntaxin 16",
                "TRPA1 Cation Channel",
                "TRPC6 Cation Channel",
                "Transient Receptor Potential Channels",
                "Vesicle-Associated Membrane Protein 1",
                "Vesicle-Associated Membrane Protein 3",
                "Voltage-Gated Potassium Channels",
                "Voltage-Gated Sodium Channels"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Aquaporin (AQP)",
            "Integrin",
            "Cadherin",
            "Selectin",
            "Immunoglobulin",
            "Receptor tyrosine kinase",
            "G protein-coupled receptor (GPCR)",
            "Ion channel",
            "Transporter protein",
            "Connexin",
            "Flotillin",
            "Caveolin",
            "Clathrin",
            "Coatomer",
            "Syntaxin",
            "SNARE protein",
            "Rab protein",
            "Kinesin",
            "Dynein",
            "Myosin",
            "Actin",
            "Spectrin",
            "Ankyrin",
            "Band 3 protein"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aquaporin",
                "Integrin",
                "Cadherin",
                "Selectin",
                "Receptor tyrosine kinase",
                "G protein-coupled receptor (GPCR)",
                "Ion channel",
                "Connexin",
                "Caveolin",
                "Clathrin",
                "Coatomer",
                "Syntaxin",
                "SNARE protein",
                "Spectrin",
                "Ankyrin"
            ],
            "mismatches": [
                "Immunoglobulin",
                "Transporter protein",
                "Flotillin",
                "Rab protein",
                "Kinesin",
                "Dynein",
                "Myosin",
                "Actin",
                "Band 3 protein"
            ],
            "true_referents": [
                "Anion Transport Proteins",
                "Ankyrins",
                "Anoctamin-1",
                "Aquaporin 1",
                "Aquaporins",
                "Cadherin Related Proteins",
                "Cadherins",
                "Caveolin 1",
                "Caveolin 3",
                "Caveolins",
                "Clathrin",
                "Clathrin Heavy Chains",
                "Clathrin Light Chains",
                "Claudin-1",
                "Coat Protein Complex I",
                "Coatomer Protein",
                "Colistin",
                "Connexin 30",
                "Connexin 43",
                "Connexins",
                "Dystroglycans",
                "Dystrophin",
                "E-Selectin",
                "Fibronectins",
                "G-Protein-Coupled Receptors",
                "Growth Factor Receptors",
                "IgG Receptors",
                "Immunologic Receptors",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Ion Channels",
                "L-Selectin",
                "Laminin",
                "Member 3 Subfamily B ATP Binding Cassette Transporter",
                "Membrane Transport Proteins",
                "Mesothelin",
                "Neuropeptide Receptors",
                "Neuropilin-1",
                "Neuropilin-2",
                "Occludin",
                "Potassium Channels",
                "R-SNARE Proteins",
                "Rabphilin-3A",
                "Receptor Protein-Tyrosine Kinases",
                "Receptor Tyrosine Kinase-like Orphan Receptors",
                "SNARE Proteins",
                "Selectins",
                "Solute Carrier Proteins",
                "Spectrin",
                "Surrogate Immunoglobulin Light Chains",
                "Syntaxin 1",
                "Syntaxin 16",
                "Tetraspanins",
                "beta-Arrestin 1",
                "ran GTP-Binding Protein"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Sodium-Potassium ATPase (Na+/K+ ATPase)",
            "Calcium ATPase (Ca2+ ATPase)",
            "Proton ATPase (H+ ATPase)",
            "Mitochondrial ATPase",
            "Chloroplast ATPase",
            "Vacuolar ATPase (V-ATPase)",
            "Sarcoplasmic Reticulum Calcium ATPase (SERCA)",
            "Plasma Membrane Calcium ATPase (PMCA)",
            "Gastric Proton Pump",
            "Rhodopsin",
            "Photosynthetic Reaction Center",
            "Cytochrome Oxidase",
            "Nicotinic Acetylcholine Receptor",
            "GABA Receptor",
            "Glutamate Receptor",
            "Dopamine Receptor",
            "Opioid Receptor",
            "Insulin Receptor",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Transferrin Receptor",
            "Toll-Like Receptor",
            "G Protein-Coupled Receptor (GPCR)",
            "Integrin",
            "Cadherin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin",
                "Photosynthetic Reaction Center Complex Proteins",
                "Nicotinic Receptors",
                "GABA Receptors",
                "Glutamate Receptors",
                "Dopamine Receptors",
                "Opioid Receptors",
                "Insulin Receptor",
                "Transferrin Receptors",
                "Toll-Like Receptors",
                "G-Protein-Coupled Receptors",
                "Integrins",
                "Cadherins"
            ],
            "mismatches": [
                "Sodium-Potassium ATPase (Na+/K+ ATPase)",
                "Calcium ATPase (Ca2+ ATPase)",
                "Proton ATPase (H+ ATPase)",
                "Mitochondrial ATPase",
                "Chloroplast ATPase",
                "Vacuolar ATPase (V-ATPase)",
                "Sarcoplasmic Reticulum Calcium ATPase (SERCA)",
                "Plasma Membrane Calcium ATPase (PMCA)",
                "Gastric Proton Pump",
                "Cytochrome Oxidase",
                "Epidermal Growth Factor Receptor (EGFR)"
            ],
            "true_referents": [
                "Bacterial Transferrin Receptor Complex",
                "Cadherin Related Proteins",
                "Cadherins",
                "Calcium-Transporting ATPases",
                "Channelrhodopsins",
                "Chloroplast Proton-Translocating ATPases",
                "Claudin-1",
                "Dopamine Receptors",
                "Dual Oxidases",
                "Electron Transport Complex I",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "GABA Receptors",
                "GABA-A Receptors",
                "Glutamate Receptors",
                "H(+)-K(+)-Exchanging ATPase",
                "Halorhodopsins",
                "IGF Type 1 Receptor",
                "Insulin Receptor",
                "Integrin alpha1",
                "Integrin beta1",
                "Integrins",
                "Mitochondrial Proton-Translocating ATPases",
                "N-Methyl-D-Aspartate Receptors",
                "Neuropeptide Receptors",
                "Nicotinic Receptors",
                "Opioid Receptors",
                "P-type ATPases",
                "Photosynthetic Reaction Center Complex Proteins",
                "Photosystem II Protein Complex",
                "Plasma Membrane Calcium-Transporting ATPases",
                "Plastoquinol-Plastocyanin Reductase",
                "Proton Pumps",
                "Proton-Phosphate Symporters",
                "Rhodopsin",
                "Sarcoplasmic Reticulum Calcium-Transporting ATPases",
                "Sodium-Potassium-Exchanging ATPase",
                "Succinate Cytochrome c Oxidoreductase",
                "Toll-Like Receptor 1",
                "Toll-Like Receptor 3",
                "Toll-Like Receptors",
                "Transferrin Receptors",
                "Transferrin-Binding Protein B",
                "Vacuolar Proton-Translocating ATPases",
                "beta-Arrestin 1"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Bacteriorhodopsin (BR)",
            "Opsin",
            "Rhodopsin",
            "Proteorhodopsin",
            "Sensory rhodopsin",
            "Arrestin",
            "Visual arrestin",
            "Retinal-binding protein",
            "Rhodopsin kinase",
            "Phosphodiesterase 6",
            "Transducin",
            "G-protein",
            "Phospholipase C",
            "G-protein coupled receptor",
            "7-transmembrane receptor",
            "G-protein coupled receptor kinase",
            "Adenylyl cyclase",
            "Phosphatidylinositol-specific phospholipase C",
            "Phosphatidylinositol 4,5-bisphosphate",
            "Phosphatidylinositol 3,4,5-trisphosphate",
            "Phospholipase D",
            "Phosphatidylinositol 3-phosphate",
            "Phosphatidylinositol 4-phosphate",
            "Phosphatidylinositol 5-phosphate",
            "Phosphatidylinositol 3,5-bisphosphate",
            "Phosphatidylinositol 4,5-bisphosphate 3-kinase"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rhodopsin",
                "Arrestin",
                "Transducin"
            ],
            "mismatches": [
                "Bacteriorhodopsin (BR)",
                "Opsin",
                "Proteorhodopsin",
                "Sensory rhodopsin",
                "Visual arrestin",
                "Retinal-binding protein",
                "Rhodopsin kinase",
                "Phosphodiesterase 6",
                "G-protein",
                "Phospholipase C",
                "G-protein coupled receptor",
                "7-transmembrane receptor",
                "G-protein coupled receptor kinase",
                "Adenylyl cyclase",
                "Phosphatidylinositol-specific phospholipase C",
                "Phosphatidylinositol 4,5-bisphosphate",
                "Phosphatidylinositol 3,4,5-trisphosphate",
                "Phospholipase D",
                "Phosphatidylinositol 3-phosphate",
                "Phosphatidylinositol 4-phosphate",
                "Phosphatidylinositol 5-phosphate",
                "Phosphatidylinositol 3,5-bisphosphate",
                "Phosphatidylinositol 4,5-bisphosphate 3-kinase"
            ],
            "true_referents": [
                "5-HT1D Serotonin Receptor",
                "Arrestin",
                "Arrestins",
                "Bacteriorhodopsins",
                "Channelrhodopsins",
                "Chlorophyll Binding Proteins",
                "Class III Phosphatidylinositol 3-Kinases",
                "Cyclic AMP Receptors",
                "Cyclic Nucleotide-Gated Cation Channels",
                "Cyclophilin C",
                "G Protein-Coupled Inwardly-Rectifying Potassium Channels",
                "G-Protein-Coupled Receptors",
                "Halorhodopsins",
                "Inositol 1,4,5-Trisphosphate Receptors",
                "Ion Channels",
                "Lysophosphatidic Acid Receptors",
                "Neuropeptide Receptors",
                "Phospholipase A2 Receptors",
                "Phospholipid Transfer Proteins",
                "Rhodopsin",
                "Sphingosine-1-Phosphate Receptors",
                "Transducin",
                "alpha7 Nicotinic Acetylcholine Receptor",
                "beta-Arrestin 1",
                "beta-Arrestins",
                "trkA Receptor"
            ],
            "TP": 3,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "membrane protein",
        "domain": "biology",
        "response": [
            "Adenosine receptor A2a (A2aR)",
            "Aquaporin 1 (AQP1)",
            "Band 3 anion transport protein (SLC4A1)",
            "Beta-1 adrenergic receptor (ADRB1)",
            "Calcitonin receptor (CALCR)",
            "Caveolin 1 (CAV1)",
            "CD4 glycoprotein (CD4)",
            "CD44 antigen (CD44)",
            "Cystic fibrosis transmembrane conductance regulator (CFTR)",
            "Dopamine receptor D1 (DRD1)",
            "Epidermal growth factor receptor (EGFR)",
            "Fibroblast growth factor receptor 1 (FGFR1)",
            "G protein-coupled receptor 120 (GPR120)",
            "Glycophorin A (GYPA)",
            "Insulin receptor (INSR)",
            "Insulin-like growth factor 1 receptor (IGF1R)",
            "Integrin alpha-5 beta-1 (ITGA5/ITGB1)",
            "Low-density lipoprotein receptor (LDLR)",
            "Muscarinic acetylcholine receptor M1 (CHRM1)",
            "N-methyl-D-aspartate receptor (GRIN1)",
            "Platelet-derived growth factor receptor beta (PDGFRB)",
            "Rhodopsin (RHO)",
            "Serotonin receptor 1A (HTR1A)",
            "Sodium-potassium-chloride cotransporter 1 (SLC12A2)",
            "T-cell surface glycoprotein CD3 epsilon chain (CD3E)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adenosine receptor A2a (A2aR)",
                "Aquaporin 1 (AQP1)",
                "Beta-1 adrenergic receptor (ADRB1)",
                "Calcitonin receptor (CALCR)",
                "Caveolin 1 (CAV1)",
                "Cystic fibrosis transmembrane conductance regulator (CFTR)",
                "Dopamine receptor D1 (DRD1)",
                "Insulin receptor (INSR)",
                "Insulin-like growth factor 1 receptor (IGF1R)",
                "Integrin alpha-5 beta-1 (ITGA5/ITGB1)",
                "Low-density lipoprotein receptor (LDLR)",
                "Muscarinic acetylcholine receptor M1 (CHRM1)",
                "N-methyl-D-aspartate receptor (GRIN1)",
                "Platelet-derived growth factor receptor beta (PDGFRB)",
                "Rhodopsin (RHO)",
                "Serotonin receptor 1A (HTR1A)"
            ],
            "mismatches": [
                "Band 3 anion transport protein (SLC4A1)",
                "CD4 glycoprotein (CD4)",
                "CD44 antigen (CD44)",
                "Epidermal growth factor receptor (EGFR)",
                "Fibroblast growth factor receptor 1 (FGFR1)",
                "G protein-coupled receptor 120 (GPR120)",
                "Glycophorin A (GYPA)",
                "Sodium-potassium-chloride cotransporter 1 (SLC12A2)",
                "T-cell surface glycoprotein CD3 epsilon chain (CD3E)"
            ],
            "true_referents": [
                "5-HT1A Serotonin Receptor",
                "Adenosine A2 Receptors",
                "Adenosine A2A Receptor",
                "Aquaporin 1",
                "Aquaporins",
                "CD24 Antigen",
                "CD4 Antigens",
                "CD4 Immunoadhesins",
                "Calcitonin Receptor-Like Protein",
                "Calcitonin Receptors",
                "Caveolin 1",
                "Caveolin 2",
                "Caveolin 3",
                "Channelrhodopsins",
                "Cystic Fibrosis Transmembrane Conductance Regulator",
                "Dopamine D1 Receptors",
                "ErbB-2 Receptor",
                "ErbB-4 Receptor",
                "G-Protein-Coupled Receptors",
                "Glucagon-Like Peptide-1 Receptor",
                "HLA-B44 Antigen",
                "IGF Type 1 Receptor",
                "IGF Type 2 Receptor",
                "Insulin Receptor",
                "Integrin alpha5",
                "Integrin alpha5beta1",
                "K Cl- Cotransporters",
                "LDL Receptors",
                "LDL-Receptor Related Proteins",
                "Low Density Lipoprotein Receptor-Related Protein-1",
                "Membrane Glycoproteins",
                "Muscarinic M1 Receptor",
                "Muscarinic M4 Receptor",
                "N-Methyl-D-Aspartate Receptors",
                "Platelet-Derived Growth Factor Receptors",
                "Platelet-Derived Growth Factor beta Receptor",
                "Rhodopsin",
                "SLC4A Proteins",
                "Sarcoglycans",
                "Sodium-Potassium-Chloride Symporters",
                "Type 1 Fibroblast Growth Factor Receptor",
                "Type 5 Fibroblast Growth Factor Receptor",
                "beta-1 Adrenergic Receptors",
                "beta-Arrestin 1"
            ],
            "TP": 16,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "membrane protein",
        "domain": "biology",
        "response": "{\n    \"Referent\": \"Keratin\",\n    \"Canonical name\": \"Keratin\"\n},\n{\n    \"Referent\": \"Myelin\",\n    \"Canonical name\": \"Myelin\"\n}",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]