[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "IRE1 (ERN1)",
            "PERK (EIF2AK3)",
            "ATF6",
            "BiP (HSPA5)",
            "DDIT3 (CHOP)",
            "ERdj5 (DNAJB9)",
            "ERp72 (PDIA6)",
            "GRP170 (HSPA5)",
            "HYOU1 (ERN2)",
            "IRE1 (ERN1) Activated Form",
            "PERK (EIF2AK3) Activated Form",
            "ATF6 Activated Form",
            "Bip (HSPA5) Bound to IRE1",
            "DDIT3 (CHOP) Transcription Factor",
            "ERdj5 (DNAJB9) Chaperone",
            "ERp72 (PDIA6) Chaperone",
            "GRP170 (HSPA5) Chaperone",
            "HYOU1 (ERN2) Stress Granule",
            "IRE1 (ERN1) Endonuclease Active Form",
            "PERK (EIF2AK3) Kinase Active Form",
            "ATF6 Nucleus Translocated Form",
            "BiP (HSPA5) Free Form",
            "DDIT3 (CHOP) Phosphorylated Form"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "IRE1 (ERN1)",
                "PERK (EIF2AK3)",
                "ATF6",
                "BiP (HSPA5)",
                "DDIT3 (CHOP)",
                "ERdj5 (DNAJB9)",
                "ERp72 (PDIA6)",
                "GRP170 (HSPA5)",
                "HYOU1 (ERN2)",
                "IRE1 (ERN1) Activated Form",
                "PERK (EIF2AK3) Activated Form",
                "ATF6 Activated Form",
                "Bip (HSPA5) Bound to IRE1",
                "DDIT3 (CHOP) Transcription Factor",
                "ERdj5 (DNAJB9) Chaperone",
                "ERp72 (PDIA6) Chaperone",
                "GRP170 (HSPA5) Chaperone",
                "HYOU1 (ERN2) Stress Granule",
                "IRE1 (ERN1) Endonuclease Active Form",
                "PERK (EIF2AK3) Kinase Active Form",
                "ATF6 Nucleus Translocated Form",
                "BiP (HSPA5) Free Form",
                "DDIT3 (CHOP) Phosphorylated Form"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF6",
                "ATF6 Activated Form",
                "ATF6 Nucleus Translocated Form",
                "BiP (HSPA5)",
                "BiP (HSPA5) Free Form",
                "Bip (HSPA5) Bound to IRE1",
                "DDIT3 (CHOP)",
                "DDIT3 (CHOP) Phosphorylated Form",
                "DDIT3 (CHOP) Transcription Factor",
                "ERdj5 (DNAJB9)",
                "ERdj5 (DNAJB9) Chaperone",
                "ERp72 (PDIA6)",
                "ERp72 (PDIA6) Chaperone",
                "GRP170 (HSPA5)",
                "GRP170 (HSPA5) Chaperone",
                "HYOU1 (ERN2)",
                "HYOU1 (ERN2) Stress Granule",
                "IRE1 (ERN1)",
                "IRE1 (ERN1) Activated Form",
                "IRE1 (ERN1) Endonuclease Active Form",
                "PERK (EIF2AK3)",
                "PERK (EIF2AK3) Activated Form",
                "PERK (EIF2AK3) Kinase Active Form"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Inositol-Requiring Enzyme 1 (IRE1)",
            "Protein Kinase RNA-like Endoplasmic Reticulum Kinase (PERK)",
            "Activating Transcription Factor 6 (ATF6)",
            "BiP/GRP78 (Binding Immunoglobulin Protein / Glucose-Regulated Protein 78)",
            "Heme Regulated Inhibitor (HRI)",
            "DNA Damage Activated RNA Polymerase (DDA-RNAP)",
            "Eukaryotic Translation Initiation Factor 2 alpha (eIF2\u03b1)",
            "X-box Binding Protein 1 (XBP1)",
            "C/EBP Homologous Protein (CHOP)",
            "Spliced XBP1 (sXBP1)",
            "Unspliced XBP1 (uXBP1)",
            "ER Stress Sensor 1 (ERS1)",
            "ER Stress Sensor 2 (ERS2)",
            "Endoplasmic Reticulum Stress-Activated Protein Kinase (ERK)",
            "C-Jun N-terminal Kinase (JNK)",
            "p38 Mitogen-Activated Protein Kinase (p38 MAPK)",
            "IRE1\u03b1 (Inositol-Requiring Enzyme 1 alpha)",
            "IRE1\u03b2 (Inositol-Requiring Enzyme 1 beta)",
            "ATF4 (Activating Transcription Factor 4)",
            "GADD34 (Growth Arrest and DNA Damage-inducible protein 34)",
            "DNAJC3 (DnaJ Heat Shock Protein Family (Hsp40) Member C3)",
            "ERdj5 (ER DnaJ Homolog 5)",
            "EDEM1 (ER Degradation Enhancing Alpha-Mannosidase-like Protein 1)",
            "Herp (Homocysteine Inducible ER Protein)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Protein Kinase RNA-like Endoplasmic Reticulum Kinase (PERK)",
                "Activating Transcription Factor 6 (ATF6)",
                "BiP/GRP78 (Binding Immunoglobulin Protein / Glucose-Regulated Protein 78)",
                "Heme Regulated Inhibitor (HRI)",
                "DNA Damage Activated RNA Polymerase (DDA-RNAP)",
                "Eukaryotic Translation Initiation Factor 2 alpha (eIF2\u03b1)",
                "X-box Binding Protein 1 (XBP1)",
                "C/EBP Homologous Protein (CHOP)",
                "Spliced XBP1 (sXBP1)",
                "Unspliced XBP1 (uXBP1)",
                "ER Stress Sensor 1 (ERS1)",
                "ER Stress Sensor 2 (ERS2)",
                "Endoplasmic Reticulum Stress-Activated Protein Kinase (ERK)",
                "C-Jun N-terminal Kinase (JNK)",
                "p38 Mitogen-Activated Protein Kinase (p38 MAPK)",
                "IRE1\u03b1 (Inositol-Requiring Enzyme 1 alpha)",
                "IRE1\u03b2 (Inositol-Requiring Enzyme 1 beta)",
                "ATF4 (Activating Transcription Factor 4)",
                "GADD34 (Growth Arrest and DNA Damage-inducible protein 34)",
                "DNAJC3 (DnaJ Heat Shock Protein Family (Hsp40) Member C3)",
                "ERdj5 (ER DnaJ Homolog 5)",
                "EDEM1 (ER Degradation Enhancing Alpha-Mannosidase-like Protein 1)",
                "Herp (Homocysteine Inducible ER Protein)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF4 (Activating Transcription Factor 4)",
                "Activating Transcription Factor 6 (ATF6)",
                "BiP/GRP78 (Binding Immunoglobulin Protein / Glucose-Regulated Protein 78)",
                "C-Jun N-terminal Kinase (JNK)",
                "C/EBP Homologous Protein (CHOP)",
                "DNA Damage Activated RNA Polymerase (DDA-RNAP)",
                "DNAJC3 (DnaJ Heat Shock Protein Family (Hsp40) Member C3)",
                "EDEM1 (ER Degradation Enhancing Alpha-Mannosidase-like Protein 1)",
                "ER Stress Sensor 1 (ERS1)",
                "ER Stress Sensor 2 (ERS2)",
                "ERdj5 (ER DnaJ Homolog 5)",
                "Endoplasmic Reticulum Stress-Activated Protein Kinase (ERK)",
                "Eukaryotic Translation Initiation Factor 2 alpha (eIF2\u03b1)",
                "GADD34 (Growth Arrest and DNA Damage-inducible protein 34)",
                "Heme Regulated Inhibitor (HRI)",
                "Herp (Homocysteine Inducible ER Protein)",
                "IRE1\u03b1 (Inositol-Requiring Enzyme 1 alpha)",
                "IRE1\u03b2 (Inositol-Requiring Enzyme 1 beta)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Protein Kinase RNA-like Endoplasmic Reticulum Kinase (PERK)",
                "Spliced XBP1 (sXBP1)",
                "Unspliced XBP1 (uXBP1)",
                "X-box Binding Protein 1 (XBP1)",
                "p38 Mitogen-Activated Protein Kinase (p38 MAPK)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Binding immunoglobulin protein (BiP)",
            "Glucose-regulated protein 78 (GRP78)",
            "Heat shock protein 70 (HSP70)",
            "Heat shock protein 90 (HSP90)",
            "Calnexin",
            "Calreticulin",
            "Protein disulfide isomerase (PDI)",
            "Endoplasmic reticulum resident protein 57 (ERp57)",
            "Heat shock protein 47 (HSP47)",
            "Heat shock protein 60 (HSP60)",
            "Heat shock protein 110 (HSP110)",
            "Heat shock protein 27 (HSP27)",
            "Heat shock protein 70-1A (HSPA1A)",
            "Heat shock protein 70-1B (HSPA1B)",
            "Heat shock protein 70-2 (HSPA2)",
            "Heat shock protein 70-5 (HSPA5)",
            "Heat shock protein 70-8 (HSPA8)",
            "Heat shock protein 70-10 (HSPA10)",
            "Heat shock protein 70-12A (HSPA12A)",
            "Heat shock protein 70-12B (HSPA12B)",
            "Heat shock protein 70-14 (HSPA14)",
            "Heat shock protein 70-1L (HSPA1L)",
            "Heat shock protein 70-105 (HSPA105)",
            "Heat shock protein 70-11 (HSPA11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Binding immunoglobulin protein (BiP)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock protein 70 (HSP70)",
                "Heat shock protein 90 (HSP90)",
                "Calnexin",
                "Calreticulin",
                "Protein disulfide isomerase (PDI)",
                "Endoplasmic reticulum resident protein 57 (ERp57)",
                "Heat shock protein 47 (HSP47)",
                "Heat shock protein 60 (HSP60)",
                "Heat shock protein 110 (HSP110)",
                "Heat shock protein 27 (HSP27)",
                "Heat shock protein 70-1A (HSPA1A)",
                "Heat shock protein 70-1B (HSPA1B)",
                "Heat shock protein 70-2 (HSPA2)",
                "Heat shock protein 70-5 (HSPA5)",
                "Heat shock protein 70-8 (HSPA8)",
                "Heat shock protein 70-10 (HSPA10)",
                "Heat shock protein 70-12A (HSPA12A)",
                "Heat shock protein 70-12B (HSPA12B)",
                "Heat shock protein 70-14 (HSPA14)",
                "Heat shock protein 70-1L (HSPA1L)",
                "Heat shock protein 70-105 (HSPA105)",
                "Heat shock protein 70-11 (HSPA11)"
            ],
            "mismatches": [],
            "true_referents": [
                "Binding immunoglobulin protein (BiP)",
                "Calnexin",
                "Calreticulin",
                "Endoplasmic reticulum resident protein 57 (ERp57)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock protein 110 (HSP110)",
                "Heat shock protein 27 (HSP27)",
                "Heat shock protein 47 (HSP47)",
                "Heat shock protein 60 (HSP60)",
                "Heat shock protein 70 (HSP70)",
                "Heat shock protein 70-10 (HSPA10)",
                "Heat shock protein 70-105 (HSPA105)",
                "Heat shock protein 70-11 (HSPA11)",
                "Heat shock protein 70-12A (HSPA12A)",
                "Heat shock protein 70-12B (HSPA12B)",
                "Heat shock protein 70-14 (HSPA14)",
                "Heat shock protein 70-1A (HSPA1A)",
                "Heat shock protein 70-1B (HSPA1B)",
                "Heat shock protein 70-1L (HSPA1L)",
                "Heat shock protein 70-2 (HSPA2)",
                "Heat shock protein 70-5 (HSPA5)",
                "Heat shock protein 70-8 (HSPA8)",
                "Heat shock protein 90 (HSP90)",
                "Protein disulfide isomerase (PDI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "BiP/GRP78 (BiP)",
            "IRE1\u03b1 (IRE1)",
            "PERK (PERK)",
            "ATF6 (ATF6)",
            "XBP1s (XBP1)",
            "CHOP/GADD153 (CHOP)",
            "DDIT3 (DDIT3)",
            "HSP90 (HSP90)",
            "HSP70 (HSP70)",
            "HSP50 (BiP-like, HSP50)",
            "Protein disulfide isomerase (PDI)",
            "Calnexin (CNX)",
            "Calreticulin (CRT)",
            "ERp57 (ERp57)",
            "ORMDL3 (ORMDL3)",
            "Sigma-1 receptor (Sig-1R)",
            "G3BP1 (G3BP1)",
            "eIF2\u03b1 (eIF2\u03b1)",
            "SREBP2 (SREBP2)",
            "Max (MAX)",
            "Trib3 (Trib3)",
            "GRP170 (GRP170)",
            "Protein kinase RNA-like ER kinase (PKR-like ER kinase)",
            "Inositol-requiring enzyme 1 (IRE1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BiP/GRP78 (BiP)",
                "IRE1\u03b1 (IRE1)",
                "PERK (PERK)",
                "ATF6 (ATF6)",
                "XBP1s (XBP1)",
                "CHOP/GADD153 (CHOP)",
                "DDIT3 (DDIT3)",
                "HSP90 (HSP90)",
                "HSP70 (HSP70)",
                "HSP50 (BiP-like, HSP50)",
                "Protein disulfide isomerase (PDI)",
                "Calnexin (CNX)",
                "Calreticulin (CRT)",
                "ERp57 (ERp57)",
                "ORMDL3 (ORMDL3)",
                "Sigma-1 receptor (Sig-1R)",
                "G3BP1 (G3BP1)",
                "eIF2\u03b1 (eIF2\u03b1)",
                "SREBP2 (SREBP2)",
                "Max (MAX)",
                "Trib3 (Trib3)",
                "GRP170 (GRP170)",
                "Protein kinase RNA-like ER kinase (PKR-like ER kinase)",
                "Inositol-requiring enzyme 1 (IRE1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF6 (ATF6)",
                "BiP/GRP78 (BiP)",
                "CHOP/GADD153 (CHOP)",
                "Calnexin (CNX)",
                "Calreticulin (CRT)",
                "DDIT3 (DDIT3)",
                "ERp57 (ERp57)",
                "G3BP1 (G3BP1)",
                "GRP170 (GRP170)",
                "HSP50 (BiP-like, HSP50)",
                "HSP70 (HSP70)",
                "HSP90 (HSP90)",
                "IRE1\u03b1 (IRE1)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Max (MAX)",
                "ORMDL3 (ORMDL3)",
                "PERK (PERK)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase RNA-like ER kinase (PKR-like ER kinase)",
                "SREBP2 (SREBP2)",
                "Sigma-1 receptor (Sig-1R)",
                "Trib3 (Trib3)",
                "XBP1s (XBP1)",
                "eIF2\u03b1 (eIF2\u03b1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Binding immunoglobulin protein (BiP)",
            "Glucose-regulated protein 78 (GRP78)",
            "Heat shock protein family A member 5 (HSPA5)",
            "Activating transcription factor 6 (ATF6)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Protein kinase RNA-like ER kinase (PERK)",
            "C/EBP homologous protein (CHOP)",
            "X-box binding protein 1 (XBP1)",
            "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
            "Calreticulin",
            "Calnexin",
            "Derlin-1",
            "Derlin-2",
            "Derlin-3",
            "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "ER degradation-enhancing alpha-mannosidase-like protein 2 (EDEM2)",
            "ER degradation-enhancing alpha-mannosidase-like protein 3 (EDEM3)",
            "Sec61 translocon",
            "Protein disulfide isomerase (PDI)",
            "ER-localized DnaJ homolog (ERdj5)",
            "Unfolded protein response regulator (UPR regulator)",
            "Signal peptide peptidase (SPP)",
            "Oligosaccharyltransferase (OST)",
            "ER stress-induced caspase-4"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Binding immunoglobulin protein (BiP)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock protein family A member 5 (HSPA5)",
                "Activating transcription factor 6 (ATF6)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein kinase RNA-like ER kinase (PERK)",
                "C/EBP homologous protein (CHOP)",
                "X-box binding protein 1 (XBP1)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Calreticulin",
                "Calnexin",
                "Derlin-1",
                "Derlin-2",
                "Derlin-3",
                "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "ER degradation-enhancing alpha-mannosidase-like protein 2 (EDEM2)",
                "ER degradation-enhancing alpha-mannosidase-like protein 3 (EDEM3)",
                "Sec61 translocon",
                "Protein disulfide isomerase (PDI)",
                "ER-localized DnaJ homolog (ERdj5)",
                "Unfolded protein response regulator (UPR regulator)",
                "Signal peptide peptidase (SPP)",
                "Oligosaccharyltransferase (OST)",
                "ER stress-induced caspase-4"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 6 (ATF6)",
                "Binding immunoglobulin protein (BiP)",
                "C/EBP homologous protein (CHOP)",
                "Calnexin",
                "Calreticulin",
                "Derlin-1",
                "Derlin-2",
                "Derlin-3",
                "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "ER degradation-enhancing alpha-mannosidase-like protein 2 (EDEM2)",
                "ER degradation-enhancing alpha-mannosidase-like protein 3 (EDEM3)",
                "ER stress-induced caspase-4",
                "ER-localized DnaJ homolog (ERdj5)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock protein family A member 5 (HSPA5)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Oligosaccharyltransferase (OST)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase RNA-like ER kinase (PERK)",
                "Sec61 translocon",
                "Signal peptide peptidase (SPP)",
                "Unfolded protein response regulator (UPR regulator)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "BiP (Binding Immunoglobulin Protein)",
            "GRP78 (Glucose-Regulated Protein 78)",
            "HSPA5 (Heat Shock Protein Family A Member 5)",
            "HSP70 (Heat Shock Protein 70)",
            "XBP1 (X-Box Binding Protein 1)",
            "ATF6 (Activating Transcription Factor 6)",
            "IRE1 (Inositol-Requiring Enzyme 1)",
            "CHOP (C/EBP Homologous Protein)",
            "PERK (PKR-like Endoplasmic Reticulum Kinase)",
            "GADD153 (Growth Arrest and DNA Damage-inducible Protein 153)",
            "BIP (B-cell receptor-associated protein)",
            "PDI (Protein Disulfide Isomerase)",
            "EDEM1 (ER Degradation Enhancer, Mannosidase Alpha-like 1)",
            "SEL1L (SEL1L Endoplasmic Reticulum Protein)",
            "OSM (Oncostatin M)",
            "SDF-1 (Stromal Derived Factor 1)",
            "TAX1BP1 (Tax1-binding protein 1)",
            "FAM134B (Family With Sequence Similarity 134 Member B)",
            "HSP90 (Heat Shock Protein 90)",
            "HYOU1 (Hypoxia Up-Regulated 1)",
            "TRIB3 (Tribbles Homolog 3)",
            "CNP (C-type Natriuretic Peptide)",
            "C/EBP\u03b2 (CCAAT/enhancer-binding protein beta)",
            "SREBP1 (Sterol Regulatory Element-Binding Protein 1)",
            "HMGCR (3-Hydroxy-3-Methylglutaryl-CoA Reductase)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BiP (Binding Immunoglobulin Protein)",
                "GRP78 (Glucose-Regulated Protein 78)",
                "HSPA5 (Heat Shock Protein Family A Member 5)",
                "HSP70 (Heat Shock Protein 70)",
                "XBP1 (X-Box Binding Protein 1)",
                "ATF6 (Activating Transcription Factor 6)",
                "IRE1 (Inositol-Requiring Enzyme 1)",
                "CHOP (C/EBP Homologous Protein)",
                "PERK (PKR-like Endoplasmic Reticulum Kinase)",
                "GADD153 (Growth Arrest and DNA Damage-inducible Protein 153)",
                "BIP (B-cell receptor-associated protein)",
                "PDI (Protein Disulfide Isomerase)",
                "EDEM1 (ER Degradation Enhancer, Mannosidase Alpha-like 1)",
                "SEL1L (SEL1L Endoplasmic Reticulum Protein)",
                "OSM (Oncostatin M)",
                "SDF-1 (Stromal Derived Factor 1)",
                "TAX1BP1 (Tax1-binding protein 1)",
                "FAM134B (Family With Sequence Similarity 134 Member B)",
                "HSP90 (Heat Shock Protein 90)",
                "HYOU1 (Hypoxia Up-Regulated 1)",
                "TRIB3 (Tribbles Homolog 3)",
                "CNP (C-type Natriuretic Peptide)",
                "C/EBP\u03b2 (CCAAT/enhancer-binding protein beta)",
                "SREBP1 (Sterol Regulatory Element-Binding Protein 1)"
            ],
            "mismatches": [
                "HMGCR (3-Hydroxy-3-Methylglutaryl-CoA Reductase)"
            ],
            "true_referents": [
                "ATF6 (Activating Transcription Factor 6)",
                "BIP (B-cell receptor-associated protein)",
                "BiP (Binding Immunoglobulin Protein)",
                "C/EBP\u03b2 (CCAAT/enhancer-binding protein beta)",
                "CHOP (C/EBP Homologous Protein)",
                "CNP (C-type Natriuretic Peptide)",
                "EDEM1 (ER Degradation Enhancer, Mannosidase Alpha-like 1)",
                "FAM134B (Family With Sequence Similarity 134 Member B)",
                "GADD153 (Growth Arrest and DNA Damage-inducible Protein 153)",
                "GRP78 (Glucose-Regulated Protein 78)",
                "HSP70 (Heat Shock Protein 70)",
                "HSP90 (Heat Shock Protein 90)",
                "HSPA5 (Heat Shock Protein Family A Member 5)",
                "HYOU1 (Hypoxia Up-Regulated 1)",
                "IRE1 (Inositol-Requiring Enzyme 1)",
                "OSM (Oncostatin M)",
                "PDI (Protein Disulfide Isomerase)",
                "PERK (PKR-like Endoplasmic Reticulum Kinase)",
                "SDF-1 (Stromal Derived Factor 1)",
                "SEL1L (SEL1L Endoplasmic Reticulum Protein)",
                "SREBP1 (Sterol Regulatory Element-Binding Protein 1)",
                "TAX1BP1 (Tax1-binding protein 1)",
                "TRIB3 (Tribbles Homolog 3)",
                "XBP1 (X-Box Binding Protein 1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Binding immunoglobulin protein (BiP)",
            "Protein kinase R (PKR)-like endoplasmic reticulum kinase (PERK)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Activating transcription factor 6 (ATF6)",
            "ER degradation-enhancing alpha-mannosidase-like protein (EDEM)",
            "Endoplasmic Reticulum Oxidoreductin 1 (ERO1)",
            "Calnexin (CANX)",
            "Calreticulin (CALR)",
            "C/EBP Homologous Protein (CHOP)",
            "X-box binding protein 1 (XBP1)",
            "Endoplasmic reticulum protein 29 (ERp29)",
            "Endoplasmic reticulum protein 44 (ERp44)",
            "Endoplasmic reticulum protein 46 (ERp46)",
            "Endoplasmic reticulum protein 57 (ERp57)",
            "Endoplasmic reticulum protein 72 (ERp72)",
            "Oxygen-regulated protein (ORP150)",
            "Stress-70 protein, mitochondrial (GRP75)",
            "Endoplasmic reticulum resident protein 29 (ERP29)",
            "Endoplasmic reticulum resident protein 44 (ERP44)",
            "Endoplasmic reticulum resident protein 57 (ERP57)",
            "Endoplasmic reticulum resident protein 72 (ERP72)",
            "Unfolded protein response signal activator IRE1 (IRE1alpha)",
            "Unfolded Protein Response Activator ATF6 (ATF6alpha)",
            "Unfolded protein response activator PERK (PERK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Binding immunoglobulin protein (BiP)",
                "Protein kinase R (PKR)-like endoplasmic reticulum kinase (PERK)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Activating transcription factor 6 (ATF6)",
                "ER degradation-enhancing alpha-mannosidase-like protein (EDEM)",
                "Endoplasmic Reticulum Oxidoreductin 1 (ERO1)",
                "Calnexin (CANX)",
                "Calreticulin (CALR)",
                "C/EBP Homologous Protein (CHOP)",
                "X-box binding protein 1 (XBP1)",
                "Endoplasmic reticulum protein 29 (ERp29)",
                "Endoplasmic reticulum protein 44 (ERp44)",
                "Endoplasmic reticulum protein 57 (ERp57)",
                "Endoplasmic reticulum protein 72 (ERp72)",
                "Oxygen-regulated protein (ORP150)",
                "Stress-70 protein, mitochondrial (GRP75)",
                "Endoplasmic reticulum resident protein 29 (ERP29)",
                "Endoplasmic reticulum resident protein 44 (ERP44)",
                "Endoplasmic reticulum resident protein 57 (ERP57)",
                "Endoplasmic reticulum resident protein 72 (ERP72)",
                "Unfolded Protein Response Activator ATF6 (ATF6alpha)",
                "Unfolded protein response activator PERK (PERK)"
            ],
            "mismatches": [
                "Endoplasmic reticulum protein 46 (ERp46)",
                "Unfolded protein response signal activator IRE1 (IRE1alpha)"
            ],
            "true_referents": [
                "Activating transcription factor 6 (ATF6)",
                "Binding immunoglobulin protein (BiP)",
                "C/EBP Homologous Protein (CHOP)",
                "Calnexin (CANX)",
                "Calreticulin (CALR)",
                "ER degradation-enhancing alpha-mannosidase-like protein (EDEM)",
                "Endoplasmic Reticulum Oxidoreductin 1 (ERO1)",
                "Endoplasmic reticulum protein 29 (ERp29)",
                "Endoplasmic reticulum protein 44 (ERp44)",
                "Endoplasmic reticulum protein 46 (ERp46)",
                "Endoplasmic reticulum protein 57 (ERp57)",
                "Endoplasmic reticulum protein 72 (ERp72)",
                "Endoplasmic reticulum resident protein 29 (ERP29)",
                "Endoplasmic reticulum resident protein 44 (ERP44)",
                "Endoplasmic reticulum resident protein 57 (ERP57)",
                "Endoplasmic reticulum resident protein 72 (ERP72)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Oxygen-regulated protein (ORP150)",
                "Protein kinase R (PKR)-like endoplasmic reticulum kinase (PERK)",
                "Stress-70 protein, mitochondrial (GRP75)",
                "Unfolded Protein Response Activator ATF6 (ATF6alpha)",
                "Unfolded protein response activator PERK (PERK)",
                "Unfolded protein response signal activator IRE1 (IRE1alpha)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "BiP (Binding immunoglobulin protein)",
            "IRE1 (Inositol-requiring enzyme 1)",
            "PERK (Protein kinase R-like endoplasmic reticulum kinase)",
            "ATF6 (Activating transcription factor 6)",
            "XBP1 (X-box binding protein 1)",
            "GRP78 (Glucose-regulated protein 78)",
            "Hsp70 (Heat shock protein 70)",
            "Hsp90 (Heat shock protein 90)",
            "CHOP (C/EBP homologous protein)",
            "Calnexin",
            "Calreticulin",
            "EDEM (ER degradation-enhancing alpha-mannosidase-like protein)",
            "ERdj5 (Endoplasmic reticulum DnaJ homolog 5)",
            "PDI (Protein disulfide isomerase)",
            "ERO1 (Endoplasmic reticulum oxidoreductin 1)",
            "Derlin-1",
            "Derlin-2",
            "Derlin-3",
            "SEL1L (Suppressor/enhancer of lin-12-like)",
            "HRD1 (HMG-CoA reductase degradation 1 homolog)",
            "OS-9 (Osteosarcoma amplified 9)",
            "EDEM1 (ER degradation-enhancing alpha-mannosidase-like protein 1)",
            "EDEM2 (ER degradation-enhancing alpha-mannosidase-like protein 2)",
            "EDEM3 (ER degradation-enhancing alpha-mannosidase-like protein 3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BiP (Binding immunoglobulin protein)",
                "IRE1 (Inositol-requiring enzyme 1)",
                "PERK (Protein kinase R-like endoplasmic reticulum kinase)",
                "ATF6 (Activating transcription factor 6)",
                "XBP1 (X-box binding protein 1)",
                "GRP78 (Glucose-regulated protein 78)",
                "Hsp70 (Heat shock protein 70)",
                "Hsp90 (Heat shock protein 90)",
                "CHOP (C/EBP homologous protein)",
                "Calnexin",
                "Calreticulin",
                "EDEM (ER degradation-enhancing alpha-mannosidase-like protein)",
                "ERdj5 (Endoplasmic reticulum DnaJ homolog 5)",
                "PDI (Protein disulfide isomerase)",
                "ERO1 (Endoplasmic reticulum oxidoreductin 1)",
                "Derlin-1",
                "Derlin-2",
                "Derlin-3",
                "SEL1L (Suppressor/enhancer of lin-12-like)",
                "HRD1 (HMG-CoA reductase degradation 1 homolog)",
                "OS-9 (Osteosarcoma amplified 9)",
                "EDEM1 (ER degradation-enhancing alpha-mannosidase-like protein 1)",
                "EDEM2 (ER degradation-enhancing alpha-mannosidase-like protein 2)",
                "EDEM3 (ER degradation-enhancing alpha-mannosidase-like protein 3)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF6 (Activating transcription factor 6)",
                "BiP (Binding immunoglobulin protein)",
                "CHOP (C/EBP homologous protein)",
                "Calnexin",
                "Calreticulin",
                "Derlin-1",
                "Derlin-2",
                "Derlin-3",
                "EDEM (ER degradation-enhancing alpha-mannosidase-like protein)",
                "EDEM1 (ER degradation-enhancing alpha-mannosidase-like protein 1)",
                "EDEM2 (ER degradation-enhancing alpha-mannosidase-like protein 2)",
                "EDEM3 (ER degradation-enhancing alpha-mannosidase-like protein 3)",
                "ERO1 (Endoplasmic reticulum oxidoreductin 1)",
                "ERdj5 (Endoplasmic reticulum DnaJ homolog 5)",
                "GRP78 (Glucose-regulated protein 78)",
                "HRD1 (HMG-CoA reductase degradation 1 homolog)",
                "Hsp70 (Heat shock protein 70)",
                "Hsp90 (Heat shock protein 90)",
                "IRE1 (Inositol-requiring enzyme 1)",
                "OS-9 (Osteosarcoma amplified 9)",
                "PDI (Protein disulfide isomerase)",
                "PERK (Protein kinase R-like endoplasmic reticulum kinase)",
                "SEL1L (Suppressor/enhancer of lin-12-like)",
                "XBP1 (X-box binding protein 1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "BiP (GRP78)",
            "ATF6",
            "IRE1",
            "PERK",
            "eIF2\u03b1",
            "XBP1",
            "CHOP",
            "ATF4",
            "GRP94",
            "ERN1",
            "EIF2AK3",
            "HSPA5",
            "DDIT3",
            "DNAJB9",
            "CLGN",
            "HERPUD1",
            "ATF3",
            "JUN",
            "MCL1",
            "BIRC3",
            "EDEM1",
            "SEL1L",
            "OS9",
            "PDIA4"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BiP (GRP78)",
                "ATF6",
                "IRE1",
                "PERK",
                "eIF2\u03b1",
                "XBP1",
                "CHOP",
                "ATF4",
                "GRP94",
                "ERN1",
                "EIF2AK3",
                "HSPA5",
                "DDIT3",
                "DNAJB9",
                "CLGN",
                "HERPUD1",
                "ATF3",
                "JUN",
                "MCL1",
                "BIRC3",
                "EDEM1",
                "SEL1L",
                "OS9",
                "PDIA4"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF3",
                "ATF4",
                "ATF6",
                "BIRC3",
                "BiP (GRP78)",
                "CHOP",
                "CLGN",
                "DDIT3",
                "DNAJB9",
                "EDEM1",
                "EIF2AK3",
                "ERN1",
                "GRP94",
                "HERPUD1",
                "HSPA5",
                "IRE1",
                "JUN",
                "MCL1",
                "OS9",
                "PDIA4",
                "PERK",
                "SEL1L",
                "XBP1",
                "eIF2\u03b1"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Inositol-requiring enzyme 1 (IRE1)",
            "Activating transcription factor 6 (ATF6)",
            "Protein kinase RNA-like endoplasmic reticulum kinase (PERK)",
            "X-box binding protein 1 (XBP1)",
            "Glucose-regulated protein 78 (GRP78/BiP)",
            "Glucose-regulated protein 94 (GRP94)",
            "Endoplasmic reticulum oxidoreductase 1 (ERO1)",
            "Protein disulfide isomerase (PDI)",
            "Calnexin",
            "Calreticulin",
            "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "Homocysteine-induced ER protein (HERP)",
            "Stromal cell-derived factor 2-like protein 1 (SDF2L1)",
            "Endoplasmic reticulum lectin 1 (ERLEC1)",
            "Endoplasmic reticulum resident protein 29 (ERp29)",
            "Endoplasmic reticulum resident protein 44 (ERp44)",
            "Endoplasmic reticulum resident protein 57 (ERp57)",
            "Endoplasmic reticulum resident protein 72 (ERp72)",
            "Heat shock protein 47 (HSP47)",
            "Hypoxia up-regulated 1 (HYOU1)",
            "Protein sel-1 homolog 1 (SEL1L)",
            "Synoviolin (SYVN1)",
            "Transducin-like enhancer protein 3 (TLE3)",
            "UDP-glucose:glycoprotein glucosyltransferase 1 (UGGT1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Inositol-requiring enzyme 1 (IRE1)",
                "Activating transcription factor 6 (ATF6)",
                "Protein kinase RNA-like endoplasmic reticulum kinase (PERK)",
                "X-box binding protein 1 (XBP1)",
                "Glucose-regulated protein 78 (GRP78/BiP)",
                "Glucose-regulated protein 94 (GRP94)",
                "Endoplasmic reticulum oxidoreductase 1 (ERO1)",
                "Protein disulfide isomerase (PDI)",
                "Calnexin",
                "Calreticulin",
                "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Homocysteine-induced ER protein (HERP)",
                "Stromal cell-derived factor 2-like protein 1 (SDF2L1)",
                "Endoplasmic reticulum lectin 1 (ERLEC1)",
                "Endoplasmic reticulum resident protein 29 (ERp29)",
                "Endoplasmic reticulum resident protein 44 (ERp44)",
                "Endoplasmic reticulum resident protein 57 (ERp57)",
                "Endoplasmic reticulum resident protein 72 (ERp72)",
                "Heat shock protein 47 (HSP47)",
                "Hypoxia up-regulated 1 (HYOU1)",
                "Protein sel-1 homolog 1 (SEL1L)",
                "Synoviolin (SYVN1)",
                "Transducin-like enhancer protein 3 (TLE3)",
                "UDP-glucose:glycoprotein glucosyltransferase 1 (UGGT1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 6 (ATF6)",
                "Calnexin",
                "Calreticulin",
                "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Endoplasmic reticulum lectin 1 (ERLEC1)",
                "Endoplasmic reticulum oxidoreductase 1 (ERO1)",
                "Endoplasmic reticulum resident protein 29 (ERp29)",
                "Endoplasmic reticulum resident protein 44 (ERp44)",
                "Endoplasmic reticulum resident protein 57 (ERp57)",
                "Endoplasmic reticulum resident protein 72 (ERp72)",
                "Glucose-regulated protein 78 (GRP78/BiP)",
                "Glucose-regulated protein 94 (GRP94)",
                "Heat shock protein 47 (HSP47)",
                "Homocysteine-induced ER protein (HERP)",
                "Hypoxia up-regulated 1 (HYOU1)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase RNA-like endoplasmic reticulum kinase (PERK)",
                "Protein sel-1 homolog 1 (SEL1L)",
                "Stromal cell-derived factor 2-like protein 1 (SDF2L1)",
                "Synoviolin (SYVN1)",
                "Transducin-like enhancer protein 3 (TLE3)",
                "UDP-glucose:glycoprotein glucosyltransferase 1 (UGGT1)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating transcription factor 6 (ATF6)",
            "Activating transcription factor 4 (ATF4)",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Glucose-regulated protein 78 (GRP78)",
            "Glucose-regulated protein 94 (GRP94)",
            "Calreticulin (CALR)",
            "Endoplasmic reticulum resident protein 44 (ERp44)",
            "Protein disulfide isomerase (PDI)",
            "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
            "DnaJ homolog subfamily B member 11 (DNAJB11)",
            "Endoplasmic reticulum lectin 1 (ERLEC1)",
            "ER degradation enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "Homocysteine-responsive endoplasmic reticulum-resident ubiquitin-like domain member 1 protein (HERPUD1)",
            "Endoplasmic reticulum resident protein 29 (ERP29)",
            "Endoplasmic reticulum aminopeptidase 1 (ERAP1)",
            "Endoplasmic reticulum aminopeptidase 2 (ERAP2)",
            "ER membrane protein complex subunit 1 (EMC1)",
            "ER membrane protein complex subunit 2 (EMC2)",
            "ER membrane protein complex subunit 3 (EMC3)",
            "ER membrane protein complex subunit 4 (EMC4)",
            "ER membrane protein complex subunit 5 (EMC5)",
            "ER membrane protein complex subunit 6 (EMC6)",
            "ER membrane protein complex subunit 7 (EMC7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating transcription factor 6 (ATF6)",
                "Activating transcription factor 4 (ATF4)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Calreticulin (CALR)",
                "Endoplasmic reticulum resident protein 44 (ERp44)",
                "Protein disulfide isomerase (PDI)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "DnaJ homolog subfamily B member 11 (DNAJB11)",
                "Endoplasmic reticulum lectin 1 (ERLEC1)",
                "ER degradation enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Homocysteine-responsive endoplasmic reticulum-resident ubiquitin-like domain member 1 protein (HERPUD1)",
                "Endoplasmic reticulum resident protein 29 (ERP29)",
                "Endoplasmic reticulum aminopeptidase 1 (ERAP1)",
                "Endoplasmic reticulum aminopeptidase 2 (ERAP2)",
                "ER membrane protein complex subunit 1 (EMC1)",
                "ER membrane protein complex subunit 2 (EMC2)",
                "ER membrane protein complex subunit 3 (EMC3)",
                "ER membrane protein complex subunit 4 (EMC4)",
                "ER membrane protein complex subunit 5 (EMC5)",
                "ER membrane protein complex subunit 6 (EMC6)",
                "ER membrane protein complex subunit 7 (EMC7)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6)",
                "Calreticulin (CALR)",
                "DnaJ homolog subfamily B member 11 (DNAJB11)",
                "ER degradation enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "ER membrane protein complex subunit 1 (EMC1)",
                "ER membrane protein complex subunit 2 (EMC2)",
                "ER membrane protein complex subunit 3 (EMC3)",
                "ER membrane protein complex subunit 4 (EMC4)",
                "ER membrane protein complex subunit 5 (EMC5)",
                "ER membrane protein complex subunit 6 (EMC6)",
                "ER membrane protein complex subunit 7 (EMC7)",
                "Endoplasmic reticulum aminopeptidase 1 (ERAP1)",
                "Endoplasmic reticulum aminopeptidase 2 (ERAP2)",
                "Endoplasmic reticulum lectin 1 (ERLEC1)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Endoplasmic reticulum resident protein 29 (ERP29)",
                "Endoplasmic reticulum resident protein 44 (ERp44)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Homocysteine-responsive endoplasmic reticulum-resident ubiquitin-like domain member 1 protein (HERPUD1)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Immunoglobulin heavy chain-binding protein (BiP)",
            "Glucose-regulated protein 78 (GRP78)",
            "Heat shock 70 kDa protein 5 (HSPA5)",
            "Endoplasmic reticulum chaperone SIL1",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Activating transcription factor 6 (ATF6)",
            "X-box binding protein 1 (XBP1)",
            "C/EBP homologous protein (CHOP)",
            "Calnexin",
            "Calreticulin",
            "Protein disulfide isomerase (PDI)",
            "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
            "Endoplasmic reticulum mannosidase I",
            "DNAJ homolog subfamily B member 9 (DNAJB9)",
            "Endoplasmic reticulum lectin 1 (ERLEC1)",
            "Osteosarcoma amplified 9 (OS9)",
            "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 2 (EDEM2)",
            "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 3 (EDEM3)",
            "Synoviolin 1 (SYVN1)",
            "Endoplasmic reticulum-associated degradation protein 1 (ERAP1)",
            "Valosin-containing protein (VCP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Immunoglobulin heavy chain-binding protein (BiP)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock 70 kDa protein 5 (HSPA5)",
                "Endoplasmic reticulum chaperone SIL1",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Activating transcription factor 6 (ATF6)",
                "X-box binding protein 1 (XBP1)",
                "C/EBP homologous protein (CHOP)",
                "Calnexin",
                "Calreticulin",
                "Protein disulfide isomerase (PDI)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Endoplasmic reticulum mannosidase I",
                "DNAJ homolog subfamily B member 9 (DNAJB9)",
                "Endoplasmic reticulum lectin 1 (ERLEC1)",
                "Osteosarcoma amplified 9 (OS9)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 2 (EDEM2)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 3 (EDEM3)",
                "Synoviolin 1 (SYVN1)",
                "Endoplasmic reticulum-associated degradation protein 1 (ERAP1)",
                "Valosin-containing protein (VCP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 6 (ATF6)",
                "C/EBP homologous protein (CHOP)",
                "Calnexin",
                "Calreticulin",
                "DNAJ homolog subfamily B member 9 (DNAJB9)",
                "Endoplasmic reticulum chaperone SIL1",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 2 (EDEM2)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 3 (EDEM3)",
                "Endoplasmic reticulum lectin 1 (ERLEC1)",
                "Endoplasmic reticulum mannosidase I",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Endoplasmic reticulum-associated degradation protein 1 (ERAP1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock 70 kDa protein 5 (HSPA5)",
                "Immunoglobulin heavy chain-binding protein (BiP)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Osteosarcoma amplified 9 (OS9)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Synoviolin 1 (SYVN1)",
                "Valosin-containing protein (VCP)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Binding immunoglobulin protein (BiP)",
            "Glucose-regulated protein 78 (GRP78)",
            "Heat shock 70 kDa protein 5 (HSPA5)",
            "PRKR-like endoplasmic reticulum kinase (PERK)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Activating transcription factor 6 (ATF6)",
            "Protein disulfide isomerase (PDI)",
            "Endoplasmic reticulum oxidoreductin-1 (Ero1)",
            "Calreticulin (CALR)",
            "Calnexin (CANX)",
            "Protein kinase R (PKR)",
            "Eukaryotic translation initiation factor 2 subunit 1 (EIF2S1)",
            "X-box binding protein 1 (XBP1)",
            "Activating transcription factor 4 (ATF4)",
            "CCAAT/enhancer-binding protein homologous protein (CHOP)",
            "Endoplasmic reticulum-associated degradation (ERAD) pathway",
            "Unfolded protein response (UPR)",
            "Endoplasmic reticulum stress (ER stress)",
            "Misfolded protein aggregation",
            "Endoplasmic reticulum-Golgi intermediate compartment (ERGIC)",
            "Sarco/endoplasmic reticulum Ca2+-ATPase (SERCA)",
            "Phosphoinositide 3-kinase (PI3K)",
            "Mammalian target of rapamycin (mTOR)",
            "Autophagy"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Binding immunoglobulin protein (BiP)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock 70 kDa protein 5 (HSPA5)",
                "PRKR-like endoplasmic reticulum kinase (PERK)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Activating transcription factor 6 (ATF6)",
                "Protein disulfide isomerase (PDI)",
                "Endoplasmic reticulum oxidoreductin-1 (Ero1)",
                "Calreticulin (CALR)",
                "Calnexin (CANX)",
                "Protein kinase R (PKR)",
                "Eukaryotic translation initiation factor 2 subunit 1 (EIF2S1)",
                "X-box binding protein 1 (XBP1)",
                "Activating transcription factor 4 (ATF4)",
                "CCAAT/enhancer-binding protein homologous protein (CHOP)",
                "Endoplasmic reticulum-associated degradation (ERAD) pathway",
                "Unfolded protein response (UPR)",
                "Endoplasmic reticulum stress (ER stress)",
                "Misfolded protein aggregation",
                "Endoplasmic reticulum-Golgi intermediate compartment (ERGIC)",
                "Sarco/endoplasmic reticulum Ca2+-ATPase (SERCA)",
                "Phosphoinositide 3-kinase (PI3K)",
                "Mammalian target of rapamycin (mTOR)",
                "Autophagy"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6)",
                "Autophagy",
                "Binding immunoglobulin protein (BiP)",
                "CCAAT/enhancer-binding protein homologous protein (CHOP)",
                "Calnexin (CANX)",
                "Calreticulin (CALR)",
                "Endoplasmic reticulum oxidoreductin-1 (Ero1)",
                "Endoplasmic reticulum stress (ER stress)",
                "Endoplasmic reticulum-Golgi intermediate compartment (ERGIC)",
                "Endoplasmic reticulum-associated degradation (ERAD) pathway",
                "Eukaryotic translation initiation factor 2 subunit 1 (EIF2S1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock 70 kDa protein 5 (HSPA5)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Mammalian target of rapamycin (mTOR)",
                "Misfolded protein aggregation",
                "PRKR-like endoplasmic reticulum kinase (PERK)",
                "Phosphoinositide 3-kinase (PI3K)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase R (PKR)",
                "Sarco/endoplasmic reticulum Ca2+-ATPase (SERCA)",
                "Unfolded protein response (UPR)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "ATF6 (Activating Transcription Factor 6) (ATF6)",
            "Bach1 (BTB and CNC homology 1)",
            "CHOP (C/EBP homologous protein)",
            "CREB (Cyclic AMP-Responsive Element Binding) protein",
            "EDEM (ER degradation enhancing alpha-mannosidase-like protein)",
            "ERp29 (Endoplasmic Reticulum protein 29)",
            "Grp78 (Glucose-regulated protein 78)",
            "HAC1 (Homologous to ATF6 and CREB3)",
            "IRE1 (Inositol Requiring Enzyme 1)",
            "PERK (PKR-like Endoplasmic Reticulum Kinase)",
            "PRDX1 (Peroxiredoxin 1)",
            "RIDD (Regulated IRE1-Dependent Decay)",
            "SEC61 (Sec61 translocon subunit alpha)",
            "SEC63 (Sec63 protein)",
            "SEC71 (Sec71 protein)",
            "SEL1L (Sel1-like protein)",
            "TRAF2 (Tumor Necrosis Factor Receptor-Associated Factor 2)",
            "TRAF3 (Tumor Necrosis Factor Receptor-Associated Factor 3)",
            "TRAF6 (Tumor Necrosis Factor Receptor-Associated Factor 6)",
            "UBR1 (Ubiquitin-protein ligase L1)",
            "UBR2 (Ubiquitin-protein ligase L2)",
            "XBP1 (X-box binding protein 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATF6 (Activating Transcription Factor 6) (ATF6)",
                "Bach1 (BTB and CNC homology 1)",
                "CHOP (C/EBP homologous protein)",
                "CREB (Cyclic AMP-Responsive Element Binding) protein",
                "EDEM (ER degradation enhancing alpha-mannosidase-like protein)",
                "ERp29 (Endoplasmic Reticulum protein 29)",
                "Grp78 (Glucose-regulated protein 78)",
                "HAC1 (Homologous to ATF6 and CREB3)",
                "IRE1 (Inositol Requiring Enzyme 1)",
                "PERK (PKR-like Endoplasmic Reticulum Kinase)",
                "PRDX1 (Peroxiredoxin 1)",
                "RIDD (Regulated IRE1-Dependent Decay)",
                "SEC61 (Sec61 translocon subunit alpha)",
                "SEC63 (Sec63 protein)",
                "SEC71 (Sec71 protein)",
                "SEL1L (Sel1-like protein)",
                "TRAF2 (Tumor Necrosis Factor Receptor-Associated Factor 2)",
                "TRAF3 (Tumor Necrosis Factor Receptor-Associated Factor 3)",
                "TRAF6 (Tumor Necrosis Factor Receptor-Associated Factor 6)",
                "UBR1 (Ubiquitin-protein ligase L1)",
                "UBR2 (Ubiquitin-protein ligase L2)",
                "XBP1 (X-box binding protein 1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF6 (Activating Transcription Factor 6) (ATF6)",
                "Bach1 (BTB and CNC homology 1)",
                "CHOP (C/EBP homologous protein)",
                "CREB (Cyclic AMP-Responsive Element Binding) protein",
                "EDEM (ER degradation enhancing alpha-mannosidase-like protein)",
                "ERp29 (Endoplasmic Reticulum protein 29)",
                "Grp78 (Glucose-regulated protein 78)",
                "HAC1 (Homologous to ATF6 and CREB3)",
                "IRE1 (Inositol Requiring Enzyme 1)",
                "PERK (PKR-like Endoplasmic Reticulum Kinase)",
                "PRDX1 (Peroxiredoxin 1)",
                "RIDD (Regulated IRE1-Dependent Decay)",
                "SEC61 (Sec61 translocon subunit alpha)",
                "SEC63 (Sec63 protein)",
                "SEC71 (Sec71 protein)",
                "SEL1L (Sel1-like protein)",
                "TRAF2 (Tumor Necrosis Factor Receptor-Associated Factor 2)",
                "TRAF3 (Tumor Necrosis Factor Receptor-Associated Factor 3)",
                "TRAF6 (Tumor Necrosis Factor Receptor-Associated Factor 6)",
                "UBR1 (Ubiquitin-protein ligase L1)",
                "UBR2 (Ubiquitin-protein ligase L2)",
                "XBP1 (X-box binding protein 1)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating transcription factor 6 (ATF6) (ATF6)",
            "X-box binding protein 1 (XBP1)",
            "Inositol-requiring enzyme 1 alpha (IRE1-alpha)",
            "PKR-like ER kinase (PERK)",
            "Activating transcription factor 4 (ATF4)",
            "CCAAT/enhancer-binding protein (C/EBP) homologous protein (CHOP)",
            "DNA-damage-inducible transcript 3 (DDIT3)",
            "Glucose-regulated protein 78 (GRP78)",
            "Glucose-regulated protein 94 (GRP94)",
            "Endoplasmic reticulum-resident protein 29 (ERP29)",
            "Endoplasmic reticulum-resident protein 44 (ERP44)",
            "Endoplasmic reticulum-resident protein 46 (ERP46)",
            "Protein disulfide isomerase family A, member 2 (PDI-P2)",
            "Protein disulfide isomerase family A, member 4 (PDI-P4)",
            "Protein disulfide isomerase family A, member 6 (PDI-P6)",
            "Endoplasmic reticulum protein 18 (ERp18)",
            "Endoplasmic reticulum protein 27 (ERp27)",
            "Endoplasmic reticulum protein 30 (ERp30)",
            "Endoplasmic reticulum protein 44 (ERp44)",
            "Endoplasmic reticulum protein 46 (ERp46)",
            "Endoplasmic reticulum protein 72 (ERp72)",
            "Osteonidogen (OSN)",
            "Osteonidogen 2 (OSN2)",
            "ER stress-associated protein 1 (ERSP1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating transcription factor 6 (ATF6) (ATF6)",
                "X-box binding protein 1 (XBP1)",
                "Inositol-requiring enzyme 1 alpha (IRE1-alpha)",
                "PKR-like ER kinase (PERK)",
                "Activating transcription factor 4 (ATF4)",
                "CCAAT/enhancer-binding protein (C/EBP) homologous protein (CHOP)",
                "DNA-damage-inducible transcript 3 (DDIT3)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Endoplasmic reticulum-resident protein 29 (ERP29)",
                "Endoplasmic reticulum-resident protein 44 (ERP44)",
                "Endoplasmic reticulum-resident protein 46 (ERP46)",
                "Protein disulfide isomerase family A, member 2 (PDI-P2)",
                "Protein disulfide isomerase family A, member 4 (PDI-P4)",
                "Protein disulfide isomerase family A, member 6 (PDI-P6)",
                "Endoplasmic reticulum protein 18 (ERp18)",
                "Endoplasmic reticulum protein 27 (ERp27)",
                "Endoplasmic reticulum protein 30 (ERp30)",
                "Endoplasmic reticulum protein 44 (ERp44)",
                "Endoplasmic reticulum protein 46 (ERp46)",
                "Endoplasmic reticulum protein 72 (ERp72)",
                "Osteonidogen (OSN)",
                "Osteonidogen 2 (OSN2)",
                "ER stress-associated protein 1 (ERSP1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6) (ATF6)",
                "CCAAT/enhancer-binding protein (C/EBP) homologous protein (CHOP)",
                "DNA-damage-inducible transcript 3 (DDIT3)",
                "ER stress-associated protein 1 (ERSP1)",
                "Endoplasmic reticulum protein 18 (ERp18)",
                "Endoplasmic reticulum protein 27 (ERp27)",
                "Endoplasmic reticulum protein 30 (ERp30)",
                "Endoplasmic reticulum protein 44 (ERp44)",
                "Endoplasmic reticulum protein 46 (ERp46)",
                "Endoplasmic reticulum protein 72 (ERp72)",
                "Endoplasmic reticulum-resident protein 29 (ERP29)",
                "Endoplasmic reticulum-resident protein 44 (ERP44)",
                "Endoplasmic reticulum-resident protein 46 (ERP46)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Inositol-requiring enzyme 1 alpha (IRE1-alpha)",
                "Osteonidogen (OSN)",
                "Osteonidogen 2 (OSN2)",
                "PKR-like ER kinase (PERK)",
                "Protein disulfide isomerase family A, member 2 (PDI-P2)",
                "Protein disulfide isomerase family A, member 4 (PDI-P4)",
                "Protein disulfide isomerase family A, member 6 (PDI-P6)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            {
                "Referent": "BiP (70kDa glucose-regulated protein)",
                "Canonical name": "70kDa glucose-regulated protein"
            },
            {
                "Referent": "GRP78 (78kDa glucose-regulated protein)",
                "Canonical name": "78kDa glucose-regulated protein"
            },
            {
                "Referent": "GRP94 (94kDa glucose-regulated protein)",
                "Canonical name": "94kDa glucose-regulated protein"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BiP (70kDa glucose-regulated protein)",
                "GRP78 (78kDa glucose-regulated protein)",
                "GRP94 (94kDa glucose-regulated protein)"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"BiP (70kDa glucose-regulated protein)\", \"Canonical name\": \"70kDa glucose-regulated protein\"}",
                "{\"Referent\": \"GRP78 (78kDa glucose-regulated protein)\", \"Canonical name\": \"78kDa glucose-regulated protein\"}",
                "{\"Referent\": \"GRP94 (94kDa glucose-regulated protein)\", \"Canonical name\": \"94kDa glucose-regulated protein\"}"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 0
        }
    }
]