[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "IRE1 (ERN1)",
            "XBP1",
            "ATF6",
            "PERK (EIF2AK3)",
            "DDIT3 (CHOP)",
            "HERPUD1",
            "DNAJB11",
            "DNAJC3",
            "DNAJB9",
            "DNAJC13",
            "EDEM1",
            "EDEM2",
            "EDEM3",
            "P58IPK (HERPUD2)",
            "P8 (HERP)",
            "PDI (PDIA1)",
            "ERDJ4",
            "ERDJ5",
            "ERO1L",
            "HSPA5 (GRP78)",
            "HSPA8 (GRP75)",
            "HSP90B1 (GRP94)",
            "HYOU1 (GRP170)",
            "CALR"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "IRE1 (ERN1)",
                "XBP1",
                "ATF6",
                "PERK (EIF2AK3)",
                "DDIT3 (CHOP)",
                "HERPUD1",
                "DNAJB11",
                "DNAJC3",
                "DNAJB9",
                "DNAJC13",
                "EDEM1",
                "EDEM2",
                "EDEM3",
                "P58IPK (HERPUD2)",
                "P8 (HERP)",
                "PDI (PDIA1)",
                "ERDJ4",
                "ERDJ5",
                "ERO1L",
                "HSPA5 (GRP78)",
                "HSPA8 (GRP75)",
                "HSP90B1 (GRP94)",
                "HYOU1 (GRP170)",
                "CALR"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF6",
                "CALR",
                "DDIT3 (CHOP)",
                "DNAJB11",
                "DNAJB9",
                "DNAJC13",
                "DNAJC3",
                "EDEM1",
                "EDEM2",
                "EDEM3",
                "ERDJ4",
                "ERDJ5",
                "ERO1L",
                "HERPUD1",
                "HSP90B1 (GRP94)",
                "HSPA5 (GRP78)",
                "HSPA8 (GRP75)",
                "HYOU1 (GRP170)",
                "IRE1 (ERN1)",
                "P58IPK (HERPUD2)",
                "P8 (HERP)",
                "PDI (PDIA1)",
                "PERK (EIF2AK3)",
                "XBP1"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating Transcription Factor 6 (ATF6)",
            "Inositol-Requiring Enzyme 1 (IRE1)",
            "Protein Kinase RNA-like Endoplasmic Reticulum Kinase (PERK)",
            "Binding Immunoglobulin Protein (BiP)/Glucose-Regulated Protein 78 (GRP78)",
            "X-box Binding Protein 1 (XBP1)",
            "ATF4 (Activating Transcription Factor 4)",
            "CHOP (C/EBP Homologous Protein)",
            "EDEM1 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 1)",
            "Herp (Homocysteine Inducible ER Protein)",
            "GADD34 (Growth Arrest and DNA Damage-inducible protein 34)",
            "EDEM2 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 2)",
            "EDEM3 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 3)",
            "ERp57 (ER Protein 57)",
            "Calnexin",
            "Calreticulin",
            "PDI (Protein Disulfide Isomerase)",
            "ERdj3 (ER DnaJ Homolog 3)",
            "ERdj4 (ER DnaJ Homolog 4)",
            "ERdj5 (ER DnaJ Homolog 5)",
            "ERdj6 (ER DnaJ Homolog 6)",
            "ERp72 (ER Protein 72)",
            "GADD34-Binding Protein 1 (GADD34BP1)",
            "TRAF2 (TNF Receptor Associated Factor 2)",
            "ASK1 (Apoptosis Signal-regulating Kinase 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating Transcription Factor 6 (ATF6)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Protein Kinase RNA-like Endoplasmic Reticulum Kinase (PERK)",
                "Binding Immunoglobulin Protein (BiP)/Glucose-Regulated Protein 78 (GRP78)",
                "X-box Binding Protein 1 (XBP1)",
                "ATF4 (Activating Transcription Factor 4)",
                "CHOP (C/EBP Homologous Protein)",
                "EDEM1 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 1)",
                "Herp (Homocysteine Inducible ER Protein)",
                "GADD34 (Growth Arrest and DNA Damage-inducible protein 34)",
                "EDEM2 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 2)",
                "EDEM3 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 3)",
                "ERp57 (ER Protein 57)",
                "Calnexin",
                "Calreticulin",
                "PDI (Protein Disulfide Isomerase)",
                "ERdj3 (ER DnaJ Homolog 3)",
                "ERdj4 (ER DnaJ Homolog 4)",
                "ERdj5 (ER DnaJ Homolog 5)",
                "ERdj6 (ER DnaJ Homolog 6)",
                "ERp72 (ER Protein 72)",
                "GADD34-Binding Protein 1 (GADD34BP1)",
                "TRAF2 (TNF Receptor Associated Factor 2)",
                "ASK1 (Apoptosis Signal-regulating Kinase 1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ASK1 (Apoptosis Signal-regulating Kinase 1)",
                "ATF4 (Activating Transcription Factor 4)",
                "Activating Transcription Factor 6 (ATF6)",
                "Binding Immunoglobulin Protein (BiP)/Glucose-Regulated Protein 78 (GRP78)",
                "CHOP (C/EBP Homologous Protein)",
                "Calnexin",
                "Calreticulin",
                "EDEM1 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 1)",
                "EDEM2 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 2)",
                "EDEM3 (ER Degradation Enhancing \u03b1-Mannosidase-like Protein 3)",
                "ERdj3 (ER DnaJ Homolog 3)",
                "ERdj4 (ER DnaJ Homolog 4)",
                "ERdj5 (ER DnaJ Homolog 5)",
                "ERdj6 (ER DnaJ Homolog 6)",
                "ERp57 (ER Protein 57)",
                "ERp72 (ER Protein 72)",
                "GADD34 (Growth Arrest and DNA Damage-inducible protein 34)",
                "GADD34-Binding Protein 1 (GADD34BP1)",
                "Herp (Homocysteine Inducible ER Protein)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "PDI (Protein Disulfide Isomerase)",
                "Protein Kinase RNA-like Endoplasmic Reticulum Kinase (PERK)",
                "TRAF2 (TNF Receptor Associated Factor 2)",
                "X-box Binding Protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "ATF6 (Activating transcription factor 6)",
            "IRE1 (Inositol-requiring enzyme 1)",
            "PERK (Protein kinase R-like endoplasmic reticulum kinase)",
            "GRP78/BiP (Glucose-regulated protein 78 kDa/Binding immunoglobulin Protein)",
            "XBP1 (X-box binding protein 1)",
            "ATF4 (Activating transcription factor 4)",
            "CHOP (C/EBP homologous protein)",
            "ATF3 (Activating transcription factor 3)",
            "EDEM1 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 1)",
            "PDI (Protein disulfide isomerase)",
            "ERp57 (Endoplasmic reticulum protein 57)",
            "Calnexin",
            "Calreticulin",
            "ERp72 (Endoplasmic reticulum protein 72)",
            "HSP40 (Heat shock protein 40)",
            "HSP90 (Heat shock protein 90)",
            "GRP94 (Glucose-regulated protein 94)",
            "EIF2AK3 (Eukaryotic translation initiation factor 2 alpha kinase 3)",
            "EIF2S1 (Eukaryotic translation initiation factor 2 subunit 1)",
            "EIF2A (Eukaryotic translation initiation factor 2A)",
            "ERN1 (Endoplasmic reticulum to nucleus signaling 1)",
            "EDEM2 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 2)",
            "EDEM3 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATF6 (Activating transcription factor 6)",
                "IRE1 (Inositol-requiring enzyme 1)",
                "PERK (Protein kinase R-like endoplasmic reticulum kinase)",
                "GRP78/BiP (Glucose-regulated protein 78 kDa/Binding immunoglobulin Protein)",
                "XBP1 (X-box binding protein 1)",
                "ATF4 (Activating transcription factor 4)",
                "CHOP (C/EBP homologous protein)",
                "ATF3 (Activating transcription factor 3)",
                "EDEM1 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 1)",
                "PDI (Protein disulfide isomerase)",
                "ERp57 (Endoplasmic reticulum protein 57)",
                "Calnexin",
                "Calreticulin",
                "ERp72 (Endoplasmic reticulum protein 72)",
                "HSP40 (Heat shock protein 40)",
                "HSP90 (Heat shock protein 90)",
                "GRP94 (Glucose-regulated protein 94)",
                "EIF2AK3 (Eukaryotic translation initiation factor 2 alpha kinase 3)",
                "EIF2S1 (Eukaryotic translation initiation factor 2 subunit 1)",
                "EIF2A (Eukaryotic translation initiation factor 2A)",
                "ERN1 (Endoplasmic reticulum to nucleus signaling 1)",
                "EDEM2 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 2)",
                "EDEM3 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 3)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF3 (Activating transcription factor 3)",
                "ATF4 (Activating transcription factor 4)",
                "ATF6 (Activating transcription factor 6)",
                "CHOP (C/EBP homologous protein)",
                "Calnexin",
                "Calreticulin",
                "EDEM1 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 1)",
                "EDEM2 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 2)",
                "EDEM3 (ER Degradation Enhancing Alpha-Mannosidase Like Protein 3)",
                "EIF2A (Eukaryotic translation initiation factor 2A)",
                "EIF2AK3 (Eukaryotic translation initiation factor 2 alpha kinase 3)",
                "EIF2S1 (Eukaryotic translation initiation factor 2 subunit 1)",
                "ERN1 (Endoplasmic reticulum to nucleus signaling 1)",
                "ERp57 (Endoplasmic reticulum protein 57)",
                "ERp72 (Endoplasmic reticulum protein 72)",
                "GRP78/BiP (Glucose-regulated protein 78 kDa/Binding immunoglobulin Protein)",
                "GRP94 (Glucose-regulated protein 94)",
                "HSP40 (Heat shock protein 40)",
                "HSP90 (Heat shock protein 90)",
                "IRE1 (Inositol-requiring enzyme 1)",
                "PDI (Protein disulfide isomerase)",
                "PERK (Protein kinase R-like endoplasmic reticulum kinase)",
                "XBP1 (X-box binding protein 1)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "IRE1\u03b1 (ERFE)",
            "IRE1\u03b2 (ERFE2)",
            "XBP1 (XBP1s/u)",
            "BiP/GRP78 (HSPA5)",
            "PERK (EIF2AK3)",
            "ATF4 (CREB2)",
            "CHOP (DDIT3)",
            "GADD34 (PPP1R15A)",
            "eIF2\u03b1 (EIF2S1)",
            "JNK1 (MAPK8)",
            "JNK2 (MAPK9)",
            "IRE1 endonuclease domain",
            "XBP1 mRNA splicing product",
            "Protein kinase RNA-like endoplasmic reticulum kinase",
            "Activating transcription factor 4",
            "C/EBP Homologous Protein",
            "Growth Arrest and DNA Damage-inducible protein 34",
            "Endoplasmic reticulum stress sensor 1",
            "Inositol-requiring enzyme 1",
            "Splice variant of XBP1",
            "Phosphorylated eIF2\u03b1",
            "MAP kinase cascade activation",
            "ER chaperone protein",
            "Transcription factor DDIT3"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "IRE1\u03b1 (ERFE)",
                "IRE1\u03b2 (ERFE2)",
                "XBP1 (XBP1s/u)",
                "BiP/GRP78 (HSPA5)",
                "PERK (EIF2AK3)",
                "ATF4 (CREB2)",
                "CHOP (DDIT3)",
                "GADD34 (PPP1R15A)",
                "eIF2\u03b1 (EIF2S1)",
                "JNK1 (MAPK8)",
                "JNK2 (MAPK9)",
                "IRE1 endonuclease domain",
                "XBP1 mRNA splicing product",
                "Protein kinase RNA-like endoplasmic reticulum kinase",
                "Activating transcription factor 4",
                "C/EBP Homologous Protein",
                "Growth Arrest and DNA Damage-inducible protein 34",
                "Endoplasmic reticulum stress sensor 1",
                "Inositol-requiring enzyme 1",
                "Splice variant of XBP1",
                "Phosphorylated eIF2\u03b1",
                "MAP kinase cascade activation",
                "ER chaperone protein",
                "Transcription factor DDIT3"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF4 (CREB2)",
                "Activating transcription factor 4",
                "BiP/GRP78 (HSPA5)",
                "C/EBP Homologous Protein",
                "CHOP (DDIT3)",
                "ER chaperone protein",
                "Endoplasmic reticulum stress sensor 1",
                "GADD34 (PPP1R15A)",
                "Growth Arrest and DNA Damage-inducible protein 34",
                "IRE1 endonuclease domain",
                "IRE1\u03b1 (ERFE)",
                "IRE1\u03b2 (ERFE2)",
                "Inositol-requiring enzyme 1",
                "JNK1 (MAPK8)",
                "JNK2 (MAPK9)",
                "MAP kinase cascade activation",
                "PERK (EIF2AK3)",
                "Phosphorylated eIF2\u03b1",
                "Protein kinase RNA-like endoplasmic reticulum kinase",
                "Splice variant of XBP1",
                "Transcription factor DDIT3",
                "XBP1 (XBP1s/u)",
                "XBP1 mRNA splicing product",
                "eIF2\u03b1 (EIF2S1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Inositol-requiring enzyme 1 (IRE1)",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "Activating transcription factor 6 (ATF6)",
            "X-box binding protein 1 (XBP1)",
            "C/EBP homologous protein (CHOP)",
            "Glucose-regulated protein 78 (GRP78/BiP)",
            "Glucose-regulated protein 94 (GRP94)",
            "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
            "Disulfide isomerase (PDI)",
            "Calreticulin",
            "Calnexin",
            "Heat shock protein 90 (HSP90)",
            "Heat shock protein 70 (HSP70)",
            "DNA damage-inducible transcript 3 protein (DDIT3)",
            "Heme-regulated inhibitor kinase (HRI)",
            "Heme oxygenase 1 (HO-1)",
            "Serine/threonine-protein phosphatase 1 regulatory subunit 15A (PPP1R15A/GADD34)",
            "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
            "Activating transcription factor 4 (ATF4)",
            "B-cell lymphoma 2-associated X protein (BAX)",
            "B-cell lymphoma 2 (BCL-2)",
            "Protein disulfide-isomerase A3 (PDIA3)",
            "Endoplasmic reticulum resident protein 44 (ERp44)",
            "Endoplasmic reticulum protein 57 (ERp57)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Activating transcription factor 6 (ATF6)",
                "X-box binding protein 1 (XBP1)",
                "C/EBP homologous protein (CHOP)",
                "Glucose-regulated protein 78 (GRP78/BiP)",
                "Glucose-regulated protein 94 (GRP94)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Disulfide isomerase (PDI)",
                "Calreticulin",
                "Calnexin",
                "Heat shock protein 90 (HSP90)",
                "Heat shock protein 70 (HSP70)",
                "DNA damage-inducible transcript 3 protein (DDIT3)",
                "Heme-regulated inhibitor kinase (HRI)",
                "Heme oxygenase 1 (HO-1)",
                "Serine/threonine-protein phosphatase 1 regulatory subunit 15A (PPP1R15A/GADD34)",
                "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
                "Activating transcription factor 4 (ATF4)",
                "B-cell lymphoma 2-associated X protein (BAX)",
                "B-cell lymphoma 2 (BCL-2)",
                "Protein disulfide-isomerase A3 (PDIA3)",
                "Endoplasmic reticulum resident protein 44 (ERp44)",
                "Endoplasmic reticulum protein 57 (ERp57)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6)",
                "B-cell lymphoma 2 (BCL-2)",
                "B-cell lymphoma 2-associated X protein (BAX)",
                "C/EBP homologous protein (CHOP)",
                "Calnexin",
                "Calreticulin",
                "DNA damage-inducible transcript 3 protein (DDIT3)",
                "Disulfide isomerase (PDI)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Endoplasmic reticulum protein 57 (ERp57)",
                "Endoplasmic reticulum resident protein 44 (ERp44)",
                "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
                "Glucose-regulated protein 78 (GRP78/BiP)",
                "Glucose-regulated protein 94 (GRP94)",
                "Heat shock protein 70 (HSP70)",
                "Heat shock protein 90 (HSP90)",
                "Heme oxygenase 1 (HO-1)",
                "Heme-regulated inhibitor kinase (HRI)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein disulfide-isomerase A3 (PDIA3)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Serine/threonine-protein phosphatase 1 regulatory subunit 15A (PPP1R15A/GADD34)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Glucose-regulated protein 78 (GRP78)",
            "Activating transcription factor 6 (ATF6)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "C/EBP homologous protein (CHOP)",
            "X-box binding protein 1 (XBP1)",
            "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
            "Calreticulin (CALR)",
            "BiP (Binding immunoglobulin protein)",
            "Sec63 protein (SEC63)",
            "Protein disulfide isomerase (PDI)",
            "Eukaryotic translation initiation factor 2 alpha (eIF2\u03b1)",
            "Spliced X-box binding protein 1 (sXBP1)",
            "C/EBP alpha (CEBPA)",
            "C/EBP beta (CEBPB)",
            "Farnesyltransferase (FTase)",
            "Heat shock protein 70 (HSP70)",
            "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-\u03baB)",
            "Protein kinase AMP-activated non-catalytic subunit gamma 3 (PRKAG3)",
            "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
            "Forkhead box O1 (FOXO1)",
            "Mitogen-activated protein kinase (MAPK)",
            "Caspase-12 (CASP12)",
            "Endoplasmic reticulum stress-induced apoptosis protein (ERAP)",
            "GADD153 protein (GADD153)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-regulated protein 78 (GRP78)",
                "Activating transcription factor 6 (ATF6)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "C/EBP homologous protein (CHOP)",
                "X-box binding protein 1 (XBP1)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Calreticulin (CALR)",
                "BiP (Binding immunoglobulin protein)",
                "Sec63 protein (SEC63)",
                "Protein disulfide isomerase (PDI)",
                "Eukaryotic translation initiation factor 2 alpha (eIF2\u03b1)",
                "Spliced X-box binding protein 1 (sXBP1)",
                "C/EBP alpha (CEBPA)",
                "C/EBP beta (CEBPB)",
                "Farnesyltransferase (FTase)",
                "Heat shock protein 70 (HSP70)",
                "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-\u03baB)",
                "Protein kinase AMP-activated non-catalytic subunit gamma 3 (PRKAG3)",
                "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
                "Forkhead box O1 (FOXO1)",
                "Mitogen-activated protein kinase (MAPK)",
                "Caspase-12 (CASP12)",
                "Endoplasmic reticulum stress-induced apoptosis protein (ERAP)"
            ],
            "mismatches": [
                "GADD153 protein (GADD153)"
            ],
            "true_referents": [
                "Activating transcription factor 6 (ATF6)",
                "BiP (Binding immunoglobulin protein)",
                "C/EBP alpha (CEBPA)",
                "C/EBP beta (CEBPB)",
                "C/EBP homologous protein (CHOP)",
                "Calreticulin (CALR)",
                "Caspase-12 (CASP12)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Endoplasmic reticulum stress-induced apoptosis protein (ERAP)",
                "Eukaryotic translation initiation factor 2 alpha (eIF2\u03b1)",
                "Farnesyltransferase (FTase)",
                "Forkhead box O1 (FOXO1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Heat shock protein 70 (HSP70)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Mitogen-activated protein kinase (MAPK)",
                "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
                "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-\u03baB)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase AMP-activated non-catalytic subunit gamma 3 (PRKAG3)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Sec63 protein (SEC63)",
                "Spliced X-box binding protein 1 (sXBP1)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating transcription factor 6 (ATF6)",
            "Inositol-requiring enzyme 1 alpha (IRE1\u03b1)",
            "Protein kinase RNA-like endoplasmic reticulum kinase (PERK)",
            "X-box binding protein 1 (XBP1)",
            "Growth arrest and DNA damage-inducible protein (GADD34)",
            "C/EBP homologous protein (CHOP)",
            "ATF4 (Activating Transcription Factor 4)",
            "BIP (Binding immunoglobulin protein)",
            "EDEM1 (ER degradation-enhancing alpha-mannosidase-like protein 1)",
            "Herpud1 (Homocysteine-inducible, endoplasmic reticulum stress-inducible, ubiquitin-like domain member 1)",
            "P58IPK (Protein kinase inhibitor P58)",
            "ATF3 (Activating transcription factor 3)",
            "ATF5 (Activating transcription factor 5)",
            "HSPA5 (Heat shock 70kDa protein 5)",
            "HSP90B1 (Heat shock protein 90kDa beta member 1)",
            "DNAJB9 (DnaJ homolog subfamily B member 9)",
            "SEC61B (Sec61 beta subunit)",
            "SEC63 (Sec63 homolog, protein translocation regulator)",
            "SEL1L (Sel-1 suppressor of lin-12-like)",
            "UBXD8 (Ubiquitin regulatory X domain-containing protein 8)",
            "PDI (Protein disulfide isomerase)",
            "ERdj3 (Endoplasmic reticulum DnaJ homolog 3)",
            "ERdj4 (Endoplasmic reticulum DnaJ homolog 4)",
            "ERdj5 (Endoplasmic reticulum DnaJ homolog 5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating transcription factor 6 (ATF6)",
                "Inositol-requiring enzyme 1 alpha (IRE1\u03b1)",
                "Protein kinase RNA-like endoplasmic reticulum kinase (PERK)",
                "X-box binding protein 1 (XBP1)",
                "Growth arrest and DNA damage-inducible protein (GADD34)",
                "C/EBP homologous protein (CHOP)",
                "ATF4 (Activating Transcription Factor 4)",
                "BIP (Binding immunoglobulin protein)",
                "EDEM1 (ER degradation-enhancing alpha-mannosidase-like protein 1)",
                "Herpud1 (Homocysteine-inducible, endoplasmic reticulum stress-inducible, ubiquitin-like domain member 1)",
                "P58IPK (Protein kinase inhibitor P58)",
                "ATF3 (Activating transcription factor 3)",
                "ATF5 (Activating transcription factor 5)",
                "HSPA5 (Heat shock 70kDa protein 5)",
                "HSP90B1 (Heat shock protein 90kDa beta member 1)",
                "DNAJB9 (DnaJ homolog subfamily B member 9)",
                "SEC61B (Sec61 beta subunit)",
                "SEC63 (Sec63 homolog, protein translocation regulator)",
                "SEL1L (Sel-1 suppressor of lin-12-like)",
                "UBXD8 (Ubiquitin regulatory X domain-containing protein 8)",
                "PDI (Protein disulfide isomerase)",
                "ERdj3 (Endoplasmic reticulum DnaJ homolog 3)",
                "ERdj4 (Endoplasmic reticulum DnaJ homolog 4)",
                "ERdj5 (Endoplasmic reticulum DnaJ homolog 5)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF3 (Activating transcription factor 3)",
                "ATF4 (Activating Transcription Factor 4)",
                "ATF5 (Activating transcription factor 5)",
                "Activating transcription factor 6 (ATF6)",
                "BIP (Binding immunoglobulin protein)",
                "C/EBP homologous protein (CHOP)",
                "DNAJB9 (DnaJ homolog subfamily B member 9)",
                "EDEM1 (ER degradation-enhancing alpha-mannosidase-like protein 1)",
                "ERdj3 (Endoplasmic reticulum DnaJ homolog 3)",
                "ERdj4 (Endoplasmic reticulum DnaJ homolog 4)",
                "ERdj5 (Endoplasmic reticulum DnaJ homolog 5)",
                "Growth arrest and DNA damage-inducible protein (GADD34)",
                "HSP90B1 (Heat shock protein 90kDa beta member 1)",
                "HSPA5 (Heat shock 70kDa protein 5)",
                "Herpud1 (Homocysteine-inducible, endoplasmic reticulum stress-inducible, ubiquitin-like domain member 1)",
                "Inositol-requiring enzyme 1 alpha (IRE1\u03b1)",
                "P58IPK (Protein kinase inhibitor P58)",
                "PDI (Protein disulfide isomerase)",
                "Protein kinase RNA-like endoplasmic reticulum kinase (PERK)",
                "SEC61B (Sec61 beta subunit)",
                "SEC63 (Sec63 homolog, protein translocation regulator)",
                "SEL1L (Sel-1 suppressor of lin-12-like)",
                "UBXD8 (Ubiquitin regulatory X domain-containing protein 8)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "ATF4 (activating transcription factor 4)",
            "ATF6 (activating transcription factor 6)",
            "XBP1 (X-box binding protein 1)",
            "IRE1 (inositol-requiring enzyme 1)",
            "PERK (protein kinase R-like endoplasmic reticulum kinase)",
            "CHOP (C/EBP homologous protein)",
            "BIP (binding immunoglobulin protein)",
            "GRP78 (glucose-regulated protein 78)",
            "HSP90 (heat shock protein 90)",
            "CALR (calreticulin)",
            "CRT (calreticulin)",
            "ERdj4 (endoplasmic reticulum DNA J domain-containing protein 4)",
            "XBP1s (spliced X-box binding protein 1)",
            "XBP1u (unspliced X-box binding protein 1)",
            "GADD34 (growth arrest and DNA damage-inducible protein 34)",
            "HERP (homocysteine-induced endoplasmic reticulum protein)",
            "P58IPK (protein kinase inhibitor of 58 kDa)",
            "ATF3 (activating transcription factor 3)",
            "DDIT3 (DNA damage-inducible transcript 3)",
            "GADD153 (growth arrest and DNA damage-inducible protein 153)",
            "ERN1 (endoplasmic reticulum to nucleus signaling 1)",
            "ERN2 (endoplasmic reticulum to nucleus signaling 2)",
            "HSPA5 (heat shock protein family A member 5)",
            "EIF2AK3 (eukaryotic translation initiation factor 2 alpha kinase 3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATF4 (activating transcription factor 4)",
                "ATF6 (activating transcription factor 6)",
                "XBP1 (X-box binding protein 1)",
                "IRE1 (inositol-requiring enzyme 1)",
                "PERK (protein kinase R-like endoplasmic reticulum kinase)",
                "CHOP (C/EBP homologous protein)",
                "BIP (binding immunoglobulin protein)",
                "GRP78 (glucose-regulated protein 78)",
                "HSP90 (heat shock protein 90)",
                "CALR (calreticulin)",
                "CRT (calreticulin)",
                "ERdj4 (endoplasmic reticulum DNA J domain-containing protein 4)",
                "XBP1s (spliced X-box binding protein 1)",
                "XBP1u (unspliced X-box binding protein 1)",
                "GADD34 (growth arrest and DNA damage-inducible protein 34)",
                "HERP (homocysteine-induced endoplasmic reticulum protein)",
                "P58IPK (protein kinase inhibitor of 58 kDa)",
                "ATF3 (activating transcription factor 3)",
                "DDIT3 (DNA damage-inducible transcript 3)",
                "GADD153 (growth arrest and DNA damage-inducible protein 153)",
                "ERN1 (endoplasmic reticulum to nucleus signaling 1)",
                "ERN2 (endoplasmic reticulum to nucleus signaling 2)",
                "HSPA5 (heat shock protein family A member 5)",
                "EIF2AK3 (eukaryotic translation initiation factor 2 alpha kinase 3)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF3 (activating transcription factor 3)",
                "ATF4 (activating transcription factor 4)",
                "ATF6 (activating transcription factor 6)",
                "BIP (binding immunoglobulin protein)",
                "CALR (calreticulin)",
                "CHOP (C/EBP homologous protein)",
                "CRT (calreticulin)",
                "DDIT3 (DNA damage-inducible transcript 3)",
                "EIF2AK3 (eukaryotic translation initiation factor 2 alpha kinase 3)",
                "ERN1 (endoplasmic reticulum to nucleus signaling 1)",
                "ERN2 (endoplasmic reticulum to nucleus signaling 2)",
                "ERdj4 (endoplasmic reticulum DNA J domain-containing protein 4)",
                "GADD153 (growth arrest and DNA damage-inducible protein 153)",
                "GADD34 (growth arrest and DNA damage-inducible protein 34)",
                "GRP78 (glucose-regulated protein 78)",
                "HERP (homocysteine-induced endoplasmic reticulum protein)",
                "HSP90 (heat shock protein 90)",
                "HSPA5 (heat shock protein family A member 5)",
                "IRE1 (inositol-requiring enzyme 1)",
                "P58IPK (protein kinase inhibitor of 58 kDa)",
                "PERK (protein kinase R-like endoplasmic reticulum kinase)",
                "XBP1 (X-box binding protein 1)",
                "XBP1s (spliced X-box binding protein 1)",
                "XBP1u (unspliced X-box binding protein 1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Binding Immunoglobulin Protein (BiP)",
            "Activating Transcription Factor 6 (ATF6)",
            "Inositol-Requiring Enzyme 1 (IRE1)",
            "Protein Kinase R-like ER Kinase (PERK)",
            "X-box Binding Protein 1 (XBP1)",
            "C/EBP Homologous Protein (CHOP)",
            "Eukaryotic Initiation Factor 2 Subunit Alpha (eIF2\u03b1)",
            "Activating Transcription Factor 4 (ATF4)",
            "Growth Arrest and DNA Damage-inducible Protein 34 (GADD34)",
            "Endoplasmic Reticulum Degradation Enhancing Alpha-Mannosidase-like Protein 1 (EDEM1)",
            "Suppressor/Enhancer Lin-12 Like (SEL1L)",
            "Homocysteine Inducible Endoplasmic Reticulum Stress-Responsive Protein (HERP)",
            "Immunophilin-containing P58 Protein (P58^IPK)",
            "Endoplasmic Reticulum DnaJ Domain-containing Protein 4 (ERdj4)",
            "Protein Disulfide Isomerase (PDI)",
            "Glucose-Regulated Protein 94 (GRP94)",
            "Nuclear Factor (Erythroid-derived 2)-like 2 (Nrf2)",
            "TNF Receptor Associated Factor 2 (TRAF2)",
            "Apoptosis Signal-Regulating Kinase 1 (ASK1)",
            "Old Astrocyte Specifically Induced Substance (OASIS)",
            "Calreticulin",
            "Glucose-Regulated Protein 170 (GRP170)",
            "Caspase-12",
            "X-box Binding Protein 2 (XBP2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Binding Immunoglobulin Protein (BiP)",
                "Activating Transcription Factor 6 (ATF6)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Protein Kinase R-like ER Kinase (PERK)",
                "X-box Binding Protein 1 (XBP1)",
                "C/EBP Homologous Protein (CHOP)",
                "Eukaryotic Initiation Factor 2 Subunit Alpha (eIF2\u03b1)",
                "Activating Transcription Factor 4 (ATF4)",
                "Growth Arrest and DNA Damage-inducible Protein 34 (GADD34)",
                "Endoplasmic Reticulum Degradation Enhancing Alpha-Mannosidase-like Protein 1 (EDEM1)",
                "Suppressor/Enhancer Lin-12 Like (SEL1L)",
                "Homocysteine Inducible Endoplasmic Reticulum Stress-Responsive Protein (HERP)",
                "Immunophilin-containing P58 Protein (P58^IPK)",
                "Endoplasmic Reticulum DnaJ Domain-containing Protein 4 (ERdj4)",
                "Protein Disulfide Isomerase (PDI)",
                "Glucose-Regulated Protein 94 (GRP94)",
                "Nuclear Factor (Erythroid-derived 2)-like 2 (Nrf2)",
                "TNF Receptor Associated Factor 2 (TRAF2)",
                "Apoptosis Signal-Regulating Kinase 1 (ASK1)",
                "Old Astrocyte Specifically Induced Substance (OASIS)",
                "Calreticulin",
                "Glucose-Regulated Protein 170 (GRP170)",
                "Caspase-12",
                "X-box Binding Protein 2 (XBP2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating Transcription Factor 4 (ATF4)",
                "Activating Transcription Factor 6 (ATF6)",
                "Apoptosis Signal-Regulating Kinase 1 (ASK1)",
                "Binding Immunoglobulin Protein (BiP)",
                "C/EBP Homologous Protein (CHOP)",
                "Calreticulin",
                "Caspase-12",
                "Endoplasmic Reticulum Degradation Enhancing Alpha-Mannosidase-like Protein 1 (EDEM1)",
                "Endoplasmic Reticulum DnaJ Domain-containing Protein 4 (ERdj4)",
                "Eukaryotic Initiation Factor 2 Subunit Alpha (eIF2\u03b1)",
                "Glucose-Regulated Protein 170 (GRP170)",
                "Glucose-Regulated Protein 94 (GRP94)",
                "Growth Arrest and DNA Damage-inducible Protein 34 (GADD34)",
                "Homocysteine Inducible Endoplasmic Reticulum Stress-Responsive Protein (HERP)",
                "Immunophilin-containing P58 Protein (P58^IPK)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Nuclear Factor (Erythroid-derived 2)-like 2 (Nrf2)",
                "Old Astrocyte Specifically Induced Substance (OASIS)",
                "Protein Disulfide Isomerase (PDI)",
                "Protein Kinase R-like ER Kinase (PERK)",
                "Suppressor/Enhancer Lin-12 Like (SEL1L)",
                "TNF Receptor Associated Factor 2 (TRAF2)",
                "X-box Binding Protein 1 (XBP1)",
                "X-box Binding Protein 2 (XBP2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Inositol-requiring enzyme 1 (IRE1)",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "Activating transcription factor 6 (ATF6)",
            "X-box binding protein 1 (XBP1)",
            "Binding immunoglobulin protein (BiP/GRP78)",
            "C/EBP homologous protein (CHOP)",
            "Eukaryotic initiation factor 2 alpha (eIF2\u03b1)",
            "Activating transcription factor 4 (ATF4)",
            "Growth arrest and DNA damage-inducible protein (GADD34)",
            "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "Protein disulfide isomerase (PDI)",
            "78 kDa glucose-regulated protein (GRP78)",
            "94 kDa glucose-regulated protein (GRP94)",
            "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
            "Homocysteine-induced endoplasmic reticulum protein (HERP)",
            "Synoviolin (HRD1)",
            "Nuclear factor erythroid 2-related factor 2 (NRF2)",
            "Tribbles homolog 3 (TRB3)",
            "ER-localized DnaJ 4 (ERdj4)",
            "Protein kinase inhibitor of 58 kDa (P58IPK)",
            "Wolframin (WFS1)",
            "Derlin-1",
            "ER lipid raft-associated 1 (ERLIN1)",
            "ER lipid raft-associated 2 (ERLIN2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Activating transcription factor 6 (ATF6)",
                "X-box binding protein 1 (XBP1)",
                "Binding immunoglobulin protein (BiP/GRP78)",
                "C/EBP homologous protein (CHOP)",
                "Eukaryotic initiation factor 2 alpha (eIF2\u03b1)",
                "Activating transcription factor 4 (ATF4)",
                "Growth arrest and DNA damage-inducible protein (GADD34)",
                "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Protein disulfide isomerase (PDI)",
                "78 kDa glucose-regulated protein (GRP78)",
                "94 kDa glucose-regulated protein (GRP94)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Homocysteine-induced endoplasmic reticulum protein (HERP)",
                "Synoviolin (HRD1)",
                "Nuclear factor erythroid 2-related factor 2 (NRF2)",
                "Tribbles homolog 3 (TRB3)",
                "ER-localized DnaJ 4 (ERdj4)",
                "Protein kinase inhibitor of 58 kDa (P58IPK)",
                "Wolframin (WFS1)",
                "Derlin-1",
                "ER lipid raft-associated 1 (ERLIN1)",
                "ER lipid raft-associated 2 (ERLIN2)"
            ],
            "mismatches": [],
            "true_referents": [
                "78 kDa glucose-regulated protein (GRP78)",
                "94 kDa glucose-regulated protein (GRP94)",
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6)",
                "Binding immunoglobulin protein (BiP/GRP78)",
                "C/EBP homologous protein (CHOP)",
                "Derlin-1",
                "ER degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "ER lipid raft-associated 1 (ERLIN1)",
                "ER lipid raft-associated 2 (ERLIN2)",
                "ER-localized DnaJ 4 (ERdj4)",
                "Endoplasmic reticulum oxidoreductin 1 (ERO1)",
                "Eukaryotic initiation factor 2 alpha (eIF2\u03b1)",
                "Growth arrest and DNA damage-inducible protein (GADD34)",
                "Homocysteine-induced endoplasmic reticulum protein (HERP)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Nuclear factor erythroid 2-related factor 2 (NRF2)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Protein kinase inhibitor of 58 kDa (P58IPK)",
                "Synoviolin (HRD1)",
                "Tribbles homolog 3 (TRB3)",
                "Wolframin (WFS1)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating transcription factor 6 (ATF6)",
            "Activating transcription factor 4 (ATF4)",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Endoplasmic reticulum to nucleus signaling 1 (ERN1)",
            "X-box binding protein 1 (XBP1)",
            "DNA damage-inducible transcript 3 (DDIT3)",
            "C/EBP homologous protein (CHOP)",
            "ER degradation enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "ER lectin 1 (ERLEC1)",
            "Homocysteine-responsive endoplasmic reticulum-resident ubiquitin-like domain member 1 protein (HERPUD1)",
            "Heat shock protein family A (Hsp70) member 5 (HSPA5)",
            "78 kDa glucose-regulated protein (GRP78)",
            "Protein disulfide isomerase family A member 4 (PDIA4)",
            "ER protein 72 (ERP72)",
            "DnaJ heat shock protein family (Hsp40) member B9 (DNAJB9)",
            "ER DnaJ homolog 4 (ERdj4)",
            "Asparagine synthetase (glutamine-hydrolyzing) (ASNS)",
            "Growth arrest and DNA damage-inducible protein (GADD34)",
            "Protein phosphatase 1 regulatory subunit 15A (PPP1R15A)",
            "Sestrin 2 (SESN2)",
            "Cyclic AMP-dependent transcription factor ATF-5 (ATF5)",
            "Old astrocyte specifically induced substance (OASIS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating transcription factor 6 (ATF6)",
                "Activating transcription factor 4 (ATF4)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Endoplasmic reticulum to nucleus signaling 1 (ERN1)",
                "X-box binding protein 1 (XBP1)",
                "DNA damage-inducible transcript 3 (DDIT3)",
                "C/EBP homologous protein (CHOP)",
                "ER degradation enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "ER lectin 1 (ERLEC1)",
                "Homocysteine-responsive endoplasmic reticulum-resident ubiquitin-like domain member 1 protein (HERPUD1)",
                "Heat shock protein family A (Hsp70) member 5 (HSPA5)",
                "78 kDa glucose-regulated protein (GRP78)",
                "Protein disulfide isomerase family A member 4 (PDIA4)",
                "ER protein 72 (ERP72)",
                "DnaJ heat shock protein family (Hsp40) member B9 (DNAJB9)",
                "ER DnaJ homolog 4 (ERdj4)",
                "Asparagine synthetase (glutamine-hydrolyzing) (ASNS)",
                "Growth arrest and DNA damage-inducible protein (GADD34)",
                "Protein phosphatase 1 regulatory subunit 15A (PPP1R15A)",
                "Sestrin 2 (SESN2)",
                "Cyclic AMP-dependent transcription factor ATF-5 (ATF5)",
                "Old astrocyte specifically induced substance (OASIS)"
            ],
            "mismatches": [],
            "true_referents": [
                "78 kDa glucose-regulated protein (GRP78)",
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6)",
                "Asparagine synthetase (glutamine-hydrolyzing) (ASNS)",
                "C/EBP homologous protein (CHOP)",
                "Cyclic AMP-dependent transcription factor ATF-5 (ATF5)",
                "DNA damage-inducible transcript 3 (DDIT3)",
                "DnaJ heat shock protein family (Hsp40) member B9 (DNAJB9)",
                "ER DnaJ homolog 4 (ERdj4)",
                "ER degradation enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "ER lectin 1 (ERLEC1)",
                "ER protein 72 (ERP72)",
                "Endoplasmic reticulum to nucleus signaling 1 (ERN1)",
                "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
                "Growth arrest and DNA damage-inducible protein (GADD34)",
                "Heat shock protein family A (Hsp70) member 5 (HSPA5)",
                "Homocysteine-responsive endoplasmic reticulum-resident ubiquitin-like domain member 1 protein (HERPUD1)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Old astrocyte specifically induced substance (OASIS)",
                "Protein disulfide isomerase family A member 4 (PDIA4)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Protein phosphatase 1 regulatory subunit 15A (PPP1R15A)",
                "Sestrin 2 (SESN2)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Inositol-requiring enzyme 1 (IRE1)",
            "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
            "Activating transcription factor 6 (ATF6)",
            "X-box binding protein 1 (XBP1)",
            "Glucose-regulated protein 78 (GRP78)",
            "Glucose-regulated protein 94 (GRP94)",
            "Endoplasmic reticulum oxidoreductase 1 alpha (ERO1\u03b1)",
            "Protein disulfide isomerase (PDI)",
            "Calreticulin (CALR)",
            "Calnexin (CANX)",
            "Activating transcription factor 4 (ATF4)",
            "C/EBP homologous protein (CHOP)",
            "Spliced X-box binding protein 1 (XBP1s)",
            "Unspliced X-box binding protein 1 (XBP1u)",
            "Eukaryotic translation initiation factor 2 alpha (eIF2\u03b1)",
            "Endoplasmic reticulum-associated degradation (ERAD)",
            "Synoviolin (SYVN1)",
            "Endoplasmic reticulum mannosidase I (ERManI)",
            "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
            "Homocysteine-induced endoplasmic reticulum protein (HERP)",
            "Endoplasmic reticulum stress-associated RNA (ER-SAR)",
            "Endoplasmic reticulum stress sensor/transducer (ERSE)",
            "Endoplasmic reticulum stress response element (ERSE)",
            "Endoplasmic reticulum stress response element-binding protein (ERSEP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Activating transcription factor 6 (ATF6)",
                "X-box binding protein 1 (XBP1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Endoplasmic reticulum oxidoreductase 1 alpha (ERO1\u03b1)",
                "Protein disulfide isomerase (PDI)",
                "Calreticulin (CALR)",
                "Calnexin (CANX)",
                "Activating transcription factor 4 (ATF4)",
                "C/EBP homologous protein (CHOP)",
                "Spliced X-box binding protein 1 (XBP1s)",
                "Unspliced X-box binding protein 1 (XBP1u)",
                "Eukaryotic translation initiation factor 2 alpha (eIF2\u03b1)",
                "Endoplasmic reticulum-associated degradation (ERAD)",
                "Synoviolin (SYVN1)",
                "Endoplasmic reticulum mannosidase I (ERManI)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Homocysteine-induced endoplasmic reticulum protein (HERP)"
            ],
            "mismatches": [
                "Endoplasmic reticulum stress-associated RNA (ER-SAR)",
                "Endoplasmic reticulum stress sensor/transducer (ERSE)",
                "Endoplasmic reticulum stress response element (ERSE)",
                "Endoplasmic reticulum stress response element-binding protein (ERSEP)"
            ],
            "true_referents": [
                "Activating transcription factor 4 (ATF4)",
                "Activating transcription factor 6 (ATF6)",
                "C/EBP homologous protein (CHOP)",
                "Calnexin (CANX)",
                "Calreticulin (CALR)",
                "Endoplasmic reticulum degradation-enhancing alpha-mannosidase-like protein 1 (EDEM1)",
                "Endoplasmic reticulum mannosidase I (ERManI)",
                "Endoplasmic reticulum oxidoreductase 1 alpha (ERO1\u03b1)",
                "Endoplasmic reticulum stress response element (ERSE)",
                "Endoplasmic reticulum stress response element-binding protein (ERSEP)",
                "Endoplasmic reticulum stress sensor/transducer (ERSE)",
                "Endoplasmic reticulum stress-associated RNA (ER-SAR)",
                "Endoplasmic reticulum-associated degradation (ERAD)",
                "Eukaryotic translation initiation factor 2 alpha (eIF2\u03b1)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Homocysteine-induced endoplasmic reticulum protein (HERP)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Protein disulfide isomerase (PDI)",
                "Protein kinase R-like endoplasmic reticulum kinase (PERK)",
                "Spliced X-box binding protein 1 (XBP1s)",
                "Synoviolin (SYVN1)",
                "Unspliced X-box binding protein 1 (XBP1u)",
                "X-box binding protein 1 (XBP1)"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating Transcription Factor 6 (ATF6)",
            "Endoplasmic Reticulum to Nucleus Signaling 1 (ERN1)",
            "Endoplasmic Reticulum Stress Sensor 1 (ERSS1)",
            "Eukaryotic Translation Initiation Factor 2 Alpha Kinase 3 (EIF2AK3)",
            "Glucose Regulated Protein 78 (GRP78)",
            "Heat Shock Protein Family A (Hsp70) Member 5 (HSPA5)",
            "Inositol-Requiring Enzyme 1 (IRE1)",
            "Mitogen-Activated Protein Kinase 8 (MAPK8)",
            "Protein Kinase R-Like Endoplasmic Reticulum Kinase (PERK)",
            "Spliced X-Box Binding Protein 1 (XBP1s)",
            "Activating Transcription Factor 4 (ATF4)",
            "Calreticulin (CALR)",
            "Calnexin (CANX)",
            "Endoplasmic Reticulum Oxidoreductin 1 (ERO1)",
            "Endoplasmic Reticulum Stress Response Element (ERSE)",
            "Endoplasmic Reticulum to Nucleus Signaling 2 (ERN2)",
            "Endoplasmic Reticulum Stress Sensor 2 (ERSS2)",
            "Eukaryotic Translation Initiation Factor 2 Alpha Kinase 4 (EIF2AK4)",
            "Heat Shock Protein Family A (Hsp70) Member 13 (HSPA13)",
            "Inositol-Requiring Enzyme 2 (IRE2)",
            "Mitogen-Activated Protein Kinase 9 (MAPK9)",
            "Protein Disulfide Isomerase Family A Member 3 (PDIA3)",
            "Protein Disulfide Isomerase Family A Member 4 (PDIA4)",
            "X-Box Binding Protein 1 (XBP1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating Transcription Factor 6 (ATF6)",
                "Endoplasmic Reticulum to Nucleus Signaling 1 (ERN1)",
                "Endoplasmic Reticulum Stress Sensor 1 (ERSS1)",
                "Eukaryotic Translation Initiation Factor 2 Alpha Kinase 3 (EIF2AK3)",
                "Glucose Regulated Protein 78 (GRP78)",
                "Heat Shock Protein Family A (Hsp70) Member 5 (HSPA5)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Mitogen-Activated Protein Kinase 8 (MAPK8)",
                "Protein Kinase R-Like Endoplasmic Reticulum Kinase (PERK)",
                "Spliced X-Box Binding Protein 1 (XBP1s)",
                "Activating Transcription Factor 4 (ATF4)",
                "Calreticulin (CALR)",
                "Calnexin (CANX)",
                "Endoplasmic Reticulum Oxidoreductin 1 (ERO1)",
                "Endoplasmic Reticulum Stress Response Element (ERSE)",
                "Endoplasmic Reticulum to Nucleus Signaling 2 (ERN2)",
                "Endoplasmic Reticulum Stress Sensor 2 (ERSS2)",
                "Eukaryotic Translation Initiation Factor 2 Alpha Kinase 4 (EIF2AK4)",
                "Heat Shock Protein Family A (Hsp70) Member 13 (HSPA13)",
                "Inositol-Requiring Enzyme 2 (IRE2)",
                "Mitogen-Activated Protein Kinase 9 (MAPK9)",
                "Protein Disulfide Isomerase Family A Member 3 (PDIA3)",
                "Protein Disulfide Isomerase Family A Member 4 (PDIA4)",
                "X-Box Binding Protein 1 (XBP1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating Transcription Factor 4 (ATF4)",
                "Activating Transcription Factor 6 (ATF6)",
                "Calnexin (CANX)",
                "Calreticulin (CALR)",
                "Endoplasmic Reticulum Oxidoreductin 1 (ERO1)",
                "Endoplasmic Reticulum Stress Response Element (ERSE)",
                "Endoplasmic Reticulum Stress Sensor 1 (ERSS1)",
                "Endoplasmic Reticulum Stress Sensor 2 (ERSS2)",
                "Endoplasmic Reticulum to Nucleus Signaling 1 (ERN1)",
                "Endoplasmic Reticulum to Nucleus Signaling 2 (ERN2)",
                "Eukaryotic Translation Initiation Factor 2 Alpha Kinase 3 (EIF2AK3)",
                "Eukaryotic Translation Initiation Factor 2 Alpha Kinase 4 (EIF2AK4)",
                "Glucose Regulated Protein 78 (GRP78)",
                "Heat Shock Protein Family A (Hsp70) Member 13 (HSPA13)",
                "Heat Shock Protein Family A (Hsp70) Member 5 (HSPA5)",
                "Inositol-Requiring Enzyme 1 (IRE1)",
                "Inositol-Requiring Enzyme 2 (IRE2)",
                "Mitogen-Activated Protein Kinase 8 (MAPK8)",
                "Mitogen-Activated Protein Kinase 9 (MAPK9)",
                "Protein Disulfide Isomerase Family A Member 3 (PDIA3)",
                "Protein Disulfide Isomerase Family A Member 4 (PDIA4)",
                "Protein Kinase R-Like Endoplasmic Reticulum Kinase (PERK)",
                "Spliced X-Box Binding Protein 1 (XBP1s)",
                "X-Box Binding Protein 1 (XBP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "ATF4 (Activating Transcription Factor 4)",
            "ATF6 (Activating Transcription Factor 6)",
            "BiP (Binding Immunoglobulin Protein)",
            "CHOP (C/EBP Homologous Protein)",
            "DDIT3 (DNA-Damage-Inducible Transcript 3)",
            "ERdj4 (Endoplasmic Reticulum DnaJ Homolog 4)",
            "ERp29 (Endoplasmic Reticulum Protein 29)",
            "GRP78 (Glucose-Regulated Protein 78)",
            "HSPA5 (Heat Shock Protein Family A Member 5)",
            "IRE1 (Inositol-Requiring Enzyme 1)",
            "PERK (PKR-Like Endoplasmic Reticulum Kinase)",
            "PKR (Protein Kinase R)",
            "PPP1R15A (Protein Phosphatase 1 Regulatory Subunit 15A)",
            "PPP1R15B (Protein Phosphatase 1 Regulatory Subunit 15B)",
            "SEC62 (Sec62 Vesicle Trafficking Protein)",
            "SEC63 (Sec63 Vesicle Trafficking Protein)",
            "SEL1L (Sel1-Like Protein)",
            "SPOTs (Superoxide Dismutase and Peroxiredoxin-like Protein)",
            "TRAP1 (Tumor Rejection Antigen 1)",
            "TRAP2 (Tumor Rejection Antigen 2)",
            "UGP2 (UDP-Glucose Pyrophosphorylase 2)",
            "XBP1 (X-Box Binding Protein 1)",
            "XBP1s (Spliced X-Box Binding Protein 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATF4 (Activating Transcription Factor 4)",
                "ATF6 (Activating Transcription Factor 6)",
                "BiP (Binding Immunoglobulin Protein)",
                "CHOP (C/EBP Homologous Protein)",
                "DDIT3 (DNA-Damage-Inducible Transcript 3)",
                "ERdj4 (Endoplasmic Reticulum DnaJ Homolog 4)",
                "ERp29 (Endoplasmic Reticulum Protein 29)",
                "GRP78 (Glucose-Regulated Protein 78)",
                "HSPA5 (Heat Shock Protein Family A Member 5)",
                "IRE1 (Inositol-Requiring Enzyme 1)",
                "PERK (PKR-Like Endoplasmic Reticulum Kinase)",
                "PKR (Protein Kinase R)",
                "PPP1R15A (Protein Phosphatase 1 Regulatory Subunit 15A)",
                "PPP1R15B (Protein Phosphatase 1 Regulatory Subunit 15B)",
                "SEC62 (Sec62 Vesicle Trafficking Protein)",
                "SEC63 (Sec63 Vesicle Trafficking Protein)",
                "SEL1L (Sel1-Like Protein)",
                "SPOTs (Superoxide Dismutase and Peroxiredoxin-like Protein)",
                "TRAP1 (Tumor Rejection Antigen 1)",
                "TRAP2 (Tumor Rejection Antigen 2)",
                "UGP2 (UDP-Glucose Pyrophosphorylase 2)",
                "XBP1 (X-Box Binding Protein 1)",
                "XBP1s (Spliced X-Box Binding Protein 1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATF4 (Activating Transcription Factor 4)",
                "ATF6 (Activating Transcription Factor 6)",
                "BiP (Binding Immunoglobulin Protein)",
                "CHOP (C/EBP Homologous Protein)",
                "DDIT3 (DNA-Damage-Inducible Transcript 3)",
                "ERdj4 (Endoplasmic Reticulum DnaJ Homolog 4)",
                "ERp29 (Endoplasmic Reticulum Protein 29)",
                "GRP78 (Glucose-Regulated Protein 78)",
                "HSPA5 (Heat Shock Protein Family A Member 5)",
                "IRE1 (Inositol-Requiring Enzyme 1)",
                "PERK (PKR-Like Endoplasmic Reticulum Kinase)",
                "PKR (Protein Kinase R)",
                "PPP1R15A (Protein Phosphatase 1 Regulatory Subunit 15A)",
                "PPP1R15B (Protein Phosphatase 1 Regulatory Subunit 15B)",
                "SEC62 (Sec62 Vesicle Trafficking Protein)",
                "SEC63 (Sec63 Vesicle Trafficking Protein)",
                "SEL1L (Sel1-Like Protein)",
                "SPOTs (Superoxide Dismutase and Peroxiredoxin-like Protein)",
                "TRAP1 (Tumor Rejection Antigen 1)",
                "TRAP2 (Tumor Rejection Antigen 2)",
                "UGP2 (UDP-Glucose Pyrophosphorylase 2)",
                "XBP1 (X-Box Binding Protein 1)",
                "XBP1s (Spliced X-Box Binding Protein 1)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            "Activating transcription factor 6 (ATF6)",
            "Alpha-subunit of eukaryotic translation initiation factor 2 (eIF2\u03b1)",
            "Binding immunoglobulin protein (BiP)",
            "CCAAT/enhancer-binding protein (C/EBP) homologous protein (CHOP)",
            "Deoxyribonucleic acid (DNA) damage-inducible protein 3 (GADD153)",
            "Endoplasmic reticulum-resident protein 44 (ERP44)",
            "Endoplasmic reticulum-resident protein 46 (ERP46)",
            "Endoplasmic reticulum-resident protein 72 (ERP72)",
            "Glucose-regulated protein 78 (GRP78)",
            "Glucose-regulated protein 94 (GRP94)",
            "Human immunoglobulin heavy chain-binding protein (BiP)",
            "Inositol-requiring enzyme 1 (IRE1)",
            "Inositol-requiring enzyme 1 alpha (IRE1\u03b1)",
            "PKR-like ER kinase (PERK)",
            "Protein kinase RNA-activated (PKR)",
            "Protein phosphatase 2A (PP2A)",
            "Spliced X-box binding protein 1 (sXBP1)",
            "Unfolded protein response element-binding protein 1 (UPREBP1)",
            "X-box binding protein 1 (XBP1)",
            "X-box binding protein 1s (XBP1s)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Activating transcription factor 6 (ATF6)",
                "Alpha-subunit of eukaryotic translation initiation factor 2 (eIF2\u03b1)",
                "Binding immunoglobulin protein (BiP)",
                "CCAAT/enhancer-binding protein (C/EBP) homologous protein (CHOP)",
                "Deoxyribonucleic acid (DNA) damage-inducible protein 3 (GADD153)",
                "Endoplasmic reticulum-resident protein 44 (ERP44)",
                "Endoplasmic reticulum-resident protein 46 (ERP46)",
                "Endoplasmic reticulum-resident protein 72 (ERP72)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Human immunoglobulin heavy chain-binding protein (BiP)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Inositol-requiring enzyme 1 alpha (IRE1\u03b1)",
                "PKR-like ER kinase (PERK)",
                "Protein kinase RNA-activated (PKR)",
                "Protein phosphatase 2A (PP2A)",
                "Spliced X-box binding protein 1 (sXBP1)",
                "Unfolded protein response element-binding protein 1 (UPREBP1)",
                "X-box binding protein 1 (XBP1)",
                "X-box binding protein 1s (XBP1s)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activating transcription factor 6 (ATF6)",
                "Alpha-subunit of eukaryotic translation initiation factor 2 (eIF2\u03b1)",
                "Binding immunoglobulin protein (BiP)",
                "CCAAT/enhancer-binding protein (C/EBP) homologous protein (CHOP)",
                "Deoxyribonucleic acid (DNA) damage-inducible protein 3 (GADD153)",
                "Endoplasmic reticulum-resident protein 44 (ERP44)",
                "Endoplasmic reticulum-resident protein 46 (ERP46)",
                "Endoplasmic reticulum-resident protein 72 (ERP72)",
                "Glucose-regulated protein 78 (GRP78)",
                "Glucose-regulated protein 94 (GRP94)",
                "Human immunoglobulin heavy chain-binding protein (BiP)",
                "Inositol-requiring enzyme 1 (IRE1)",
                "Inositol-requiring enzyme 1 alpha (IRE1\u03b1)",
                "PKR-like ER kinase (PERK)",
                "Protein kinase RNA-activated (PKR)",
                "Protein phosphatase 2A (PP2A)",
                "Spliced X-box binding protein 1 (sXBP1)",
                "Unfolded protein response element-binding protein 1 (UPREBP1)",
                "X-box binding protein 1 (XBP1)",
                "X-box binding protein 1s (XBP1s)"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "unfolded protein response protein",
        "domain": "biology",
        "response": [
            {
                "Referent": "ATF4",
                "Canonical name": "(ATF4)"
            },
            {
                "Referent": "ATF6",
                "Canonical name": "(ATF6)"
            },
            {
                "Referent": "CHOP",
                "Canonical name": "(CHOP)"
            },
            {
                "Referent": "DDIT3",
                "Canonical name": "(DDIT3)"
            },
            {
                "Referent": "EIF2AK3",
                "Canonical name": "(EIF2AK3)"
            },
            {
                "Referent": "GADD34",
                "Canonical name": "(GADD34)"
            },
            {
                "Referent": "HSPA5",
                "Canonical name": "(HSPA5)"
            },
            {
                "Referent": "HSF1",
                "Canonical name": "(HSF1)"
            },
            {
                "Referent": "HSF2",
                "Canonical name": "(HSF2)"
            },
            {
                "Referent": "HSF4",
                "Canonical name": "(HSF4)"
            },
            {
                "Referent": "HSF5",
                "Canonical name": "(HSF5)"
            },
            {
                "Referent": "IRE1",
                "Canonical name": "(IRE1)"
            },
            {
                "Referent": "PERK",
                "Canonical name": "(PERK)"
            },
            {
                "Referent": "SESN2",
                "Canonical name": "(SESN2)"
            },
            {
                "Referent": "XBP1",
                "Canonical name": "(XBP1)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATF4",
                "ATF6",
                "CHOP",
                "DDIT3",
                "EIF2AK3",
                "GADD34",
                "HSPA5",
                "HSF1",
                "HSF2",
                "HSF4",
                "HSF5",
                "IRE1",
                "PERK",
                "SESN2",
                "XBP1"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"ATF4\", \"Canonical name\": \"(ATF4)\"}",
                "{\"Referent\": \"ATF6\", \"Canonical name\": \"(ATF6)\"}",
                "{\"Referent\": \"CHOP\", \"Canonical name\": \"(CHOP)\"}",
                "{\"Referent\": \"DDIT3\", \"Canonical name\": \"(DDIT3)\"}",
                "{\"Referent\": \"EIF2AK3\", \"Canonical name\": \"(EIF2AK3)\"}",
                "{\"Referent\": \"GADD34\", \"Canonical name\": \"(GADD34)\"}",
                "{\"Referent\": \"HSF1\", \"Canonical name\": \"(HSF1)\"}",
                "{\"Referent\": \"HSF2\", \"Canonical name\": \"(HSF2)\"}",
                "{\"Referent\": \"HSF4\", \"Canonical name\": \"(HSF4)\"}",
                "{\"Referent\": \"HSF5\", \"Canonical name\": \"(HSF5)\"}",
                "{\"Referent\": \"HSPA5\", \"Canonical name\": \"(HSPA5)\"}",
                "{\"Referent\": \"IRE1\", \"Canonical name\": \"(IRE1)\"}",
                "{\"Referent\": \"PERK\", \"Canonical name\": \"(PERK)\"}",
                "{\"Referent\": \"SESN2\", \"Canonical name\": \"(SESN2)\"}",
                "{\"Referent\": \"XBP1\", \"Canonical name\": \"(XBP1)\"}"
            ],
            "TP": 15,
            "FP": 0,
            "FN": 0
        }
    }
]