[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Catalase (CAT)",
            "Superoxide Dismutase 1 (SOD1)",
            "Superoxide Dismutase 2 (SOD2)",
            "Superoxide Dismutase 3 (SOD3)",
            "Glutathione Peroxidase 1 (GPX1)",
            "Glutathione Peroxidase 4 (GPX4)",
            "Glutathione Reductase (GSR)",
            "Thioredoxin 1 (TXN)",
            "Thioredoxin Reductase 1 (TXNRD1)",
            "Heme Oxygenase 1 (HMOX1)",
            "NAD(P)H Dehydrogenase Quinone 1 (NQO1)",
            "Alpha-1-Antitrypsin (A1AT)",
            "Alpha-1-Microglobulin (A1M)",
            "Paraoxonase 1 (PON1)",
            "Cystatin C (CST3)",
            "Metallothionein 1 (MT1)",
            "Metallothionein 2 (MT2)",
            "Selenoprotein P (SEPP1)",
            "Selenoprotein W (SEPW1)",
            "Peroxiredoxin 1 (PRDX1)",
            "Peroxiredoxin 2 (PRDX2)",
            "Peroxiredoxin 3 (PRDX3)",
            "Peroxiredoxin 6 (PRDX6)",
            "Urate Oxidase (UOX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Superoxide Dismutase 1 (SOD1)",
                "Superoxide Dismutase 2 (SOD2)",
                "Superoxide Dismutase 3 (SOD3)",
                "Glutathione Peroxidase 1 (GPX1)",
                "Glutathione Peroxidase 4 (GPX4)",
                "Glutathione Reductase (GSR)",
                "Thioredoxin Reductase 1 (TXNRD1)",
                "NAD(P)H Dehydrogenase Quinone 1 (NQO1)",
                "Peroxiredoxin 1 (PRDX1)",
                "Peroxiredoxin 2 (PRDX2)",
                "Peroxiredoxin 3 (PRDX3)",
                "Peroxiredoxin 6 (PRDX6)"
            ],
            "mismatches": [
                "Thioredoxin 1 (TXN)",
                "Heme Oxygenase 1 (HMOX1)",
                "Alpha-1-Antitrypsin (A1AT)",
                "Alpha-1-Microglobulin (A1M)",
                "Paraoxonase 1 (PON1)",
                "Cystatin C (CST3)",
                "Metallothionein 1 (MT1)",
                "Metallothionein 2 (MT2)",
                "Selenoprotein P (SEPP1)",
                "Selenoprotein W (SEPW1)",
                "Urate Oxidase (UOX)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "catalase (Cat)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "hemoglobin X, alpha-like embryonic chain in Hba complex (Hba-x)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "microsomal glutathione S-transferase 1 (Mgst1)",
                "microsomal glutathione S-transferase 2 (Mgst2)",
                "microsomal glutathione S-transferase 3 (Mgst3)",
                "myeloperoxidase (Mpo)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "peroxiredoxin like 2A (Prxl2a)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Glutathione Reductase (GR)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Glutaredoxin (Grx)",
            "Glutathione S-Transferase (GST)",
            "NAD(P)H Quinone Oxidoreductase 1 (NQO1)",
            "Heme Oxygenase-1 (HO-1)",
            "Cytochrome P450 Reductase (CPR)",
            "Manganese Superoxide Dismutase (MnSOD)",
            "Cu/Zn Superoxide Dismutase (Cu/ZnSOD)",
            "Extracellular Superoxide Dismutase (EC-SOD)",
            "Protein Thioredoxin (Trx1)",
            "Thioredoxin Reductase (TrxR)",
            "Glutathione (GSH)",
            "Vitamin C (Ascorbate)",
            "Vitamin E (Tocopherol)",
            "Uric Acid",
            "Alpha-Lipoic Acid",
            "Coenzyme Q10 (Ubiquinone)",
            "Melatonin",
            "Ferredoxin",
            "Ferritin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione Reductase (GR)",
                "Extracellular Superoxide Dismutase (EC-SOD)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Glutaredoxin (Grx)",
                "Glutathione S-Transferase (GST)",
                "NAD(P)H Quinone Oxidoreductase 1 (NQO1)",
                "Heme Oxygenase-1 (HO-1)",
                "Cytochrome P450 Reductase (CPR)",
                "Manganese Superoxide Dismutase (MnSOD)",
                "Cu/Zn Superoxide Dismutase (Cu/ZnSOD)",
                "Protein Thioredoxin (Trx1)",
                "Thioredoxin Reductase (TrxR)",
                "Glutathione (GSH)",
                "Vitamin C (Ascorbate)",
                "Vitamin E (Tocopherol)",
                "Uric Acid",
                "Alpha-Lipoic Acid",
                "Coenzyme Q10 (Ubiquinone)",
                "Melatonin",
                "Ferredoxin",
                "Ferritin"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Glutathione Reductase (GR)",
            "Glutathione S-Transferase (GST)",
            "Thioredoxin (TRX)",
            "Thioredoxin Reductase (TXNRD)",
            "Peroxiredoxin (PRDX)",
            "Glutaredoxin (GLRX)",
            "Selenium-dependent Glutathione Peroxidase",
            "Copper-Zinc Superoxide Dismutase (CuZnSOD)",
            "Manganese Superoxide Dismutase (MnSOD)",
            "Extracellular Superoxide Dismutase (ECSOD)",
            "Selenium-independent Glutathione Peroxidase",
            "Nicotinamide Nucleotide Transhydrogenase (NNT)",
            "Ferritin",
            "Hemoxygenase-1 (HO-1)",
            "Nrf2 (Nuclear factor erythroid 2-related factor 2)",
            "Keap1 (Kelch-like ECH-associated protein 1)",
            "SIRT1 (Sirtuin 1)",
            "PGC-1\u03b1 (Proliferator-activated receptor gamma coactivator 1-alpha)",
            "ApoE (Apolipoprotein E)",
            "Paraoxonase 1 (PON1)",
            "NQO1 (NAD(P)H Quinone Dehydrogenase 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione Reductase (GR)",
                "ApoE (Apolipoprotein E)",
                "NQO1 (NAD(P)H Quinone Dehydrogenase 1)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Glutathione S-Transferase (GST)",
                "Thioredoxin (TRX)",
                "Thioredoxin Reductase (TXNRD)",
                "Peroxiredoxin (PRDX)",
                "Glutaredoxin (GLRX)",
                "Selenium-dependent Glutathione Peroxidase",
                "Copper-Zinc Superoxide Dismutase (CuZnSOD)",
                "Manganese Superoxide Dismutase (MnSOD)",
                "Extracellular Superoxide Dismutase (ECSOD)",
                "Selenium-independent Glutathione Peroxidase",
                "Nicotinamide Nucleotide Transhydrogenase (NNT)",
                "Ferritin",
                "Hemoxygenase-1 (HO-1)",
                "Nrf2 (Nuclear factor erythroid 2-related factor 2)",
                "Keap1 (Kelch-like ECH-associated protein 1)",
                "SIRT1 (Sirtuin 1)",
                "PGC-1\u03b1 (Proliferator-activated receptor gamma coactivator 1-alpha)",
                "Paraoxonase 1 (PON1)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "apolipoprotein A-IV (Apoa4)",
                "apolipoprotein E (Apoe)",
                "apolipoprotein M (Apom)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "prostaglandin-endoperoxide synthase 1 (Ptgs1)",
                "prostaglandin-endoperoxide synthase 2 (Ptgs2)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase 1 (SOD1)",
            "Superoxide Dismutase 2 (SOD2)",
            "Superoxide Dismutase 3 (SOD3)",
            "Catalase (CAT)",
            "Glutathione Peroxidase 1 (GPX1)",
            "Glutathione Peroxidase 2 (GPX2)",
            "Glutathione Peroxidase 3 (GPX3)",
            "Glutathione Peroxidase 4 (GPX4)",
            "Glutathione Reductase (GR)",
            "Thioredoxin Reductase 1 (TXNRD1)",
            "Thioredoxin (TRX)",
            "Peroxiredoxin 1 (PRDX1)",
            "Peroxiredoxin 2 (PRDX2)",
            "Peroxiredoxin 3 (PRDX3)",
            "Peroxiredoxin 4 (PRDX4)",
            "Peroxiredoxin 5 (PRDX5)",
            "Peroxiredoxin 6 (PRDX6)",
            "Heme Oxygenase-1 (HMOX1)",
            "Sulfiredoxin 1 (Srxn1)",
            "Methionine Sulfoxide Reductase A (MsrA)",
            "Methionine Sulfoxide Reductase B (MsrB)",
            "DJ-1 (PARK7)",
            "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
            "Biliverdin Reductase A (BVR-A)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide Dismutase 1 (SOD1)",
                "Superoxide Dismutase 2 (SOD2)",
                "Superoxide Dismutase 3 (SOD3)",
                "Catalase (CAT)",
                "Glutathione Peroxidase 1 (GPX1)",
                "Glutathione Peroxidase 2 (GPX2)",
                "Glutathione Peroxidase 3 (GPX3)",
                "Glutathione Peroxidase 4 (GPX4)",
                "Thioredoxin Reductase 1 (TXNRD1)",
                "Peroxiredoxin 1 (PRDX1)",
                "Peroxiredoxin 2 (PRDX2)",
                "Peroxiredoxin 3 (PRDX3)",
                "Peroxiredoxin 4 (PRDX4)",
                "Peroxiredoxin 5 (PRDX5)",
                "Peroxiredoxin 6 (PRDX6)",
                "Sulfiredoxin 1 (Srxn1)",
                "DJ-1 (PARK7)"
            ],
            "mismatches": [
                "Glutathione Reductase (GR)",
                "Thioredoxin (TRX)",
                "Heme Oxygenase-1 (HMOX1)",
                "Methionine Sulfoxide Reductase A (MsrA)",
                "Methionine Sulfoxide Reductase B (MsrB)",
                "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
                "Biliverdin Reductase A (BVR-A)"
            ],
            "true_referents": [
                "Parkinson disease (autosomal recessive, early onset) 7 (Park7)",
                "catalase (Cat)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 3 (Gpx3)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "nucleoredoxin (Nxn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "peroxiredoxin like 2A (Prxl2a)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Glutathione Reductase (GR)",
            "Thioredoxin (Trx)",
            "Thioredoxin Reductase (TrxR)",
            "Peroxiredoxin (Prx)",
            "Glutaredoxin (Grx)",
            "NAD(P)H:quinone oxidoreductase 1 (NQO1)",
            "Heme Oxygenase-1 (HO-1)",
            "Ferritin",
            "Ceruloplasmin",
            "Methionine Sulfoxide Reductase (MsrA)",
            "Aldose Reductase (AR)",
            "Paraoxonase (PON1)",
            "Sulfiredoxin (Srx)",
            "Aryl Hydrocarbon Receptor (AhR)",
            "Nuclear Factor Erythroid 2-Related Factor 2 (Nrf2)",
            "Selenoprotein P (SelP)",
            "Copper Chaperone for Superoxide Dismutase (CCS)",
            "Extracellular Superoxide Dismutase (EC-SOD)",
            "Ubiquinol-Cytochrome c Reductase (Complex III)",
            "Cytochrome c Oxidase (Complex IV)",
            "NADH:ubiquinone oxidoreductase (Complex I)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin",
                "Sulfiredoxin (Srx)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Glutathione Reductase (GR)",
                "Thioredoxin (Trx)",
                "Thioredoxin Reductase (TrxR)",
                "Peroxiredoxin (Prx)",
                "Glutaredoxin (Grx)",
                "NAD(P)H:quinone oxidoreductase 1 (NQO1)",
                "Heme Oxygenase-1 (HO-1)",
                "Ferritin",
                "Methionine Sulfoxide Reductase (MsrA)",
                "Aldose Reductase (AR)",
                "Paraoxonase (PON1)",
                "Aryl Hydrocarbon Receptor (AhR)",
                "Nuclear Factor Erythroid 2-Related Factor 2 (Nrf2)",
                "Selenoprotein P (SelP)",
                "Copper Chaperone for Superoxide Dismutase (CCS)",
                "Extracellular Superoxide Dismutase (EC-SOD)",
                "Ubiquinol-Cytochrome c Reductase (Complex III)",
                "Cytochrome c Oxidase (Complex IV)",
                "NADH:ubiquinone oxidoreductase (Complex I)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "nucleoredoxin (Nxn)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein W (Selenow)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPX)",
            "Glutathione S-transferase (GST)",
            "Thioredoxin (TRX)",
            "Peroxiredoxin (PRDX)",
            "NADPH oxidase (NOX)",
            "Heme oxygenase-1 (HO-1)",
            "Ferritin (FT)",
            "Aldose reductase (AR)",
            "Ubiquitin-conjugating enzyme (UBE2)",
            "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
            "Aconitase (ACO)",
            "Lactate dehydrogenase (LDH)",
            "Dipeptidyl peptidase-4 (DPP-4)",
            "Methionine sulfoxide reductase (MSR)",
            "Selenoprotein P (SELENOP)",
            "Cysteine-rich protein 61 (CYR61)",
            "Heat shock protein 70 (HSP70)",
            "Heat shock protein 27 (HSP27)",
            "Ferroportin (FPN)",
            "Glutathione (GSH)",
            "Vitamin C (Ascorbic acid)",
            "Vitamin E (Tocopherol)",
            "Coenzyme Q10 (Ubiquinone)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPX)",
                "Glutathione S-transferase (GST)",
                "Thioredoxin (TRX)",
                "Peroxiredoxin (PRDX)",
                "NADPH oxidase (NOX)",
                "Heme oxygenase-1 (HO-1)",
                "Ferritin (FT)",
                "Aldose reductase (AR)",
                "Ubiquitin-conjugating enzyme (UBE2)",
                "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
                "Aconitase (ACO)",
                "Lactate dehydrogenase (LDH)",
                "Dipeptidyl peptidase-4 (DPP-4)",
                "Methionine sulfoxide reductase (MSR)",
                "Selenoprotein P (SELENOP)",
                "Cysteine-rich protein 61 (CYR61)",
                "Heat shock protein 70 (HSP70)",
                "Heat shock protein 27 (HSP27)",
                "Ferroportin (FPN)",
                "Glutathione (GSH)",
                "Vitamin C (Ascorbic acid)",
                "Vitamin E (Tocopherol)",
                "Coenzyme Q10 (Ubiquinone)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "apolipoprotein A-IV (Apoa4)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione peroxidase 7 (Gpx7)",
                "glutathione reductase (Gsr)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myoglobin (Mb)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)",
                "transformation related protein 53 inducible nuclear protein 1 (Trp53inp1)"
            ],
            "TP": 1,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Glutathione Reductase (GR)",
            "Glutathione S-Transferase (GST)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Thioredoxin Reductase (TrxR)",
            "Glutaredoxin (Grx)",
            "Glutathione-Synthetase (GSS)",
            "Glutamate-Cysteine Ligase (GCL)",
            "Methionine Sulfoxide Reductase (Msr)",
            "Coenzyme Q (CoQ)",
            "Vitamin E (\u03b1-Tocopherol)",
            "Vitamin C (Ascorbic Acid)",
            "Beta-Carotene",
            "Lipoic Acid",
            "Ferritin (FTH1)",
            "Heme Oxygenase-1 (HO-1)",
            "NAD(P)H Quinone Dehydrogenase 1 (NQO1)",
            "Glucose-6-Phosphate Dehydrogenase (G6PD)",
            "6-Phosphogluconate Dehydrogenase (6PGD)",
            "Haptoglobin",
            "Ceruloplasmin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione Reductase (GR)",
                "Haptoglobin",
                "Ceruloplasmin",
                "NAD(P)H Quinone Dehydrogenase 1 (NQO1)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Glutathione S-Transferase (GST)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Thioredoxin Reductase (TrxR)",
                "Glutaredoxin (Grx)",
                "Glutathione-Synthetase (GSS)",
                "Glutamate-Cysteine Ligase (GCL)",
                "Methionine Sulfoxide Reductase (Msr)",
                "Coenzyme Q (CoQ)",
                "Vitamin E (\u03b1-Tocopherol)",
                "Vitamin C (Ascorbic Acid)",
                "Beta-Carotene",
                "Lipoic Acid",
                "Ferritin (FTH1)",
                "Heme Oxygenase-1 (HO-1)",
                "Glucose-6-Phosphate Dehydrogenase (G6PD)",
                "6-Phosphogluconate Dehydrogenase (6PGD)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, alpha 2 (Yc2) (Gsta2)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin Z, beta-like embryonic chain (Hbb-bh1)",
                "myoglobin (Mb)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPx)",
            "Glutathione reductase (GR)",
            "Glutathione S-transferase (GST)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Heme oxygenase-1 (HO-1)",
            "Ferritin",
            "Metallothionein (MT)",
            "NADPH quinone oxidoreductase 1 (NQO1)",
            "Glutaredoxin (Grx)",
            "Glutathione synthetase (GSS)",
            "Glutathione peroxidase 4 (GPx4)",
            "Glutathione S-transferase omega-1 (GSTO1)",
            "Selenium-binding protein 1 (SELENBP1)",
            "Peroxiredoxin 1 (Prx1)",
            "Thioredoxin reductase 1 (TrxR1)",
            "Superoxide dismutase 2 (SOD2)",
            "Catalase-peroxidase (KatG)",
            "Glutathione peroxidase 1 (GPx1)",
            "Glutathione reductase 1 (GR1)",
            "Glutathione S-transferase alpha (GSTA)",
            "Peroxiredoxin 2 (Prx2)",
            "Thioredoxin 1 (Trx1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione peroxidase 4 (GPx4)",
                "Glutathione S-transferase omega-1 (GSTO1)",
                "Peroxiredoxin 1 (Prx1)",
                "Thioredoxin reductase 1 (TrxR1)",
                "Superoxide dismutase 2 (SOD2)",
                "Glutathione peroxidase 1 (GPx1)",
                "Peroxiredoxin 2 (Prx2)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Glutathione reductase (GR)",
                "Glutathione S-transferase (GST)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Heme oxygenase-1 (HO-1)",
                "Ferritin",
                "Metallothionein (MT)",
                "NADPH quinone oxidoreductase 1 (NQO1)",
                "Glutaredoxin (Grx)",
                "Glutathione synthetase (GSS)",
                "Selenium-binding protein 1 (SELENBP1)",
                "Catalase-peroxidase (KatG)",
                "Glutathione reductase 1 (GR1)",
                "Glutathione S-transferase alpha (GSTA)",
                "Thioredoxin 1 (Trx1)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase alpha 13 (Gsta13)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase omega 1 (Gsto1)",
                "glutathione S-transferase omega 2 (Gsto2)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin like 2A (Prxl2a)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 8,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase 1 (SOD1)",
            "Superoxide dismutase 2 (SOD2)",
            "Catalase (CAT)",
            "Glutathione peroxidase 1 (GPX1)",
            "Glutathione peroxidase 4 (GPX4)",
            "Peroxiredoxin 1 (PRDX1)",
            "Peroxiredoxin 2 (PRDX2)",
            "Peroxiredoxin 3 (PRDX3)",
            "Peroxiredoxin 4 (PRDX4)",
            "Peroxiredoxin 5 (PRDX5)",
            "Peroxiredoxin 6 (PRDX6)",
            "Thioredoxin (TXN)",
            "Thioredoxin reductase 1 (TXNRD1)",
            "NAD(P)H quinone dehydrogenase 1 (NQO1)",
            "Glutathione reductase (GSR)",
            "Heme oxygenase 1 (HMOX1)",
            "Heme oxygenase 2 (HMOX2)",
            "Ferritin (FT)",
            "Metallothionein 1A (MT1A)",
            "Metallothionein 2A (MT2A)",
            "Paraoxonase 1 (PON1)",
            "Sulfiredoxin (SRXN1)",
            "Glutaredoxin (GLRX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide dismutase 1 (SOD1)",
                "Superoxide dismutase 2 (SOD2)",
                "Catalase (CAT)",
                "Glutathione peroxidase 1 (GPX1)",
                "Glutathione peroxidase 4 (GPX4)",
                "Peroxiredoxin 1 (PRDX1)",
                "Peroxiredoxin 2 (PRDX2)",
                "Peroxiredoxin 3 (PRDX3)",
                "Peroxiredoxin 4 (PRDX4)",
                "Peroxiredoxin 5 (PRDX5)",
                "Peroxiredoxin 6 (PRDX6)",
                "Thioredoxin reductase 1 (TXNRD1)",
                "NAD(P)H quinone dehydrogenase 1 (NQO1)",
                "Glutathione reductase (GSR)",
                "Sulfiredoxin (SRXN1)"
            ],
            "mismatches": [
                "Thioredoxin (TXN)",
                "Heme oxygenase 1 (HMOX1)",
                "Heme oxygenase 2 (HMOX2)",
                "Ferritin (FT)",
                "Metallothionein 1A (MT1A)",
                "Metallothionein 2A (MT2A)",
                "Paraoxonase 1 (PON1)",
                "Glutaredoxin (GLRX)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "microsomal glutathione S-transferase 1 (Mgst1)",
                "microsomal glutathione S-transferase 2 (Mgst2)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "nucleoredoxin (Nxn)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "peroxiredoxin like 2A (Prxl2a)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 15,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPx)",
            "Thioredoxin (Trx)",
            "Peroxiredoxin (Prx)",
            "Glutathione reductase (GR)",
            "Thioredoxin reductase (TrxR)",
            "Glutathione S-transferase (GST)",
            "Heme oxygenase-1 (HO-1)",
            "NAD(P)H:quinone oxidoreductase 1 (NQO1)",
            "Metallothionein (MT)",
            "Ferritin",
            "Transferrin",
            "Ceruloplasmin",
            "Albumin",
            "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
            "Kelch-like ECH-associated protein 1 (Keap1)",
            "Paraoxonase (PON)",
            "Sulfiredoxin (Srx)",
            "Glutaredoxin (Grx)",
            "Methionine sulfoxide reductase (Msr)",
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "Ascorbate peroxidase (APX)",
            "DJ-1 (PARK7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione reductase (GR)",
                "Ceruloplasmin",
                "Sulfiredoxin (Srx)",
                "NAD(P)H:quinone oxidoreductase 1 (NQO1)",
                "DJ-1 (PARK7)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Thioredoxin (Trx)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin reductase (TrxR)",
                "Glutathione S-transferase (GST)",
                "Heme oxygenase-1 (HO-1)",
                "Metallothionein (MT)",
                "Ferritin",
                "Transferrin",
                "Albumin",
                "Nuclear factor erythroid 2-related factor 2 (Nrf2)",
                "Kelch-like ECH-associated protein 1 (Keap1)",
                "Paraoxonase (PON)",
                "Glutaredoxin (Grx)",
                "Methionine sulfoxide reductase (Msr)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Ascorbate peroxidase (APX)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "Parkinson disease (autosomal recessive, early onset) 7 (Park7)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "nucleoredoxin (Nxn)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPx)",
            "Glutathione reductase (GR)",
            "Glutathione S-transferase (GST)",
            "Thioredoxin (Trx)",
            "Thioredoxin reductase (TrxR)",
            "Peroxiredoxin (Prx)",
            "Heme oxygenase (HO)",
            "NAD(P)H quinone oxidoreductase 1 (NQO1)",
            "Glutaredoxin (Grx)",
            "Metallothionein (MT)",
            "Ferritin",
            "Ceruloplasmin",
            "Albumin",
            "Transferrin",
            "Glutathione synthetase (GSS)",
            "Gamma-glutamylcysteine synthetase (GCS)",
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconate dehydrogenase (6PGD)",
            "Glutathione transferase omega (GSTO)",
            "Glutathione transferase zeta (GSTZ)",
            "Glutathione transferase theta (GSTT)",
            "Glutathione transferase mu (GSTM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin",
                "Glutathione reductase (GR)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Glutathione S-transferase (GST)",
                "Thioredoxin (Trx)",
                "Thioredoxin reductase (TrxR)",
                "Peroxiredoxin (Prx)",
                "Heme oxygenase (HO)",
                "NAD(P)H quinone oxidoreductase 1 (NQO1)",
                "Glutaredoxin (Grx)",
                "Metallothionein (MT)",
                "Ferritin",
                "Albumin",
                "Transferrin",
                "Glutathione synthetase (GSS)",
                "Gamma-glutamylcysteine synthetase (GCS)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconate dehydrogenase (6PGD)",
                "Glutathione transferase omega (GSTO)",
                "Glutathione transferase zeta (GSTZ)",
                "Glutathione transferase theta (GSTT)",
                "Glutathione transferase mu (GSTM)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase omega 1 (Gsto1)",
                "glutathione S-transferase omega 2 (Gsto2)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, alpha 2 (Yc2) (Gsta2)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "myoglobin (Mb)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPX)",
            "Glutathione reductase (GSR)",
            "Thioredoxin reductase (TXNRD)",
            "Peroxiredoxin (PRDX)",
            "Glutaredoxin (GLRX)",
            "Sulfiredoxin (SRXN)",
            "Paraoxonase (PON)",
            "Heme oxygenase (HMOX)",
            "NADPH quinone oxidoreductase 1 (NQO1)",
            "Glutathione S-transferase (GST)",
            "Ferritin (FTH1, FTL)",
            "Metallothionein (MT)",
            "Superoxide reductase (SOR)",
            "Alkyl hydroperoxide reductase (AhpR)",
            "Thiol peroxidase (TPX)",
            "Peroxidase (PRX)",
            "Glutathione synthetase (GSS)",
            "Gamma-glutamylcysteine synthetase (GCLC, GCLM)",
            "Thioredoxin (TXN)",
            "Glutaredoxin (GLRX)",
            "DJ-1/Park7 protein",
            "Sestrin (SESN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione reductase (GSR)",
                "NADPH quinone oxidoreductase 1 (NQO1)",
                "DJ-1/Park7 protein"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPX)",
                "Thioredoxin reductase (TXNRD)",
                "Peroxiredoxin (PRDX)",
                "Glutaredoxin (GLRX)",
                "Sulfiredoxin (SRXN)",
                "Paraoxonase (PON)",
                "Heme oxygenase (HMOX)",
                "Glutathione S-transferase (GST)",
                "Ferritin (FTH1, FTL)",
                "Metallothionein (MT)",
                "Superoxide reductase (SOR)",
                "Alkyl hydroperoxide reductase (AhpR)",
                "Thiol peroxidase (TPX)",
                "Peroxidase (PRX)",
                "Glutathione synthetase (GSS)",
                "Gamma-glutamylcysteine synthetase (GCLC, GCLM)",
                "Thioredoxin (TXN)",
                "Sestrin (SESN)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "Parkinson disease (autosomal recessive, early onset) 7 (Park7)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, alpha 2 (Yc2) (Gsta2)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione peroxidase 7 (Gpx7)",
                "glutathione reductase (Gsr)",
                "hemoglobin Z, beta-like embryonic chain (Hbb-bh1)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "nucleoredoxin (Nxn)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "sestrin 2 (Sesn2)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 4,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Thioredoxin (TRX)",
            "Peroxiredoxin (PRX)",
            "Glutaredoxin (GRX)",
            "Heme Oxygenase-1 (HO-1)",
            "NAD(P)H Quinone Dehydrogenase 1 (NQO1)",
            "Gamma-Glutamylcysteine Synthetase (GCS)",
            "Glutathione Reductase (GR)",
            "Glucose-6-Phosphate Dehydrogenase (G6PD)",
            "Isocitrate Dehydrogenase (IDH)",
            "Ferritin (FTN)",
            "Metallothionein (MT)",
            "Biliverdin Reductase (BVR)",
            "Glutathione S-Transferase (GST)",
            "Haptoglobin (HP)",
            "Hemopexin (HPX)",
            "Ceruloplasmin (CP)",
            "Transferrin (TF)",
            "Albumin (ALB)",
            "Paraoxonase (PON)",
            "Lipoprotein-Associated Phospholipase A2 (Lp-PLA2)",
            "Glutathione-S-Transferase Omega (GSTO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "NAD(P)H Quinone Dehydrogenase 1 (NQO1)",
                "Glutathione Reductase (GR)",
                "Haptoglobin (HP)",
                "Ceruloplasmin (CP)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Thioredoxin (TRX)",
                "Peroxiredoxin (PRX)",
                "Glutaredoxin (GRX)",
                "Heme Oxygenase-1 (HO-1)",
                "Gamma-Glutamylcysteine Synthetase (GCS)",
                "Glucose-6-Phosphate Dehydrogenase (G6PD)",
                "Isocitrate Dehydrogenase (IDH)",
                "Ferritin (FTN)",
                "Metallothionein (MT)",
                "Biliverdin Reductase (BVR)",
                "Glutathione S-Transferase (GST)",
                "Hemopexin (HPX)",
                "Transferrin (TF)",
                "Albumin (ALB)",
                "Paraoxonase (PON)",
                "Lipoprotein-Associated Phospholipase A2 (Lp-PLA2)",
                "Glutathione-S-Transferase Omega (GSTO)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase omega 1 (Gsto1)",
                "glutathione S-transferase omega 2 (Gsto2)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, alpha 2 (Yc2) (Gsta2)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin like 2A (Prxl2a)",
                "prostaglandin-endoperoxide synthase 2 (Ptgs2)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase",
            "Glutathione peroxidase (GPx)",
            "Glutathione reductase",
            "Glutathione transferase",
            "Lactoperoxidase",
            "Myeloperoxidase",
            "Thioredoxin reductase",
            "Thioredoxin",
            "Peroxiredoxin",
            "Manganese superoxide dismutase",
            "Copper-zinc superoxide dismutase",
            "Mitochondrial manganese superoxide dismutase",
            "Endothelial nitric oxide synthase",
            "Neuronal nitric oxide synthase",
            "Inducible nitric oxide synthase",
            "Nitric oxide synthase",
            "Heme oxygenase-1",
            "Heme oxygenase-2",
            "Heme oxygenase-3",
            "GSTP1",
            "GSTA1",
            "GSTA2",
            "GSTA3",
            "GSTA4",
            "GSTA5",
            "GSTA6"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Glutathione reductase",
                "Lactoperoxidase",
                "Myeloperoxidase",
                "GSTA1",
                "GSTA2",
                "GSTA5"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Glutathione transferase",
                "Thioredoxin reductase",
                "Thioredoxin",
                "Peroxiredoxin",
                "Manganese superoxide dismutase",
                "Copper-zinc superoxide dismutase",
                "Mitochondrial manganese superoxide dismutase",
                "Endothelial nitric oxide synthase",
                "Neuronal nitric oxide synthase",
                "Inducible nitric oxide synthase",
                "Nitric oxide synthase",
                "Heme oxygenase-1",
                "Heme oxygenase-2",
                "Heme oxygenase-3",
                "GSTP1",
                "GSTA3",
                "GSTA4",
                "GSTA6"
            ],
            "true_referents": [
                "catalase (Cat)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase alpha 13 (Gsta13)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, alpha 2 (Yc2) (Gsta2)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, pi, pseudogene (Gstp-ps)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 3 (Gpx3)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione reductase (Gsr)",
                "lactoperoxidase (Lpo)",
                "leukotriene C4 synthase (Ltc4s)",
                "myeloperoxidase (Mpo)",
                "nucleoredoxin (Nxn)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "prostaglandin E synthase (Ptges)",
                "prostaglandin-endoperoxide synthase 1 (Ptgs1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 7,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase 1 (SOD1)",
            "Catalase (CAT)",
            "Glutathione Peroxidase 1 (GPX1)",
            "Glutathione Reductase (GSR)",
            "Glutathione S-Transferase Pi 1 (GSTP1)",
            "Thioredoxin 1 (TXN1)",
            "Thioredoxin Reductase 1 (TXNRD1)",
            "Ceruloplasmin (CP)",
            "Heme Oxygenase 1 (HMOX1)",
            "Ferritin Heavy Chain (FTH1)",
            "Ferritin Light Chain (FTL)",
            "Transferrin (TF)",
            "Lactoferrin (LTF)",
            "Albumin (ALB)",
            "Oxidized Low-Density Lipoprotein Receptor 1 (OLR1)",
            "Paraoxonase 1 (PON1)",
            "Vitamin C (Ascorbate)",
            "Vitamin E (Alpha-Tocopherol)",
            "Coenzyme Q10 (Ubiquinone)",
            "Glutathione (GSH)",
            "Cysteine (Cys)",
            "Methionine Sulfoxide Reductase A (MSRA)",
            " Peroxiredoxin 1 (PRDX1)",
            "Selenium-Binding Protein 1 (SBP1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide Dismutase 1 (SOD1)",
                "Catalase (CAT)",
                "Glutathione Peroxidase 1 (GPX1)",
                "Glutathione Reductase (GSR)",
                "Glutathione S-Transferase Pi 1 (GSTP1)",
                "Thioredoxin Reductase 1 (TXNRD1)",
                "Ceruloplasmin (CP)",
                "Peroxiredoxin 1 (PRDX1)"
            ],
            "mismatches": [
                "Thioredoxin 1 (TXN1)",
                "Heme Oxygenase 1 (HMOX1)",
                "Ferritin Heavy Chain (FTH1)",
                "Ferritin Light Chain (FTL)",
                "Transferrin (TF)",
                "Lactoferrin (LTF)",
                "Albumin (ALB)",
                "Oxidized Low-Density Lipoprotein Receptor 1 (OLR1)",
                "Paraoxonase 1 (PON1)",
                "Vitamin C (Ascorbate)",
                "Vitamin E (Alpha-Tocopherol)",
                "Coenzyme Q10 (Ubiquinone)",
                "Glutathione (GSH)",
                "Cysteine (Cys)",
                "Methionine Sulfoxide Reductase A (MSRA)",
                "Selenium-Binding Protein 1 (SBP1)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "hemoglobin X, alpha-like embryonic chain in Hba complex (Hba-x)",
                "hemoglobin Z, beta-like embryonic chain (Hbb-bh1)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase",
            "Catalase",
            "Glutathione peroxidase",
            "Thioredoxin",
            "Peroxiredoxin",
            "Peroxiredoxin 6",
            "Peroxiredoxin 5",
            "Peroxiredoxin 3",
            "Peroxiredoxin 2",
            "Peroxiredoxin 1",
            "Peroxiredoxin 4",
            "Thioredoxin reductase",
            "Thioredoxin glutathione reductase",
            "Glutathione peroxidase 4",
            "Glutathione peroxidase 5",
            "Glutathione peroxidase 6",
            "Glutathione peroxidase 7",
            "Glutathione peroxidase 8",
            "Glutathione peroxidase 9",
            "Glutathione peroxidase 10",
            "Glutathione peroxidase 11",
            "Glutathione peroxidase 12",
            "Glutathione peroxidase 13",
            "Glutathione peroxidase 14",
            "Glutathione peroxidase 15",
            "Glutathione peroxidase 16",
            "Glutathione peroxidase 17",
            "Glutathione peroxidase 18",
            "Glutathione peroxidase 19",
            "Glutathione peroxidase 20",
            "Glutathione peroxidase 21",
            "Glutathione peroxidase 22",
            "Glutathione peroxidase 23",
            "Glutathione peroxidase 24"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Peroxiredoxin 6",
                "Peroxiredoxin 5",
                "Peroxiredoxin 3",
                "Peroxiredoxin 2",
                "Peroxiredoxin 1",
                "Peroxiredoxin 4",
                "Glutathione peroxidase 4",
                "Glutathione peroxidase 5",
                "Glutathione peroxidase 6",
                "Glutathione peroxidase 7",
                "Glutathione peroxidase 8"
            ],
            "mismatches": [
                "Superoxide dismutase",
                "Glutathione peroxidase",
                "Thioredoxin",
                "Peroxiredoxin",
                "Thioredoxin reductase",
                "Thioredoxin glutathione reductase",
                "Glutathione peroxidase 9",
                "Glutathione peroxidase 10",
                "Glutathione peroxidase 11",
                "Glutathione peroxidase 12",
                "Glutathione peroxidase 13",
                "Glutathione peroxidase 14",
                "Glutathione peroxidase 15",
                "Glutathione peroxidase 16",
                "Glutathione peroxidase 17",
                "Glutathione peroxidase 18",
                "Glutathione peroxidase 19",
                "Glutathione peroxidase 20",
                "Glutathione peroxidase 21",
                "Glutathione peroxidase 22",
                "Glutathione peroxidase 23",
                "Glutathione peroxidase 24"
            ],
            "true_referents": [
                "catalase (Cat)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione peroxidase 7 (Gpx7)",
                "glutathione peroxidase 8 (putative) (Gpx8)",
                "glutathione reductase (Gsr)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "peroxiredoxin like 2A (Prxl2a)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 12,
            "FP": 22,
            "FN": 0
        }
    }
]