[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Catalase (CAT)",
            "Superoxide Dismutase (SOD)",
            "Glutathione Peroxidase (GPX)",
            "Heme Oxygenase-1 (HO-1)",
            "Paraoxonase 1 (PON1)",
            "Thioredoxin Reductase (TXNRD)",
            "Manganese Superoxide Dismutase (MnSOD)",
            "Copper-Zinc Superoxide Dismutase (CuZnSOD)",
            "Glutaredoxin (GRX)",
            "Peroxiredoxin (PRX)",
            "Elastase Inhibitor (AAT)",
            "Alpha-1 Antichymotrypsin (ACT)",
            "Alpha-2 Macroglobulin (A2M)",
            "Haptoglobin (HP)",
            "Transferrin (TF)",
            "Metallothionein (MT)",
            "Alpha-1 Antitrypsin (A1AT)",
            "Cystatin C (CST3)",
            "NAD(P)H Quinone Dehydrogenase 1 (NQO1)",
            "Selenoprotein P (SEPP1)",
            "Selenoprotein W (SEPW1)",
            "Selenium Binding Protein 1 (SELENBP1)",
            "Glutathione S-Transferase (GST)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Haptoglobin (HP)",
                "NAD(P)H Quinone Dehydrogenase 1 (NQO1)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPX)",
                "Heme Oxygenase-1 (HO-1)",
                "Paraoxonase 1 (PON1)",
                "Thioredoxin Reductase (TXNRD)",
                "Manganese Superoxide Dismutase (MnSOD)",
                "Copper-Zinc Superoxide Dismutase (CuZnSOD)",
                "Glutaredoxin (GRX)",
                "Peroxiredoxin (PRX)",
                "Elastase Inhibitor (AAT)",
                "Alpha-1 Antichymotrypsin (ACT)",
                "Alpha-2 Macroglobulin (A2M)",
                "Transferrin (TF)",
                "Metallothionein (MT)",
                "Alpha-1 Antitrypsin (A1AT)",
                "Cystatin C (CST3)",
                "Selenoprotein P (SEPP1)",
                "Selenoprotein W (SEPW1)",
                "Selenium Binding Protein 1 (SELENBP1)",
                "Glutathione S-Transferase (GST)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "hemoglobin alpha, adult chain 2 (Hba-a2)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "microsomal glutathione S-transferase 3 (Mgst3)",
                "myeloperoxidase (Mpo)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Glutathione peroxidase (GPx)",
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Glutaredoxin (Grx)",
            "MnSOD (Manganese superoxide dismutase)",
            "CuZnSOD (Copper-zinc superoxide dismutase)",
            "EcSOD (Extracellular superoxide dismutase)",
            "Prdx6 (Peroxiredoxin-6)",
            "TrxR1 (Thioredoxin reductase 1)",
            "TrxR2 (Thioredoxin reductase 2)",
            "Grx1 (Glutaredoxin 1)",
            "Prdx1 (Peroxiredoxin 1)",
            "Prdx2 (Peroxiredoxin 2)",
            "Prdx3 (Peroxiredoxin 3)",
            "Prdx4 (Peroxiredoxin 4)",
            "Prdx5 (Peroxiredoxin 5)",
            "GPx1 (Glutathione peroxidase 1)",
            "GPx2 (Glutathione peroxidase 2)",
            "GPx3 (Glutathione peroxidase 3)",
            "GPx4 (Glutathione peroxidase 4)",
            "GPx6 (Glutathione peroxidase 6)",
            "GPx7 (Glutathione peroxidase 7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Prdx1 (Peroxiredoxin 1)",
                "Prdx2 (Peroxiredoxin 2)",
                "Prdx3 (Peroxiredoxin 3)",
                "Prdx4 (Peroxiredoxin 4)",
                "Prdx5 (Peroxiredoxin 5)",
                "Prdx6 (Peroxiredoxin-6)",
                "TrxR1 (Thioredoxin reductase 1)",
                "TrxR2 (Thioredoxin reductase 2)",
                "GPx1 (Glutathione peroxidase 1)",
                "GPx2 (Glutathione peroxidase 2)",
                "GPx3 (Glutathione peroxidase 3)",
                "GPx4 (Glutathione peroxidase 4)",
                "GPx6 (Glutathione peroxidase 6)",
                "GPx7 (Glutathione peroxidase 7)"
            ],
            "mismatches": [
                "Glutathione peroxidase (GPx)",
                "Superoxide dismutase (SOD)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Glutaredoxin (Grx)",
                "MnSOD (Manganese superoxide dismutase)",
                "CuZnSOD (Copper-zinc superoxide dismutase)",
                "EcSOD (Extracellular superoxide dismutase)",
                "Grx1 (Glutaredoxin 1)"
            ],
            "true_referents": [
                "catalase (Cat)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 3 (Gpx3)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione peroxidase 7 (Gpx7)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "peroxiredoxin like 2A (Prxl2a)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase",
            "Glutathione Peroxidase",
            "Thioredoxin",
            "Glutathione S-transferase",
            "Peroxiredoxin",
            "Heme Oxygenase-1",
            "Ferritin",
            "Ceruloplasmin",
            "Metallothionein",
            "Paraoxonase 1",
            "Paraoxonase 2",
            "Paraoxonase 3",
            "Prdx5",
            "Prdx6",
            "Nrf2",
            "Prx1",
            "Prx2",
            "Prx3",
            "Prx4",
            "Prx5",
            "Prx6",
            "PrxQ",
            "PrxS"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Ceruloplasmin",
                "Prdx5",
                "Prdx6"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase",
                "Thioredoxin",
                "Glutathione S-transferase",
                "Peroxiredoxin",
                "Heme Oxygenase-1",
                "Ferritin",
                "Metallothionein",
                "Paraoxonase 1",
                "Paraoxonase 2",
                "Paraoxonase 3",
                "Nrf2",
                "Prx1",
                "Prx2",
                "Prx3",
                "Prx4",
                "PrxQ",
                "PrxS"
            ],
            "true_referents": [
                "apolipoprotein E (Apoe)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 3 (Gpx3)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "myoglobin (Mb)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "peroxiredoxin 6B (Prdx6b)",
                "peroxiredoxin like 2A (Prxl2a)",
                "peroxiredoxin like 2B (Prxl2b)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 4,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Glutathione Reductase (GR)",
            "Peroxiredoxins (PRDX)",
            "Heme Oxygenase-1 (HO-1)",
            "Thioredoxin Reductase (TrxR)",
            "Thioredoxin (Trx)",
            "Albumin (ALB)",
            "Ceruloplasmin (CP)",
            "Transferrin (TF)",
            "Lactoferrin (LF)",
            "Metallothioneins (MT)",
            "Lipoxygenase (LOX)",
            "Uric Acid (UA)",
            "Serum Amyloid A (SAA)",
            "Haptoglobin (HP)",
            "Apolipoprotein A1 (APOA1)",
            "Paraoxonase 1 (PON1)",
            "Selenoprotein P (SEPP1)",
            "DJ-1 (PARK7)",
            "Nuclear Factor Erythroid 2-Related Factor 2 (Nrf2)",
            "Thioredoxin-interacting protein (TXNIP)",
            "Copper-Zinc Superoxide Dismutase (CuZnSOD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin (CP)",
                "Haptoglobin (HP)",
                "DJ-1 (PARK7)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Glutathione Reductase (GR)",
                "Peroxiredoxins (PRDX)",
                "Heme Oxygenase-1 (HO-1)",
                "Thioredoxin Reductase (TrxR)",
                "Thioredoxin (Trx)",
                "Albumin (ALB)",
                "Transferrin (TF)",
                "Lactoferrin (LF)",
                "Metallothioneins (MT)",
                "Lipoxygenase (LOX)",
                "Uric Acid (UA)",
                "Serum Amyloid A (SAA)",
                "Apolipoprotein A1 (APOA1)",
                "Paraoxonase 1 (PON1)",
                "Selenoprotein P (SEPP1)",
                "Nuclear Factor Erythroid 2-Related Factor 2 (Nrf2)",
                "Thioredoxin-interacting protein (TXNIP)",
                "Copper-Zinc Superoxide Dismutase (CuZnSOD)"
            ],
            "true_referents": [
                "Parkinson disease (autosomal recessive, early onset) 7 (Park7)",
                "S100 calcium binding protein A8 (calgranulin A) (S100a8)",
                "S100 calcium binding protein A9 (calgranulin B) (S100a9)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "apolipoprotein A-IV (Apoa4)",
                "apolipoprotein E (Apoe)",
                "apolipoprotein M (Apom)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "leukotriene C4 synthase (Ltc4s)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 5 (Prdx5)",
                "peroxiredoxin 6 (Prdx6)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Thioredoxin (Trx)",
            "Peroxiredoxin (Prx)",
            "Glutaredoxin (Grx)",
            "Ceruloplasmin (CP)",
            "Hemoglobin (Hb)",
            "Myoglobin (Mb)",
            "Lactoferrin (Lf)",
            "Transferrin (Tf)",
            "Albumin (Alb)",
            "Ferritin (Ft)",
            "Paraoxonase (PON)",
            "Aldose Reductase (AR)",
            "Methionine Sulfoxide Reductase (Msr)",
            "Coenzyme Q10 (CoQ10)",
            "Haptoglobin (Hp)",
            "Alpha-1-antitrypsin (A1AT)",
            "Selenium-binding protein (SBP)",
            "Uricase (UOX)",
            "Bilirubin (BIL)",
            "Alpha-lipoic acid (ALA)",
            "NAD(P)H:quinone oxidoreductase 1 (NQO1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin (CP)",
                "Myoglobin (Mb)",
                "Haptoglobin (Hp)",
                "NAD(P)H:quinone oxidoreductase 1 (NQO1)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Thioredoxin (Trx)",
                "Peroxiredoxin (Prx)",
                "Glutaredoxin (Grx)",
                "Hemoglobin (Hb)",
                "Lactoferrin (Lf)",
                "Transferrin (Tf)",
                "Albumin (Alb)",
                "Ferritin (Ft)",
                "Paraoxonase (PON)",
                "Aldose Reductase (AR)",
                "Methionine Sulfoxide Reductase (Msr)",
                "Coenzyme Q10 (CoQ10)",
                "Alpha-1-antitrypsin (A1AT)",
                "Selenium-binding protein (SBP)",
                "Uricase (UOX)",
                "Bilirubin (BIL)",
                "Alpha-lipoic acid (ALA)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "hemoglobin beta, bh2 (Hbb-bh2)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult s chain (Hbb-bs)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Glutathione peroxidase (GPx)",
            "Catalase (CAT)",
            "Thioredoxin (Trx)",
            "Peroxiredoxin (Prx)",
            "Hemopexin (Hx)",
            "Ceruloplasmin (Cp)",
            "Albumin (Alb)",
            "Ferritin (Ft)",
            "Lactoferrin (Lf)",
            "Alpha-1-antitrypsin (A1AT)",
            "Heat shock protein 70 (Hsp70)",
            "Nrf2 (Nuclear factor erythroid 2-related factor 2)",
            "Apolipoprotein A1 (ApoA1)",
            "Glutathione S-transferase (GST)",
            "Alpha-lipoic acid protein (ALAP)",
            "Bilirubin (indirect, as a protein-bound antioxidant)",
            "Vitamin D binding protein (DBP)",
            "Cystatin C (CysC)",
            "Selenium-binding protein 1 (SBP1)",
            "Fetuin-A (FetA)",
            "Resistin (Retn)",
            "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-kB)",
            "Myeloperoxidase (MPO)",
            "Interleukin-6 (IL-6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin (Cp)",
                "Myeloperoxidase (MPO)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Thioredoxin (Trx)",
                "Peroxiredoxin (Prx)",
                "Hemopexin (Hx)",
                "Albumin (Alb)",
                "Ferritin (Ft)",
                "Lactoferrin (Lf)",
                "Alpha-1-antitrypsin (A1AT)",
                "Heat shock protein 70 (Hsp70)",
                "Nrf2 (Nuclear factor erythroid 2-related factor 2)",
                "Apolipoprotein A1 (ApoA1)",
                "Glutathione S-transferase (GST)",
                "Alpha-lipoic acid protein (ALAP)",
                "Bilirubin (indirect, as a protein-bound antioxidant)",
                "Vitamin D binding protein (DBP)",
                "Cystatin C (CysC)",
                "Selenium-binding protein 1 (SBP1)",
                "Fetuin-A (FetA)",
                "Resistin (Retn)",
                "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-kB)",
                "Interleukin-6 (IL-6)"
            ],
            "true_referents": [
                "S100 calcium binding protein A8 (calgranulin A) (S100a8)",
                "S100 calcium binding protein A9 (calgranulin B) (S100a9)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "apolipoprotein A-IV (Apoa4)",
                "apolipoprotein E (Apoe)",
                "apolipoprotein M (Apom)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "fatty acid binding protein 1, liver (Fabp1)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, alpha 2 (Yc2) (Gsta2)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "haptoglobin (Hp)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult minor chain (Hbb-b2)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "sestrin 2 (Sesn2)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)",
                "transformation related protein 53 inducible nuclear protein 1 (Trp53inp1)"
            ],
            "TP": 3,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Thioredoxin (Trx)",
            "Peroxiredoxin (Prx)",
            "Glutaredoxin (Grx)",
            "Glutathione S-transferase (GST)",
            "Metallothionein (MT)",
            "Ceruloplasmin (CP)",
            "Ferritin (FT)",
            "Transferrin (TF)",
            "Hemopexin (HPX)",
            "Haptoglobin (Hp)",
            "Albumin (Alb)",
            "Alpha-1 antitrypsin (A1AT)",
            "Coenzyme Q10 (CoQ10)",
            "Melanotransferrin (MTf)",
            "Alpha Lipoic Acid (ALA)",
            "Uric Acid (UA)",
            "Vitamin E (Vit E)",
            "Vitamin C (Vit C)",
            "Vitamin A (Vit A)",
            "Betacarotene (BC)",
            "Selenium (Se)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin (CP)",
                "Haptoglobin (Hp)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Thioredoxin (Trx)",
                "Peroxiredoxin (Prx)",
                "Glutaredoxin (Grx)",
                "Glutathione S-transferase (GST)",
                "Metallothionein (MT)",
                "Ferritin (FT)",
                "Transferrin (TF)",
                "Hemopexin (HPX)",
                "Albumin (Alb)",
                "Alpha-1 antitrypsin (A1AT)",
                "Coenzyme Q10 (CoQ10)",
                "Melanotransferrin (MTf)",
                "Alpha Lipoic Acid (ALA)",
                "Uric Acid (UA)",
                "Vitamin E (Vit E)",
                "Vitamin C (Vit C)",
                "Vitamin A (Vit A)",
                "Betacarotene (BC)",
                "Selenium (Se)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase",
            "Glutathione peroxidase",
            "Glutathione reductase",
            "Peroxiredoxin",
            "Thioredoxin",
            "Ferritin",
            "Transferrin",
            "Hemoglobin",
            "Myoglobin",
            "Cytochrome c",
            "Glutathione-S-transferase (GST)",
            "Glutathione reductase",
            "Glutathione peroxidase",
            "Glutathione synthetase",
            "Glutathione transferase",
            "Superoxide dismutase (SOD)",
            "Catalase",
            "Peroxiredoxin",
            "Thioredoxin",
            "Ferritin",
            "Transferrin",
            "Hemoglobin",
            "Myoglobin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Glutathione reductase",
                "Myoglobin"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase",
                "Peroxiredoxin",
                "Thioredoxin",
                "Ferritin",
                "Transferrin",
                "Hemoglobin",
                "Cytochrome c",
                "Glutathione-S-transferase (GST)",
                "Glutathione synthetase",
                "Glutathione transferase"
            ],
            "true_referents": [
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione reductase (Gsr)",
                "hemoglobin beta, bh2 (Hbb-bh2)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "myoglobin (Mb)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPx)",
            "Glutathione reductase (GR)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Glutaredoxin (Grx)",
            "Ferritin",
            "Lactoferrin",
            "Albumin",
            "Metallothionein",
            "Paraoxonase (PON)",
            "Transferrin",
            "Heme oxygenase (HO)",
            "Hemoglobin",
            "Myoglobin",
            "Ribonuclease",
            "C-reactive protein (CRP)",
            "Alpha-lactalbumin",
            "Keratin",
            "Selenoprotein P (SEPP1)",
            "Vitamin D-binding protein",
            "Prion protein (PrP)",
            "Haptoglobin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Glutathione reductase (GR)",
                "Hemoglobin",
                "Myoglobin",
                "Haptoglobin"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Glutaredoxin (Grx)",
                "Ferritin",
                "Lactoferrin",
                "Albumin",
                "Metallothionein",
                "Paraoxonase (PON)",
                "Transferrin",
                "Heme oxygenase (HO)",
                "Ribonuclease",
                "C-reactive protein (CRP)",
                "Alpha-lactalbumin",
                "Keratin",
                "Selenoprotein P (SEPP1)",
                "Vitamin D-binding protein",
                "Prion protein (PrP)"
            ],
            "true_referents": [
                "S100 calcium binding protein A8 (calgranulin A) (S100a8)",
                "S100 calcium binding protein A9 (calgranulin B) (S100a9)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "apolipoprotein E (Apoe)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "fatty acid binding protein 1, liver (Fabp1)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "hemoglobin beta, bh2 (Hbb-bh2)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione peroxidase (GPx)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Glutaredoxin (Grx)",
            "Heme oxygenase-1 (HO-1)",
            "Paraoxonase (PON)",
            "Albumin",
            "Ferritin",
            "Transferrin",
            "Ceruloplasmin",
            "Metallothionein",
            "Alpha-1-microglobulin (A1M)",
            "Bilirubin",
            "Uric acid",
            "Melatonin",
            "Coenzyme Q10 (CoQ10)",
            "Alpha-lipoic acid (ALA)",
            "Glutathione S-transferase (GST)",
            "Sulfiredoxin (Srx)",
            "Sestrin",
            "DJ-1 (PARK7)",
            "Methionine sulfoxide reductase (Msr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin",
                "Alpha-1-microglobulin (A1M)",
                "Sulfiredoxin (Srx)",
                "DJ-1 (PARK7)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Glutaredoxin (Grx)",
                "Heme oxygenase-1 (HO-1)",
                "Paraoxonase (PON)",
                "Albumin",
                "Ferritin",
                "Transferrin",
                "Metallothionein",
                "Bilirubin",
                "Uric acid",
                "Melatonin",
                "Coenzyme Q10 (CoQ10)",
                "Alpha-lipoic acid (ALA)",
                "Glutathione S-transferase (GST)",
                "Sestrin",
                "Methionine sulfoxide reductase (Msr)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "Parkinson disease (autosomal recessive, early onset) 7 (Park7)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin X, alpha-like embryonic chain in Hba complex (Hba-x)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "nucleoredoxin (Nxn)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "sestrin 2 (Sesn2)",
                "sulfiredoxin 1 homolog (S. cerevisiae) (Srxn1)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Catalase (CAT)",
            "Superoxide dismutase (SOD)",
            "Glutathione peroxidase (GPx)",
            "Thioredoxin (Trx)",
            "Peroxiredoxin (Prx)",
            "Glutathione S-transferase (GST)",
            "Heme oxygenase (HO)",
            "Ferritin",
            "Metallothionein (MT)",
            "Albumin",
            "Ceruloplasmin",
            "Transferrin",
            "Lactoferrin",
            "Hemopexin",
            "Haptoglobin",
            "Bilirubin",
            "Uric acid",
            "Melatonin",
            "Coenzyme Q10 (CoQ10)",
            "Cytochrome c",
            "Glutaredoxin (Grx)",
            "Protein disulfide isomerase (PDI)",
            "Selenoprotein P (SelP)",
            "Selenoprotein W (SelW)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin",
                "Haptoglobin",
                "Selenoprotein W (SelW)"
            ],
            "mismatches": [
                "Superoxide dismutase (SOD)",
                "Glutathione peroxidase (GPx)",
                "Thioredoxin (Trx)",
                "Peroxiredoxin (Prx)",
                "Glutathione S-transferase (GST)",
                "Heme oxygenase (HO)",
                "Ferritin",
                "Metallothionein (MT)",
                "Albumin",
                "Transferrin",
                "Lactoferrin",
                "Hemopexin",
                "Bilirubin",
                "Uric acid",
                "Melatonin",
                "Coenzyme Q10 (CoQ10)",
                "Cytochrome c",
                "Glutaredoxin (Grx)",
                "Protein disulfide isomerase (PDI)",
                "Selenoprotein P (SelP)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "S100 calcium binding protein A9 (calgranulin B) (S100a9)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "haptoglobin (Hp)",
                "lactoperoxidase (Lpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein F (Selenof)",
                "selenoprotein S (Selenos)",
                "selenoprotein W (Selenow)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "superoxide dismutase (SOD)",
            "catalase",
            "glutathione peroxidase",
            "thioredoxin",
            "peroxiredoxin",
            "glutaredoxin",
            "metallothionein",
            "ferritin",
            "ceruloplasmin",
            "albumin",
            "transferrin",
            "haptoglobin",
            "hemopexin",
            "bilirubin",
            "uric acid",
            "vitamin C (ascorbic acid)",
            "vitamin E (tocopherol)",
            "carotenoids",
            "flavonoids",
            "polyphenols",
            "selenium-containing proteins",
            "melatonin",
            "lipoic acid",
            "coenzyme Q10"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "catalase",
                "ceruloplasmin",
                "haptoglobin"
            ],
            "mismatches": [
                "superoxide dismutase (SOD)",
                "glutathione peroxidase",
                "thioredoxin",
                "peroxiredoxin",
                "glutaredoxin",
                "metallothionein",
                "ferritin",
                "albumin",
                "transferrin",
                "hemopexin",
                "bilirubin",
                "uric acid",
                "vitamin C (ascorbic acid)",
                "vitamin E (tocopherol)",
                "carotenoids",
                "flavonoids",
                "polyphenols",
                "selenium-containing proteins",
                "melatonin",
                "lipoic acid",
                "coenzyme Q10"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase kappa 1 (Gstk1)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase (CAT)",
            "Glutathione Peroxidase (GPx)",
            "Thioredoxin (TRX)",
            "Peroxiredoxin (PRX)",
            "Heme Oxygenase-1 (HO-1)",
            "Metallothionein (MT)",
            "Ferritin (FTN)",
            "Glutaredoxin (GRX)",
            "Bilirubin (BLR)",
            "Uric Acid (UA)",
            "Albumin (ALB)",
            "Transferrin (TF)",
            "Ceruloplasmin (CP)",
            "Paraoxonase (PON)",
            "Glutathione S-Transferase (GST)",
            "Haptoglobin (HP)",
            "Hemopexin (HPX)",
            "Vitamin C (Ascorbic Acid)",
            "Vitamin E (Tocopherol)",
            "Carotenoids",
            "Flavonoids",
            "Coenzyme Q10 (CoQ10)",
            "Lipoic Acid (LA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase (CAT)",
                "Ceruloplasmin (CP)",
                "Haptoglobin (HP)"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Thioredoxin (TRX)",
                "Peroxiredoxin (PRX)",
                "Heme Oxygenase-1 (HO-1)",
                "Metallothionein (MT)",
                "Ferritin (FTN)",
                "Glutaredoxin (GRX)",
                "Bilirubin (BLR)",
                "Uric Acid (UA)",
                "Albumin (ALB)",
                "Transferrin (TF)",
                "Paraoxonase (PON)",
                "Glutathione S-Transferase (GST)",
                "Hemopexin (HPX)",
                "Vitamin C (Ascorbic Acid)",
                "Vitamin E (Tocopherol)",
                "Carotenoids",
                "Flavonoids",
                "Coenzyme Q10 (CoQ10)",
                "Lipoic Acid (LA)"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione S-transferase, theta 2 (Gstt2)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 5 (Gpx5)",
                "glutathione peroxidase 6 (Gpx6)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "hemoglobin, beta adult t chain (Hbb-bt)",
                "lactoperoxidase (Lpo)",
                "myeloperoxidase (Mpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Glutathione (GSH)",
            "Superoxide Dismutase (SOD)",
            "Catalase",
            "Glutaredoxin",
            "Thioredoxin",
            "Ferritin",
            "Heme Oxygenase-1 (HO-1)",
            "Nrf2",
            "Haemopexin",
            "Oxidoreductase",
            "Peroxiredoxin",
            "Vitamin D-binding protein",
            "Alpha-lipoic acid",
            "Coenzyme Q10",
            "Ubiquinol",
            "Selenium-binding protein",
            "Glutathione peroxidase",
            "Glutathione reductase",
            "Thioredoxin reductase",
            "Cysteine-rich protein",
            "Antioxidant protein 1",
            "Antioxidant protein 2",
            "Antioxidant protein 3",
            "Antioxidant protein 4"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Glutathione reductase",
                "Thioredoxin reductase"
            ],
            "mismatches": [
                "Glutathione (GSH)",
                "Superoxide Dismutase (SOD)",
                "Glutaredoxin",
                "Thioredoxin",
                "Ferritin",
                "Heme Oxygenase-1 (HO-1)",
                "Nrf2",
                "Haemopexin",
                "Oxidoreductase",
                "Peroxiredoxin",
                "Vitamin D-binding protein",
                "Alpha-lipoic acid",
                "Coenzyme Q10",
                "Ubiquinol",
                "Selenium-binding protein",
                "Glutathione peroxidase",
                "Cysteine-rich protein",
                "Antioxidant protein 1",
                "Antioxidant protein 2",
                "Antioxidant protein 3",
                "Antioxidant protein 4"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "S100 calcium binding protein A8 (calgranulin A) (S100a8)",
                "S100 calcium binding protein A9 (calgranulin B) (S100a9)",
                "apolipoprotein A-IV (Apoa4)",
                "arachidonate 5-lipoxygenase activating protein (Alox5ap)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "fatty acid binding protein 1, liver (Fabp1)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 3 (Gpx3)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "selenoprotein S (Selenos)",
                "selenoprotein T (Selenot)",
                "selenoprotein W (Selenow)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            "Superoxide Dismutase (SOD)",
            "Catalase",
            "Glutathione Peroxidase (GPx)",
            "Peroxiredoxin (Prx)",
            "Thioredoxin (Trx)",
            "Glutathione Reductase",
            "Ceruloplasmin",
            "Hemopexin",
            "Haptoglobin",
            "Lactoferrin",
            "Transferrin",
            "Ferritin",
            "Albumin",
            "Alpha-1 Antitrypsin",
            "Hemoglobin",
            "Myoglobin",
            "Cytochrome c",
            "Ceruloplasmin",
            "Ferritin",
            "Lactoferrin",
            "Transferrin",
            "Alpha-Lactalbumin",
            "Ovotransferrin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Glutathione Reductase",
                "Ceruloplasmin",
                "Haptoglobin",
                "Hemoglobin",
                "Myoglobin"
            ],
            "mismatches": [
                "Superoxide Dismutase (SOD)",
                "Glutathione Peroxidase (GPx)",
                "Peroxiredoxin (Prx)",
                "Thioredoxin (Trx)",
                "Hemopexin",
                "Lactoferrin",
                "Transferrin",
                "Ferritin",
                "Albumin",
                "Alpha-1 Antitrypsin",
                "Cytochrome c",
                "Alpha-Lactalbumin",
                "Ovotransferrin"
            ],
            "true_referents": [
                "S100 calcium binding protein A8 (calgranulin A) (S100a8)",
                "S100 calcium binding protein A9 (calgranulin B) (S100a9)",
                "alpha 1 microglobulin/bikunin precursor (Ambp)",
                "catalase (Cat)",
                "ceruloplasmin (Cp)",
                "cytoglobin (Cygb)",
                "eosinophil peroxidase (Epx)",
                "glutathione S-transferase alpha 5 (Gsta5)",
                "glutathione S-transferase pi 3 (Gstp3)",
                "glutathione S-transferase, alpha 1 (Ya) (Gsta1)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione S-transferase, pi 2 (Gstp2)",
                "glutathione S-transferase, theta 1 (Gstt1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 2 (Gpx2)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione reductase (Gsr)",
                "haptoglobin (Hp)",
                "hemoglobin alpha, adult chain 1 (Hba-a1)",
                "hemoglobin beta, bh2 (Hbb-bh2)",
                "hemoglobin, beta adult major chain (Hbb-b1)",
                "lactoperoxidase (Lpo)",
                "myoglobin (Mb)",
                "peroxidasin (Pxdn)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 3 (Prdx3)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)",
                "thioredoxin reductase 2 (Txnrd2)",
                "thioredoxin reductase 3 (Txnrd3)"
            ],
            "TP": 6,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "antioxidant system protein",
        "domain": "biology",
        "response": [
            {
                "Referent": "Vitamin E",
                "Canonical Name": "Vitamin E"
            },
            {
                "Referent": "Vitamin C",
                "Canonical Name": "Vitamin C"
            },
            {
                "Referent": "Glutathione",
                "Canonical Name": "Glutathione"
            },
            {
                "Referent": "Coenzyme Q10",
                "Canonical Name": "Coenzyme Q10"
            },
            {
                "Referent": "Superoxide dismutase",
                "Canonical Name": "Superoxide dismutase"
            },
            {
                "Referent": "Catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "Glutathione peroxidase",
                "Canonical Name": "Glutathione peroxidase"
            },
            {
                "Referent": "Peroxiredoxin",
                "Canonical Name": "Peroxiredoxin"
            },
            {
                "Referent": "Thioredoxin",
                "Canonical Name": "Thioredoxin"
            },
            {
                "Referent": "Peroxiredoxin 6",
                "Canonical Name": "Peroxiredoxin 6"
            },
            {
                "Referent": "Peroxiredoxin 5",
                "Canonical Name": "Peroxiredoxin 5"
            },
            {
                "Referent": "Peroxiredoxin 3",
                "Canonical Name": "Peroxiredoxin 3"
            },
            {
                "Referent": "Peroxiredoxin 2",
                "Canonical Name": "Peroxiredoxin 2"
            },
            {
                "Referent": "Peroxiredoxin 1",
                "Canonical Name": "Peroxiredoxin 1"
            },
            {
                "Referent": "Peroxiredoxin 4",
                "Canonical Name": "Peroxiredoxin 4"
            },
            {
                "Referent": "Peroxiredoxin 8",
                "Canonical Name": "Peroxiredoxin 8"
            },
            {
                "Referent": "Peroxiredoxin 7",
                "Canonical Name": "Peroxiredoxin 7"
            },
            {
                "Referent": "Peroxiredoxin 10",
                "Canonical Name": "Peroxiredoxin 10"
            },
            {
                "Referent": "Peroxiredoxin 9",
                "Canonical Name": "Peroxiredoxin 9"
            },
            {
                "Referent": "Peroxiredoxin 11",
                "Canonical Name": "Peroxiredoxin 11"
            },
            {
                "Referent": "Peroxiredoxin 12",
                "Canonical Name": "Peroxiredoxin 12"
            },
            {
                "Referent": "Peroxiredoxin 13",
                "Canonical Name": "Peroxiredoxin 13"
            },
            {
                "Referent": "Peroxiredoxin 14",
                "Canonical Name": "Peroxiredoxin 14"
            },
            {
                "Referent": "Peroxiredoxin 15",
                "Canonical Name": "Peroxiredoxin 15"
            },
            {
                "Referent": "Peroxiredoxin 16",
                "Canonical Name": "Peroxiredoxin 16"
            },
            {
                "Referent": "Peroxiredoxin 17",
                "Canonical Name": "Peroxiredoxin 17"
            },
            {
                "Referent": "Peroxiredoxin 18",
                "Canonical Name": "Peroxiredoxin 18"
            },
            {
                "Referent": "Peroxiredoxin 19",
                "Canonical Name": "Peroxiredoxin 19"
            },
            {
                "Referent": "Peroxiredoxin 20",
                "Canonical Name": "Peroxiredoxin 20"
            },
            {
                "Referent": "Peroxiredoxin 21",
                "Canonical Name": "Peroxiredoxin 21"
            },
            {
                "Referent": "Peroxiredoxin 22",
                "Canonical Name": "Peroxiredoxin 22"
            },
            {
                "Referent": "Peroxiredoxin 23",
                "Canonical Name": "Peroxiredoxin 23"
            },
            {
                "Referent": "Peroxiredoxin 24",
                "Canonical Name": "Peroxiredoxin 24"
            },
            {
                "Referent": "Peroxiredoxin 25",
                "Canonical Name": "Peroxiredoxin 25"
            },
            {
                "Referent": "Peroxiredoxin 26",
                "Canonical Name": "Peroxiredoxin 26"
            },
            {
                "Referent": "Peroxiredoxin 27",
                "Canonical Name": "Peroxiredoxin 27"
            },
            {
                "Referent": "Peroxiredoxin 28",
                "Canonical Name": "Peroxiredoxin 28"
            },
            {
                "Referent": "Peroxiredoxin 29",
                "Canonical Name": "Peroxiredoxin 29"
            },
            {
                "Referent": "Peroxiredoxin 30",
                "Canonical Name": "Peroxiredoxin 30"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Catalase",
                "Peroxiredoxin 1",
                "Peroxiredoxin 2",
                "Peroxiredoxin 4",
                "Peroxiredoxin 5"
            ],
            "mismatches": [
                "Vitamin E",
                "Vitamin C",
                "Glutathione",
                "Coenzyme Q10",
                "Superoxide dismutase",
                "Glutathione peroxidase",
                "Peroxiredoxin",
                "Thioredoxin",
                "Peroxiredoxin 6",
                "Peroxiredoxin 3",
                "Peroxiredoxin 8",
                "Peroxiredoxin 7",
                "Peroxiredoxin 10",
                "Peroxiredoxin 9",
                "Peroxiredoxin 11",
                "Peroxiredoxin 12",
                "Peroxiredoxin 13",
                "Peroxiredoxin 14",
                "Peroxiredoxin 15",
                "Peroxiredoxin 16",
                "Peroxiredoxin 17",
                "Peroxiredoxin 18",
                "Peroxiredoxin 19",
                "Peroxiredoxin 20",
                "Peroxiredoxin 21",
                "Peroxiredoxin 22",
                "Peroxiredoxin 23",
                "Peroxiredoxin 24",
                "Peroxiredoxin 25",
                "Peroxiredoxin 26",
                "Peroxiredoxin 27",
                "Peroxiredoxin 28",
                "Peroxiredoxin 29",
                "Peroxiredoxin 30"
            ],
            "true_referents": [
                "NAD(P)H dehydrogenase, quinone 1 (Nqo1)",
                "catalase (Cat)",
                "glutathione S-transferase, mu 7 (Gstm7)",
                "glutathione S-transferase, pi 1 (Gstp1)",
                "glutathione peroxidase 1 (Gpx1)",
                "glutathione peroxidase 4 (Gpx4)",
                "glutathione peroxidase 8 (putative) (Gpx8)",
                "glutathione reductase (Gsr)",
                "peroxiredoxin 1 (Prdx1)",
                "peroxiredoxin 2 (Prdx2)",
                "peroxiredoxin 4 (Prdx4)",
                "peroxiredoxin 5 (Prdx5)",
                "superoxide dismutase 1, soluble (Sod1)",
                "superoxide dismutase 2, mitochondrial (Sod2)",
                "superoxide dismutase 3, extracellular (Sod3)",
                "thioredoxin reductase 1 (Txnrd1)"
            ],
            "TP": 5,
            "FP": 34,
            "FN": 0
        }
    }
]