[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "superoxide anion (O2\u2022-)",
            "hydrogen peroxide (H2O2)",
            "hydroperoxyl radical (HOO\u2022)",
            "peroxynitrite anion (ONOO-)",
            "nitroxyl (HNO)",
            "diazene (N2H2)",
            "nitric oxide (NO)",
            "nitroxide radical (RNO\u2022)",
            "peroxymonocarbonate anion (CO3OO-)",
            "peroxodisulfate anion (S2O82-)",
            "peroxymonosulfate anion (HSO5-)",
            "peroxynitrite (ONOOH)",
            "hypochlorite anion (ClO-)",
            "hypobromite anion (BrO-)",
            "hypochlorous acid (HOCl)",
            "hypobromous acid (HOBr)",
            "chlorite anion (ClO2-)",
            "bromite anion (BrO2-)",
            "chlorous acid (HClO2)",
            "bromous acid (HBrO2)",
            "chlorite (ClO2)",
            "bromite (BrO2)",
            "chlorous (ClO2)",
            "bromous (BrO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "superoxide anion (O2\u2022-)",
                "hydrogen peroxide (H2O2)",
                "hydroperoxyl radical (HOO\u2022)",
                "peroxynitrite anion (ONOO-)",
                "nitroxyl (HNO)",
                "diazene (N2H2)",
                "nitric oxide (NO)",
                "nitroxide radical (RNO\u2022)",
                "peroxymonocarbonate anion (CO3OO-)",
                "peroxodisulfate anion (S2O82-)",
                "peroxymonosulfate anion (HSO5-)",
                "peroxynitrite (ONOOH)",
                "hypochlorite anion (ClO-)",
                "hypobromite anion (BrO-)",
                "hypochlorous acid (HOCl)",
                "hypobromous acid (HOBr)",
                "chlorite anion (ClO2-)",
                "bromite anion (BrO2-)",
                "chlorous acid (HClO2)",
                "bromous acid (HBrO2)",
                "chlorite (ClO2)",
                "bromite (BrO2)",
                "chlorous (ClO2)",
                "bromous (BrO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "bromite (BrO2)",
                "bromite anion (BrO2-)",
                "bromous (BrO2)",
                "bromous acid (HBrO2)",
                "chlorite (ClO2)",
                "chlorite anion (ClO2-)",
                "chlorous (ClO2)",
                "chlorous acid (HClO2)",
                "diazene (N2H2)",
                "hydrogen peroxide (H2O2)",
                "hydroperoxyl radical (HOO\u2022)",
                "hypobromite anion (BrO-)",
                "hypobromous acid (HOBr)",
                "hypochlorite anion (ClO-)",
                "hypochlorous acid (HOCl)",
                "nitric oxide (NO)",
                "nitroxide radical (RNO\u2022)",
                "nitroxyl (HNO)",
                "peroxodisulfate anion (S2O82-)",
                "peroxymonocarbonate anion (CO3OO-)",
                "peroxymonosulfate anion (HSO5-)",
                "peroxynitrite (ONOOH)",
                "peroxynitrite anion (ONOO-)",
                "superoxide anion (O2\u2022-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O2\u2022\u2212)",
            "Hydroxyl radical (\u2022OH)",
            "Peroxyl radical (ROO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Nitric oxide (\u2022NO)",
            "Peroxynitrite (ONOO\u2212)",
            "Hydroperoxyl radical (HO2\u2022)",
            "Singlet oxygen (^1O2)",
            "Triplet oxygen (3O2)",
            "Chlorine radical (Cl\u2022)",
            "Hydrogen peroxide (H2O2)",
            "Ozone (O3)",
            "Hydroperoxide ion (HO2\u2212)",
            "Superoxide dismutase (SOD)",
            "Catalase",
            "Glutathione peroxidase",
            "Xanthine oxidase",
            "NADPH oxidase",
            "Cytochrome P450 reductase",
            "Myeloperoxidase",
            "Nitric oxide synthase",
            "Manganese superoxide dismutase (MnSOD)",
            "Copper-zinc superoxide dismutase (CuZnSOD)",
            "Iron superoxide dismutase (FeSOD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O2\u2022\u2212)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxyl radical (ROO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Nitric oxide (\u2022NO)",
                "Peroxynitrite (ONOO\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Singlet oxygen (^1O2)",
                "Triplet oxygen (3O2)",
                "Chlorine radical (Cl\u2022)",
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Hydroperoxide ion (HO2\u2212)",
                "Superoxide dismutase (SOD)",
                "Catalase",
                "Glutathione peroxidase",
                "Xanthine oxidase",
                "NADPH oxidase",
                "Cytochrome P450 reductase",
                "Myeloperoxidase",
                "Nitric oxide synthase",
                "Manganese superoxide dismutase (MnSOD)",
                "Copper-zinc superoxide dismutase (CuZnSOD)",
                "Iron superoxide dismutase (FeSOD)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxyl radical (RO\u2022)",
                "Catalase",
                "Chlorine radical (Cl\u2022)",
                "Copper-zinc superoxide dismutase (CuZnSOD)",
                "Cytochrome P450 reductase",
                "Glutathione peroxidase",
                "Hydrogen peroxide (H2O2)",
                "Hydroperoxide ion (HO2\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Iron superoxide dismutase (FeSOD)",
                "Manganese superoxide dismutase (MnSOD)",
                "Myeloperoxidase",
                "NADPH oxidase",
                "Nitric oxide (\u2022NO)",
                "Nitric oxide synthase",
                "Ozone (O3)",
                "Peroxyl radical (ROO\u2022)",
                "Peroxynitrite (ONOO\u2212)",
                "Singlet oxygen (^1O2)",
                "Superoxide anion (O2\u2022\u2212)",
                "Superoxide dismutase (SOD)",
                "Triplet oxygen (3O2)",
                "Xanthine oxidase"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2212)",
            "Superoxide anion",
            "Superoxide radical",
            "O2\u2212",
            "Molecular oxygen radical anion",
            "Oxygen radical anion",
            "Singlet superoxide",
            "Triplet superoxide",
            "Superoxide ion",
            "Dioxygen radical anion",
            "O2\u2022\u2212",
            "Oxygen superoxide",
            "Superoxide anion radical",
            "Oxygen radical",
            "Oxygen superoxide anion",
            "Oxygen superoxide ion",
            "Superoxide radical anion",
            "Dioxygen radical anion",
            "O2\u2212\u2022",
            "Oxygen superoxide radical",
            "Oxygen superoxide anion radical",
            "Superoxide ion radical",
            "Oxygen superoxide ion radical",
            "Oxygen superoxide anion radical",
            "O2\u2212\u2022"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2212)",
                "Superoxide anion",
                "Superoxide radical",
                "O2\u2212",
                "Molecular oxygen radical anion",
                "Oxygen radical anion",
                "Singlet superoxide",
                "Triplet superoxide",
                "Superoxide ion",
                "Dioxygen radical anion",
                "O2\u2022\u2212",
                "Oxygen superoxide",
                "Superoxide anion radical",
                "Oxygen radical",
                "Oxygen superoxide anion",
                "Oxygen superoxide ion",
                "Superoxide radical anion",
                "O2\u2212\u2022",
                "Oxygen superoxide radical",
                "Oxygen superoxide anion radical",
                "Superoxide ion radical",
                "Oxygen superoxide ion radical"
            ],
            "mismatches": [],
            "true_referents": [
                "Dioxygen radical anion",
                "Molecular oxygen radical anion",
                "O2\u2022\u2212",
                "O2\u2212",
                "O2\u2212\u2022",
                "Oxygen radical",
                "Oxygen radical anion",
                "Oxygen superoxide",
                "Oxygen superoxide anion",
                "Oxygen superoxide anion radical",
                "Oxygen superoxide ion",
                "Oxygen superoxide ion radical",
                "Oxygen superoxide radical",
                "Singlet superoxide",
                "Superoxide (O2\u2212)",
                "Superoxide anion",
                "Superoxide anion radical",
                "Superoxide ion",
                "Superoxide ion radical",
                "Superoxide radical",
                "Superoxide radical anion",
                "Triplet superoxide"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide radical anion (O\u2082\u207b)",
            "Hydrogen peroxide (H\u2082O\u2082)",
            "Hydroxyl radical (\u2022OH)",
            "Peroxyl radical (ROO\u2022)",
            "Hypochlorous acid (HOCl)",
            "Singlet oxygen (\u00b9O\u2082)",
            "Peroxynitrite (ONOO\u207b)",
            "Nitric oxide radical (\u2022NO)",
            "Nitrous oxide (N\u2082O)",
            "Nitrite ion (NO\u2082\u207b)",
            "Nitrate ion (NO\u2083\u207b)",
            "Ozone (O\u2083)",
            "Peroxisome-derived reactive oxygen species",
            "Myeloperoxidase-generated hypochlorous acid",
            "Phagocyte-derived superoxide",
            "Xanthine oxidase-generated superoxide",
            "Autoxidation of catecholamines-generated semiquinones",
            "Metal-catalyzed Haber-Weiss reaction products",
            "Fenton reaction-generated hydroxyl radical",
            "Radiation-induced water radiolysis products",
            "Ischemia-reperfusion injury-derived superoxide",
            "Mitochondrial electron transport chain leakage-derived superoxide",
            "Lipoxygenase-derived peroxyl radicals",
            "Cyclooxygenase-derived superoxide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide radical anion (O\u2082\u207b)",
                "Hydrogen peroxide (H\u2082O\u2082)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxyl radical (ROO\u2022)",
                "Hypochlorous acid (HOCl)",
                "Singlet oxygen (\u00b9O\u2082)",
                "Peroxynitrite (ONOO\u207b)",
                "Nitric oxide radical (\u2022NO)",
                "Nitrous oxide (N\u2082O)",
                "Nitrite ion (NO\u2082\u207b)",
                "Nitrate ion (NO\u2083\u207b)",
                "Ozone (O\u2083)",
                "Peroxisome-derived reactive oxygen species",
                "Myeloperoxidase-generated hypochlorous acid",
                "Phagocyte-derived superoxide",
                "Xanthine oxidase-generated superoxide",
                "Autoxidation of catecholamines-generated semiquinones",
                "Metal-catalyzed Haber-Weiss reaction products",
                "Fenton reaction-generated hydroxyl radical",
                "Radiation-induced water radiolysis products",
                "Ischemia-reperfusion injury-derived superoxide",
                "Mitochondrial electron transport chain leakage-derived superoxide",
                "Lipoxygenase-derived peroxyl radicals",
                "Cyclooxygenase-derived superoxide"
            ],
            "mismatches": [],
            "true_referents": [
                "Autoxidation of catecholamines-generated semiquinones",
                "Cyclooxygenase-derived superoxide",
                "Fenton reaction-generated hydroxyl radical",
                "Hydrogen peroxide (H\u2082O\u2082)",
                "Hydroxyl radical (\u2022OH)",
                "Hypochlorous acid (HOCl)",
                "Ischemia-reperfusion injury-derived superoxide",
                "Lipoxygenase-derived peroxyl radicals",
                "Metal-catalyzed Haber-Weiss reaction products",
                "Mitochondrial electron transport chain leakage-derived superoxide",
                "Myeloperoxidase-generated hypochlorous acid",
                "Nitrate ion (NO\u2083\u207b)",
                "Nitric oxide radical (\u2022NO)",
                "Nitrite ion (NO\u2082\u207b)",
                "Nitrous oxide (N\u2082O)",
                "Ozone (O\u2083)",
                "Peroxisome-derived reactive oxygen species",
                "Peroxyl radical (ROO\u2022)",
                "Peroxynitrite (ONOO\u207b)",
                "Phagocyte-derived superoxide",
                "Radiation-induced water radiolysis products",
                "Singlet oxygen (\u00b9O\u2082)",
                "Superoxide radical anion (O\u2082\u207b)",
                "Xanthine oxidase-generated superoxide"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O2-)",
            "Hydroperoxyl radical (HO2)",
            "Peroxyl radical (ROO)",
            "Alkoxyl radical (RO)",
            "Semiquinone radical (QH\u2022)",
            "Nitric oxide (NO\u2022)",
            "Nitroxide radical (R2NO\u2022)",
            "Thiyl radical (RS\u2022)",
            "Ascorbate radical (Asc\u2022\u2212)",
            "Phenoxyl radical (PhO\u2022)",
            "Aminyl radical (R2N\u2022)",
            "Carbon-centered radical (R\u2022)",
            "Allyl radical (C3H5\u2022)",
            "Benzyl radical (C6H5CH2\u2022)",
            "Aryl radical (Ar\u2022)",
            "Hydroxyl radical (OH\u2022)",
            "Perhydroxyl radical (HOO\u2022)",
            "Nitrogen dioxide radical (NO2\u2022)",
            "Sulfur dioxide radical (SO2\u2022)",
            "Thiosulfate radical (S2O3\u2022)",
            "Carboxylate radical (COO\u2022)",
            "Acetyl radical (CH3CO\u2022)",
            "Methoxyl radical (CH3O\u2022)",
            "Ethoxyl radical (C2H5O\u2022)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O2-)",
                "Hydroperoxyl radical (HO2)",
                "Peroxyl radical (ROO)",
                "Alkoxyl radical (RO)",
                "Semiquinone radical (QH\u2022)",
                "Nitric oxide (NO\u2022)",
                "Nitroxide radical (R2NO\u2022)",
                "Thiyl radical (RS\u2022)",
                "Ascorbate radical (Asc\u2022\u2212)",
                "Phenoxyl radical (PhO\u2022)",
                "Aminyl radical (R2N\u2022)",
                "Carbon-centered radical (R\u2022)",
                "Allyl radical (C3H5\u2022)",
                "Benzyl radical (C6H5CH2\u2022)",
                "Aryl radical (Ar\u2022)",
                "Hydroxyl radical (OH\u2022)",
                "Perhydroxyl radical (HOO\u2022)",
                "Nitrogen dioxide radical (NO2\u2022)",
                "Sulfur dioxide radical (SO2\u2022)",
                "Thiosulfate radical (S2O3\u2022)",
                "Carboxylate radical (COO\u2022)",
                "Acetyl radical (CH3CO\u2022)",
                "Methoxyl radical (CH3O\u2022)",
                "Ethoxyl radical (C2H5O\u2022)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl radical (CH3CO\u2022)",
                "Alkoxyl radical (RO)",
                "Allyl radical (C3H5\u2022)",
                "Aminyl radical (R2N\u2022)",
                "Aryl radical (Ar\u2022)",
                "Ascorbate radical (Asc\u2022\u2212)",
                "Benzyl radical (C6H5CH2\u2022)",
                "Carbon-centered radical (R\u2022)",
                "Carboxylate radical (COO\u2022)",
                "Ethoxyl radical (C2H5O\u2022)",
                "Hydroperoxyl radical (HO2)",
                "Hydroxyl radical (OH\u2022)",
                "Methoxyl radical (CH3O\u2022)",
                "Nitric oxide (NO\u2022)",
                "Nitrogen dioxide radical (NO2\u2022)",
                "Nitroxide radical (R2NO\u2022)",
                "Perhydroxyl radical (HOO\u2022)",
                "Peroxyl radical (ROO)",
                "Phenoxyl radical (PhO\u2022)",
                "Semiquinone radical (QH\u2022)",
                "Sulfur dioxide radical (SO2\u2022)",
                "Superoxide anion (O2-)",
                "Thiosulfate radical (S2O3\u2022)",
                "Thiyl radical (RS\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2022\u2212)",
            "Hydrogen Peroxide (H2O2)",
            "Singlet Oxygen (1O2)",
            "Ozone (O3)",
            "Peroxynitrite (ONOO\u2212)",
            "Dioxygenyl Ion (O2+)",
            "Hypochlorous Acid (HOCl)",
            "Aldose Sugar Peroxide (e.g., Glucose Peroxide)",
            "Phenol Radical (C6H5O\u2022)",
            "Lipid Hydroperoxide (e.g., Phospholipid Hydroperoxide)",
            "Benzoyl Peroxide (C14H10O4)",
            "Chlorite Ion (ClO2\u2212)",
            "Nitroxyl (HNO)",
            "Dichlorodifluoromethane (CCl2F2)",
            "Oxygen Radical (O\u2022)",
            "Carbonate Radical (CO3\u2022\u2212)",
            "Thiyl Radical (RSH\u2022)",
            "Sulfite Ion (SO3^2\u2212)",
            "Selenite Ion (SeO3^2\u2212)",
            "Nitrogen Dioxide (NO2)",
            "Acetyl Peroxide (C4H6O2)",
            "Cyanate Ion (OCN\u2212)",
            "Formyl Radical (HCO\u2022)",
            "Methyl Hydroperoxide (CH3OOH)",
            "Peracetic Acid (C2H4O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2022\u2212)",
                "Hydrogen Peroxide (H2O2)",
                "Singlet Oxygen (1O2)",
                "Ozone (O3)",
                "Peroxynitrite (ONOO\u2212)",
                "Dioxygenyl Ion (O2+)",
                "Hypochlorous Acid (HOCl)",
                "Aldose Sugar Peroxide (e.g., Glucose Peroxide)",
                "Phenol Radical (C6H5O\u2022)",
                "Lipid Hydroperoxide (e.g., Phospholipid Hydroperoxide)",
                "Benzoyl Peroxide (C14H10O4)",
                "Chlorite Ion (ClO2\u2212)",
                "Nitroxyl (HNO)",
                "Dichlorodifluoromethane (CCl2F2)",
                "Oxygen Radical (O\u2022)",
                "Carbonate Radical (CO3\u2022\u2212)",
                "Thiyl Radical (RSH\u2022)",
                "Sulfite Ion (SO3^2\u2212)",
                "Selenite Ion (SeO3^2\u2212)",
                "Nitrogen Dioxide (NO2)",
                "Acetyl Peroxide (C4H6O2)",
                "Cyanate Ion (OCN\u2212)",
                "Formyl Radical (HCO\u2022)",
                "Methyl Hydroperoxide (CH3OOH)"
            ],
            "mismatches": [
                "Peracetic Acid (C2H4O3)"
            ],
            "true_referents": [
                "Acetyl Peroxide (C4H6O2)",
                "Aldose Sugar Peroxide (e.g., Glucose Peroxide)",
                "Benzoyl Peroxide (C14H10O4)",
                "Carbonate Radical (CO3\u2022\u2212)",
                "Chlorite Ion (ClO2\u2212)",
                "Cyanate Ion (OCN\u2212)",
                "Dichlorodifluoromethane (CCl2F2)",
                "Dioxygenyl Ion (O2+)",
                "Formyl Radical (HCO\u2022)",
                "Hydrogen Peroxide (H2O2)",
                "Hypochlorous Acid (HOCl)",
                "Lipid Hydroperoxide (e.g., Phospholipid Hydroperoxide)",
                "Methyl Hydroperoxide (CH3OOH)",
                "Nitrogen Dioxide (NO2)",
                "Nitroxyl (HNO)",
                "Oxygen Radical (O\u2022)",
                "Ozone (O3)",
                "Peroxynitrite (ONOO\u2212)",
                "Phenol Radical (C6H5O\u2022)",
                "Selenite Ion (SeO3^2\u2212)",
                "Singlet Oxygen (1O2)",
                "Sulfite Ion (SO3^2\u2212)",
                "Superoxide (O2\u2022\u2212)",
                "Thiyl Radical (RSH\u2022)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2212)",
            "Hydrogen peroxide (H2O2)",
            "Hydroxyl radical (\u2022OH)",
            "Peroxyl radical (ROO\u2022)",
            "Hydroperoxyl (HO2\u2022)",
            "Organic hydroperoxide (ROOH)",
            "Oxygen radical (O\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Peroxide anion (O22\u2212)",
            "Hydroperoxyl radical (HO2\u2022)",
            "Superoxide anion radical (O2\u2212\u2022)",
            "Hydroxide ion (OH\u2212)",
            "Hydrogen superoxide (HO2)",
            "Hydroxy radical (HO\u2022)",
            "Oxygen anion (O\u2212)",
            "Hydrogen peroxide anion (HO2\u2212)",
            "Hydrogen superoxide anion (HO2\u2212)",
            "Alkylperoxyl radical (RO2\u2022)",
            "Organic peroxide (R2O2)",
            "Hydrogen peroxide cation (H2O2+)",
            "Hydroperoxyl cation (HO2+)",
            "Superoxide cation (O2\u2212+)",
            "Hydroxyl cation (OH+)",
            "Alkoxyl cation (RO+)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2212)",
                "Hydrogen peroxide (H2O2)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxyl radical (ROO\u2022)",
                "Hydroperoxyl (HO2\u2022)",
                "Organic hydroperoxide (ROOH)",
                "Oxygen radical (O\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Peroxide anion (O22\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Superoxide anion radical (O2\u2212\u2022)",
                "Hydroxide ion (OH\u2212)",
                "Hydrogen superoxide (HO2)",
                "Hydroxy radical (HO\u2022)",
                "Oxygen anion (O\u2212)",
                "Hydrogen peroxide anion (HO2\u2212)",
                "Hydrogen superoxide anion (HO2\u2212)",
                "Alkylperoxyl radical (RO2\u2022)",
                "Organic peroxide (R2O2)",
                "Hydrogen peroxide cation (H2O2+)",
                "Hydroperoxyl cation (HO2+)",
                "Superoxide cation (O2\u2212+)",
                "Hydroxyl cation (OH+)",
                "Alkoxyl cation (RO+)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxyl cation (RO+)",
                "Alkoxyl radical (RO\u2022)",
                "Alkylperoxyl radical (RO2\u2022)",
                "Hydrogen peroxide (H2O2)",
                "Hydrogen peroxide anion (HO2\u2212)",
                "Hydrogen peroxide cation (H2O2+)",
                "Hydrogen superoxide (HO2)",
                "Hydrogen superoxide anion (HO2\u2212)",
                "Hydroperoxyl (HO2\u2022)",
                "Hydroperoxyl cation (HO2+)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Hydroxide ion (OH\u2212)",
                "Hydroxy radical (HO\u2022)",
                "Hydroxyl cation (OH+)",
                "Hydroxyl radical (\u2022OH)",
                "Organic hydroperoxide (ROOH)",
                "Organic peroxide (R2O2)",
                "Oxygen anion (O\u2212)",
                "Oxygen radical (O\u2022)",
                "Peroxide anion (O22\u2212)",
                "Peroxyl radical (ROO\u2022)",
                "Superoxide (O2\u2212)",
                "Superoxide anion radical (O2\u2212\u2022)",
                "Superoxide cation (O2\u2212+)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide ion (O2-)",
            "Superoxide radical (O2)",
            "Peroxyl radical (ROO)",
            "Hydroperoxyl radical (HO2)",
            "Nitric oxide (NO)",
            "Nitric oxide radical (NO\u2022)",
            "Peroxynitrite (ONOO-)",
            "Hydrogen peroxide (H2O2)",
            "Hydroxyl radical (\u2022OH)",
            "Hydroxyl anion (OH-)",
            "Carbon monoxide (CO)",
            "Carbon dioxide radical (CO2\u2022)",
            "Carbon dioxide anion (CO2-)",
            "Sulfur dioxide radical (SO2\u2022)",
            "Sulfur dioxide anion (SO2-)",
            "Sulfur trioxide radical (SO3\u2022)",
            "Sulfur trioxide anion (SO3-)",
            "Hydrogen sulfide (H2S)",
            "Hydrogen sulfide radical (HS\u2022)",
            "Hydrogen sulfide anion (HS-)",
            "Hydrogen sulfite ion (HSO3-)",
            "Hydrogen disulfide (H2S2)",
            "Hydrogen disulfide anion (H2S2-)",
            "Hydrogen persulfide (H2S2)",
            "Hydrogen persulfide anion (H2S2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide ion (O2-)",
                "Superoxide radical (O2)",
                "Peroxyl radical (ROO)",
                "Hydroperoxyl radical (HO2)",
                "Nitric oxide (NO)",
                "Nitric oxide radical (NO\u2022)",
                "Peroxynitrite (ONOO-)",
                "Hydrogen peroxide (H2O2)",
                "Hydroxyl radical (\u2022OH)",
                "Hydroxyl anion (OH-)",
                "Carbon monoxide (CO)",
                "Carbon dioxide radical (CO2\u2022)",
                "Carbon dioxide anion (CO2-)",
                "Sulfur dioxide radical (SO2\u2022)",
                "Sulfur dioxide anion (SO2-)",
                "Sulfur trioxide radical (SO3\u2022)",
                "Sulfur trioxide anion (SO3-)",
                "Hydrogen sulfide (H2S)",
                "Hydrogen sulfide radical (HS\u2022)",
                "Hydrogen sulfide anion (HS-)",
                "Hydrogen sulfite ion (HSO3-)",
                "Hydrogen disulfide (H2S2)",
                "Hydrogen disulfide anion (H2S2-)",
                "Hydrogen persulfide (H2S2)"
            ],
            "mismatches": [
                "Hydrogen persulfide anion (H2S2-)"
            ],
            "true_referents": [
                "Carbon dioxide anion (CO2-)",
                "Carbon dioxide radical (CO2\u2022)",
                "Carbon monoxide (CO)",
                "Hydrogen disulfide (H2S2)",
                "Hydrogen disulfide anion (H2S2-)",
                "Hydrogen peroxide (H2O2)",
                "Hydrogen persulfide (H2S2)",
                "Hydrogen sulfide (H2S)",
                "Hydrogen sulfide anion (HS-)",
                "Hydrogen sulfide radical (HS\u2022)",
                "Hydrogen sulfite ion (HSO3-)",
                "Hydroperoxyl radical (HO2)",
                "Hydroxyl anion (OH-)",
                "Hydroxyl radical (\u2022OH)",
                "Nitric oxide (NO)",
                "Nitric oxide radical (NO\u2022)",
                "Peroxyl radical (ROO)",
                "Peroxynitrite (ONOO-)",
                "Sulfur dioxide anion (SO2-)",
                "Sulfur dioxide radical (SO2\u2022)",
                "Sulfur trioxide anion (SO3-)",
                "Sulfur trioxide radical (SO3\u2022)",
                "Superoxide ion (O2-)",
                "Superoxide radical (O2)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O\u2082\u207b)",
            "Hydroperoxyl radical (HO\u2082)",
            "Potassium superoxide (KO\u2082)",
            "Sodium superoxide (NaO\u2082)",
            "Lithium superoxide (LiO\u2082)",
            "Rubidium superoxide (RbO\u2082)",
            "Cesium superoxide (CsO\u2082)",
            "Barium superoxide (BaO\u2082)",
            "Calcium superoxide (CaO\u2082)",
            "Magnesium superoxide (MgO\u2082)",
            "Strontium superoxide (SrO\u2082)",
            "Ammonium superoxide (NH\u2084\u207aO\u2082\u207b)",
            "Tetramethylammonium superoxide (TMAO\u2082)",
            "Triphenylmethyl superoxide",
            "Diethylammonium superoxide",
            "Phenylmethyl superoxide",
            "Trimethylsilyl superoxide",
            "Potassium bis(superoxide) complex",
            "Cesium bis(superoxide) complex",
            "Sodium bis(superoxide) complex",
            "Lithium bis(superoxide) complex",
            "Rubidium bis(superoxide) complex",
            "Methyl superoxide",
            "Ethyl superoxide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O\u2082\u207b)",
                "Hydroperoxyl radical (HO\u2082)",
                "Potassium superoxide (KO\u2082)",
                "Sodium superoxide (NaO\u2082)",
                "Lithium superoxide (LiO\u2082)",
                "Rubidium superoxide (RbO\u2082)",
                "Cesium superoxide (CsO\u2082)",
                "Barium superoxide (BaO\u2082)",
                "Calcium superoxide (CaO\u2082)",
                "Magnesium superoxide (MgO\u2082)",
                "Strontium superoxide (SrO\u2082)",
                "Ammonium superoxide (NH\u2084\u207aO\u2082\u207b)",
                "Tetramethylammonium superoxide (TMAO\u2082)",
                "Triphenylmethyl superoxide",
                "Diethylammonium superoxide",
                "Phenylmethyl superoxide",
                "Trimethylsilyl superoxide",
                "Potassium bis(superoxide) complex",
                "Cesium bis(superoxide) complex",
                "Sodium bis(superoxide) complex",
                "Lithium bis(superoxide) complex",
                "Rubidium bis(superoxide) complex",
                "Methyl superoxide",
                "Ethyl superoxide"
            ],
            "mismatches": [],
            "true_referents": [
                "Ammonium superoxide (NH\u2084\u207aO\u2082\u207b)",
                "Barium superoxide (BaO\u2082)",
                "Calcium superoxide (CaO\u2082)",
                "Cesium bis(superoxide) complex",
                "Cesium superoxide (CsO\u2082)",
                "Diethylammonium superoxide",
                "Ethyl superoxide",
                "Hydroperoxyl radical (HO\u2082)",
                "Lithium bis(superoxide) complex",
                "Lithium superoxide (LiO\u2082)",
                "Magnesium superoxide (MgO\u2082)",
                "Methyl superoxide",
                "Phenylmethyl superoxide",
                "Potassium bis(superoxide) complex",
                "Potassium superoxide (KO\u2082)",
                "Rubidium bis(superoxide) complex",
                "Rubidium superoxide (RbO\u2082)",
                "Sodium bis(superoxide) complex",
                "Sodium superoxide (NaO\u2082)",
                "Strontium superoxide (SrO\u2082)",
                "Superoxide anion (O\u2082\u207b)",
                "Tetramethylammonium superoxide (TMAO\u2082)",
                "Trimethylsilyl superoxide",
                "Triphenylmethyl superoxide"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O2\u2022\u2212)",
            "Hydroperoxyl radical (HO2\u2022)",
            "Potassium superoxide (KO2)",
            "Sodium superoxide (NaO2)",
            "Calcium superoxide (Ca(O2)2)",
            "Rubidium superoxide (RbO2)",
            "Cesium superoxide (CsO2)",
            "Barium superoxide (BaO2)",
            "Tetrabutylammonium superoxide ((C4H9)4NO2)",
            "Tetramethylammonium superoxide ((CH3)4NO2)",
            "Lithium superoxide (LiO2)",
            "Magnesium superoxide (Mg(O2)2)",
            "Strontium superoxide (Sr(O2)2)",
            "Xenon superoxide (XeO2)",
            "Copper superoxide (CuO2)",
            "Iron superoxide (FeO2)",
            "Manganese superoxide (MnO2)",
            "Nickel superoxide (NiO2)",
            "Cobalt superoxide (CoO2)",
            "Zinc superoxide (ZnO2)",
            "Silver superoxide (AgO2)",
            "Gold superoxide (AuO2)",
            "Platinum superoxide (PtO2)",
            "Palladium superoxide (PdO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O2\u2022\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Potassium superoxide (KO2)",
                "Sodium superoxide (NaO2)",
                "Calcium superoxide (Ca(O2)2)",
                "Rubidium superoxide (RbO2)",
                "Cesium superoxide (CsO2)",
                "Barium superoxide (BaO2)",
                "Tetrabutylammonium superoxide ((C4H9)4NO2)",
                "Tetramethylammonium superoxide ((CH3)4NO2)",
                "Lithium superoxide (LiO2)",
                "Magnesium superoxide (Mg(O2)2)",
                "Strontium superoxide (Sr(O2)2)",
                "Xenon superoxide (XeO2)",
                "Copper superoxide (CuO2)",
                "Iron superoxide (FeO2)",
                "Manganese superoxide (MnO2)",
                "Nickel superoxide (NiO2)",
                "Cobalt superoxide (CoO2)",
                "Zinc superoxide (ZnO2)",
                "Silver superoxide (AgO2)",
                "Gold superoxide (AuO2)",
                "Platinum superoxide (PtO2)",
                "Palladium superoxide (PdO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Barium superoxide (BaO2)",
                "Calcium superoxide (Ca(O2)2)",
                "Cesium superoxide (CsO2)",
                "Cobalt superoxide (CoO2)",
                "Copper superoxide (CuO2)",
                "Gold superoxide (AuO2)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Iron superoxide (FeO2)",
                "Lithium superoxide (LiO2)",
                "Magnesium superoxide (Mg(O2)2)",
                "Manganese superoxide (MnO2)",
                "Nickel superoxide (NiO2)",
                "Palladium superoxide (PdO2)",
                "Platinum superoxide (PtO2)",
                "Potassium superoxide (KO2)",
                "Rubidium superoxide (RbO2)",
                "Silver superoxide (AgO2)",
                "Sodium superoxide (NaO2)",
                "Strontium superoxide (Sr(O2)2)",
                "Superoxide anion (O2\u2022\u2212)",
                "Tetrabutylammonium superoxide ((C4H9)4NO2)",
                "Tetramethylammonium superoxide ((CH3)4NO2)",
                "Xenon superoxide (XeO2)",
                "Zinc superoxide (ZnO2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide anion radical (O2\u2022-)",
            "Hydroperoxyl radical (HO2\u2022)",
            "Hydrogen peroxide (H2O2)",
            "Hydroxyl radical (\u2022OH)",
            "Singlet oxygen (1O2)",
            "Ozone (O3)",
            "Hypochlorite ion (OCl-)",
            "Hypobromite ion (OBr-)",
            "Hypoiodite ion (OI-)",
            "Peroxynitrite (ONOO-)",
            "Peroxynitrous acid (ONOOH)",
            "Nitric oxide (NO)",
            "Nitrogen dioxide (NO2)",
            "Peroxyl radicals (ROO\u2022)",
            "Alkoxyl radicals (RO\u2022)",
            "Hydroperoxides (ROOH)",
            "Organic peroxides (ROOR)",
            "Semiquinone radicals (Q\u2022-)",
            "Peroxomonocarbonate (HCO4-)",
            "Peroxodicarbonate (C2O62-)",
            "Peroxomonosulfate (HSO5-)",
            "Peroxodisulfate (S2O82-)",
            "Peroxomonophosphate (H2PO5-)",
            "Peroxodiphosphate (P2O84-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion radical (O2\u2022-)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Hydrogen peroxide (H2O2)",
                "Hydroxyl radical (\u2022OH)",
                "Singlet oxygen (1O2)",
                "Ozone (O3)",
                "Hypochlorite ion (OCl-)",
                "Hypobromite ion (OBr-)",
                "Hypoiodite ion (OI-)",
                "Peroxynitrite (ONOO-)",
                "Peroxynitrous acid (ONOOH)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Peroxyl radicals (ROO\u2022)",
                "Alkoxyl radicals (RO\u2022)",
                "Hydroperoxides (ROOH)",
                "Organic peroxides (ROOR)",
                "Semiquinone radicals (Q\u2022-)",
                "Peroxomonocarbonate (HCO4-)",
                "Peroxodicarbonate (C2O62-)",
                "Peroxomonosulfate (HSO5-)",
                "Peroxodisulfate (S2O82-)",
                "Peroxomonophosphate (H2PO5-)",
                "Peroxodiphosphate (P2O84-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxyl radicals (RO\u2022)",
                "Hydrogen peroxide (H2O2)",
                "Hydroperoxides (ROOH)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Hypobromite ion (OBr-)",
                "Hypochlorite ion (OCl-)",
                "Hypoiodite ion (OI-)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Organic peroxides (ROOR)",
                "Ozone (O3)",
                "Peroxodicarbonate (C2O62-)",
                "Peroxodiphosphate (P2O84-)",
                "Peroxodisulfate (S2O82-)",
                "Peroxomonocarbonate (HCO4-)",
                "Peroxomonophosphate (H2PO5-)",
                "Peroxomonosulfate (HSO5-)",
                "Peroxyl radicals (ROO\u2022)",
                "Peroxynitrite (ONOO-)",
                "Peroxynitrous acid (ONOOH)",
                "Semiquinone radicals (Q\u2022-)",
                "Singlet oxygen (1O2)",
                "Superoxide anion radical (O2\u2022-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide radical (O2\u2022\u2212)",
            "Hydroperoxyl radical (HO2\u2022)",
            "Perhydroxyl radical (H2O2\u2022\u2212)",
            "Alkoxyl radical (RO\u2022)",
            "Peroxyl radical (ROO\u2022)",
            "Hydroxyl radical (\u2022OH)",
            "Singlet oxygen (1O2)",
            "Ozonide radical ion (O3\u2022\u2212)",
            "Carbonate radical anion (CO3\u2022\u2212)",
            "Nitrogen dioxide radical (\u2022NO2)",
            "Sulfate radical anion (SO4\u2022\u2212)",
            "Trichloromethylperoxyl radical (CCl3OO\u2022)",
            "Phosphate radical (PO4\u20222\u2212)",
            "Hypochlorite radical anion (ClO\u2022\u2212)",
            "Nitrate radical (NO3\u2022)",
            "Chromate radical (CrO4\u2022\u2212)",
            "Dichromate radical anion (Cr2O7\u2022\u2212)",
            "Permanganate radical (MnO4\u2022\u2212)",
            "Azide radical (N3\u2022)",
            "Nitroxyl radical (HNO)",
            "Nitrosyl hydride radical (H2NO\u2022)",
            "Sulfonyl radical (RSO2\u2022)",
            "Thiyl radical (RS\u2022)",
            "Selenoxyl radical (RSe\u2022)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide radical (O2\u2022\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Perhydroxyl radical (H2O2\u2022\u2212)",
                "Alkoxyl radical (RO\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Singlet oxygen (1O2)",
                "Ozonide radical ion (O3\u2022\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Nitrogen dioxide radical (\u2022NO2)",
                "Sulfate radical anion (SO4\u2022\u2212)",
                "Trichloromethylperoxyl radical (CCl3OO\u2022)",
                "Phosphate radical (PO4\u20222\u2212)",
                "Hypochlorite radical anion (ClO\u2022\u2212)",
                "Nitrate radical (NO3\u2022)",
                "Chromate radical (CrO4\u2022\u2212)",
                "Dichromate radical anion (Cr2O7\u2022\u2212)",
                "Permanganate radical (MnO4\u2022\u2212)",
                "Azide radical (N3\u2022)",
                "Nitroxyl radical (HNO)",
                "Nitrosyl hydride radical (H2NO\u2022)",
                "Sulfonyl radical (RSO2\u2022)",
                "Thiyl radical (RS\u2022)",
                "Selenoxyl radical (RSe\u2022)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxyl radical (RO\u2022)",
                "Azide radical (N3\u2022)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Chromate radical (CrO4\u2022\u2212)",
                "Dichromate radical anion (Cr2O7\u2022\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Hypochlorite radical anion (ClO\u2022\u2212)",
                "Nitrate radical (NO3\u2022)",
                "Nitrogen dioxide radical (\u2022NO2)",
                "Nitrosyl hydride radical (H2NO\u2022)",
                "Nitroxyl radical (HNO)",
                "Ozonide radical ion (O3\u2022\u2212)",
                "Perhydroxyl radical (H2O2\u2022\u2212)",
                "Permanganate radical (MnO4\u2022\u2212)",
                "Peroxyl radical (ROO\u2022)",
                "Phosphate radical (PO4\u20222\u2212)",
                "Selenoxyl radical (RSe\u2022)",
                "Singlet oxygen (1O2)",
                "Sulfate radical anion (SO4\u2022\u2212)",
                "Sulfonyl radical (RSO2\u2022)",
                "Superoxide radical (O2\u2022\u2212)",
                "Thiyl radical (RS\u2022)",
                "Trichloromethylperoxyl radical (CCl3OO\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2-)",
            "Hydrogen peroxide (H2O2)",
            "Hydroxyl radical (OH\u2022)",
            "Peroxynitrite (ONOO-)",
            "Hypochlorous acid (HOCl)",
            "Ozone (O3)",
            "Singlet oxygen (1O2)",
            "Nitric oxide (NO\u2022)",
            "Nitrogen dioxide (NO2\u2022)",
            "Lipid peroxyl radical (LOO\u2022)",
            "Lipid hydroperoxide (LOOH)",
            "Malondialdehyde (MDA)",
            "4-Hydroxynonenal (4-HNE)",
            "Glutathione peroxidase (GPx)",
            "Superoxide dismutase (SOD)",
            "Catalase (CAT)",
            "Thioredoxin (Trx)",
            "Peroxiredoxin (Prx)",
            "Glutathione (GSH)",
            "Ascorbic acid (Vitamin C)",
            "\u03b1-Tocopherol (Vitamin E)",
            "Carotenoids",
            "Flavonoids",
            "Metallothioneins (MTs)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2-)",
                "Hydrogen peroxide (H2O2)",
                "Hydroxyl radical (OH\u2022)",
                "Peroxynitrite (ONOO-)",
                "Hypochlorous acid (HOCl)",
                "Ozone (O3)",
                "Singlet oxygen (1O2)",
                "Nitric oxide (NO\u2022)",
                "Nitrogen dioxide (NO2\u2022)",
                "Lipid peroxyl radical (LOO\u2022)",
                "Lipid hydroperoxide (LOOH)",
                "Malondialdehyde (MDA)",
                "4-Hydroxynonenal (4-HNE)",
                "Glutathione peroxidase (GPx)",
                "Superoxide dismutase (SOD)",
                "Catalase (CAT)",
                "Thioredoxin (Trx)",
                "Peroxiredoxin (Prx)",
                "Glutathione (GSH)",
                "Ascorbic acid (Vitamin C)",
                "\u03b1-Tocopherol (Vitamin E)",
                "Carotenoids",
                "Flavonoids",
                "Metallothioneins (MTs)"
            ],
            "mismatches": [],
            "true_referents": [
                "4-Hydroxynonenal (4-HNE)",
                "Ascorbic acid (Vitamin C)",
                "Carotenoids",
                "Catalase (CAT)",
                "Flavonoids",
                "Glutathione (GSH)",
                "Glutathione peroxidase (GPx)",
                "Hydrogen peroxide (H2O2)",
                "Hydroxyl radical (OH\u2022)",
                "Hypochlorous acid (HOCl)",
                "Lipid hydroperoxide (LOOH)",
                "Lipid peroxyl radical (LOO\u2022)",
                "Malondialdehyde (MDA)",
                "Metallothioneins (MTs)",
                "Nitric oxide (NO\u2022)",
                "Nitrogen dioxide (NO2\u2022)",
                "Ozone (O3)",
                "Peroxiredoxin (Prx)",
                "Peroxynitrite (ONOO-)",
                "Singlet oxygen (1O2)",
                "Superoxide (O2-)",
                "Superoxide dismutase (SOD)",
                "Thioredoxin (Trx)",
                "\u03b1-Tocopherol (Vitamin E)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2022-)",
            "Hydroxyl radical (\u2022OH)",
            "Peroxide (ROOH)",
            "Dihydroxide (R(OH)2)",
            "Nitric oxide (NO)",
            "Nitrite (NO2-)",
            "Nitrate (NO3-)",
            "Peroxynitrite (ONOO-)",
            "Peroxynitrate (ONOO-)",
            "Dioxidane (H2O2)",
            "Hydrogen peroxide (H2O2)",
            "Oxide radical (O\u2022)",
            "Superoxide dismutase (SOD)",
            "Hydroxyl radical scavenger (HRS)",
            "Peroxide scavenger (PS)",
            "Dihydroxide scavenger (DHS)",
            "Nitric oxide synthase (NOS)",
            "Nitrite reductase (NR)",
            "Nitrate reductase (NR)",
            "Peroxynitrite reductase (PNR)",
            "Peroxynitrate reductase (PNR)",
            "Dioxidane reductase (DR)",
            "Hydrogen peroxide reductase (HPR)",
            "Oxide radical scavenger (ORS)",
            "Superoxide dismutase (SOD)",
            "Hydroxyl radical scavenger (HRS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2022-)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxide (ROOH)",
                "Dihydroxide (R(OH)2)",
                "Nitric oxide (NO)",
                "Nitrite (NO2-)",
                "Nitrate (NO3-)",
                "Peroxynitrite (ONOO-)",
                "Peroxynitrate (ONOO-)",
                "Dioxidane (H2O2)",
                "Hydrogen peroxide (H2O2)",
                "Oxide radical (O\u2022)",
                "Superoxide dismutase (SOD)",
                "Hydroxyl radical scavenger (HRS)",
                "Peroxide scavenger (PS)",
                "Dihydroxide scavenger (DHS)",
                "Nitric oxide synthase (NOS)",
                "Nitrite reductase (NR)",
                "Nitrate reductase (NR)",
                "Peroxynitrite reductase (PNR)",
                "Peroxynitrate reductase (PNR)",
                "Dioxidane reductase (DR)",
                "Hydrogen peroxide reductase (HPR)",
                "Oxide radical scavenger (ORS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Dihydroxide (R(OH)2)",
                "Dihydroxide scavenger (DHS)",
                "Dioxidane (H2O2)",
                "Dioxidane reductase (DR)",
                "Hydrogen peroxide (H2O2)",
                "Hydrogen peroxide reductase (HPR)",
                "Hydroxyl radical (\u2022OH)",
                "Hydroxyl radical scavenger (HRS)",
                "Nitrate (NO3-)",
                "Nitrate reductase (NR)",
                "Nitric oxide (NO)",
                "Nitric oxide synthase (NOS)",
                "Nitrite (NO2-)",
                "Nitrite reductase (NR)",
                "Oxide radical (O\u2022)",
                "Oxide radical scavenger (ORS)",
                "Peroxide (ROOH)",
                "Peroxide scavenger (PS)",
                "Peroxynitrate (ONOO-)",
                "Peroxynitrate reductase (PNR)",
                "Peroxynitrite (ONOO-)",
                "Peroxynitrite reductase (PNR)",
                "Superoxide (O2\u2022-)",
                "Superoxide dismutase (SOD)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            "superoxide (O2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "superoxide (O2-)"
            ],
            "mismatches": [],
            "true_referents": [
                "superoxide (O2-)"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "reactive oxygen species",
        "domain": "chemistry",
        "response": [
            [
                "Canonical name",
                "Oxygen"
            ],
            [
                "Canonical name",
                "Oxygen radical anion"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxygen",
                "Oxygen radical anion"
            ],
            "mismatches": [],
            "true_referents": [
                "[\"Canonical name\", \"Oxygen radical anion\"]",
                "[\"Canonical name\", \"Oxygen\"]"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    }
]