[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Superoxide anion (O2\u2022-)",
            "Nitric oxide (NO\u2022)",
            "Hypochlorous acid (HOCl)",
            "Reactive oxygen species (ROS)",
            "Dihydrogen trioxide (H2O3)",
            "Peroxynitrite (ONOO-)",
            "Alkoxy radicals (RO\u2022)",
            "Hydroxyl radicals (HO\u2022)",
            "Peroxynitrous acid (HOONO)",
            "Singlet oxygen (1O2)",
            "Lipid peroxides",
            "Metal-catalyzed oxidation products",
            "Chloramines",
            "Peroxynitrite anion (ONOO-)",
            "Ozone (O3)",
            "Hydrogen peroxide anion (HO2-)",
            "Peroxides (ROOR)",
            "Alkyl hydroperoxides (ROOH)",
            "Peroxy radicals (ROO\u2022)",
            "Chlorine (Cl2)",
            "Hydrogen peroxide dismutase (H2O2)",
            "Chlorine dioxide (ClO2)",
            "Oxygen (O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Singlet oxygen (1O2)",
                "Ozone (O3)",
                "Peroxides (ROOR)"
            ],
            "mismatches": [
                "Superoxide anion (O2\u2022-)",
                "Nitric oxide (NO\u2022)",
                "Hypochlorous acid (HOCl)",
                "Reactive oxygen species (ROS)",
                "Dihydrogen trioxide (H2O3)",
                "Peroxynitrite (ONOO-)",
                "Alkoxy radicals (RO\u2022)",
                "Hydroxyl radicals (HO\u2022)",
                "Peroxynitrous acid (HOONO)",
                "Lipid peroxides",
                "Metal-catalyzed oxidation products",
                "Chloramines",
                "Peroxynitrite anion (ONOO-)",
                "Hydrogen peroxide anion (HO2-)",
                "Alkyl hydroperoxides (ROOH)",
                "Peroxy radicals (ROO\u2022)",
                "Chlorine (Cl2)",
                "Hydrogen peroxide dismutase (H2O2)",
                "Chlorine dioxide (ClO2)",
                "Oxygen (O2)"
            ],
            "true_referents": [
                "chlorine peroxide",
                "chloroacetaldehyde",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "ergosterol peroxide",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peroxides",
                "singlet dioxygen",
                "sodium chlorite",
                "tert-butyl hydroperoxide",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H2O2)",
            "Superoxide Anion (O2\u2022\u2212)",
            "Hydroxyl Radical (\u2022OH)",
            "Nitric Oxide (NO)",
            "Chlorine (Cl2)",
            "Ozone (O3)",
            "Nitrogen Dioxide (NO2)",
            "Carbon Tetrachloride (CCl4)",
            "Chlorine Dioxide (ClO2)",
            "Peroxynitrite (ONOO\u2212)",
            "Singlet Oxygen (1O2)",
            "Reactive Oxygen Species (ROS)",
            "Reactive Nitrogen Species (RNS)",
            "Lipid Peroxidation Products (e.g., Malondialdehyde)",
            "Fenton Reaction (Fe2+ + H2O2)",
            "Hypochlorous Acid (HOCl)",
            "Hypobromous Acid (HOBr)",
            "Dichlorine Monoxide (Cl2O)",
            "Hydrogen Superoxide (HOO\u2022)",
            "Hydrogen Chloride (HCl) in the presence of O2",
            "Peroxynitrous Acid (OONOH)",
            "Methane Peroxide (CH3OOH)",
            "Nitrogen Tetroxide (N2O4)",
            "Sulfur Dioxide (SO2) in the presence of O2",
            "Hydrogen Bromide (HBr) in the presence of O2"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H2O2)",
                "Ozone (O3)",
                "Singlet Oxygen (1O2)",
                "Nitrogen Tetroxide (N2O4)"
            ],
            "mismatches": [
                "Superoxide Anion (O2\u2022\u2212)",
                "Hydroxyl Radical (\u2022OH)",
                "Nitric Oxide (NO)",
                "Chlorine (Cl2)",
                "Nitrogen Dioxide (NO2)",
                "Carbon Tetrachloride (CCl4)",
                "Chlorine Dioxide (ClO2)",
                "Peroxynitrite (ONOO\u2212)",
                "Reactive Oxygen Species (ROS)",
                "Reactive Nitrogen Species (RNS)",
                "Lipid Peroxidation Products (e.g., Malondialdehyde)",
                "Fenton Reaction (Fe2+ + H2O2)",
                "Hypochlorous Acid (HOCl)",
                "Hypobromous Acid (HOBr)",
                "Dichlorine Monoxide (Cl2O)",
                "Hydrogen Superoxide (HOO\u2022)",
                "Hydrogen Chloride (HCl) in the presence of O2",
                "Peroxynitrous Acid (OONOH)",
                "Methane Peroxide (CH3OOH)",
                "Sulfur Dioxide (SO2) in the presence of O2",
                "Hydrogen Bromide (HBr) in the presence of O2"
            ],
            "true_referents": [
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peroxides",
                "singlet dioxygen",
                "sodium chlorite",
                "sodium chromate",
                "trichloroacetaldehyde",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Superoxide (O2\u2212)",
            "Hypochlorous acid (HOCl)",
            "Nitric oxide (NO)",
            "Nitrosyl cation (NO+)",
            "Peroxynitrite (ONOO\u2212)",
            "Ozone (O3)",
            "Singlet oxygen (1O2)",
            "Hydroxyl radical (\u00b7OH)",
            "Chlorine dioxide (ClO2)",
            "Chlorine (Cl2)",
            "Oxygen (O2)",
            "Peroxide anion (O22\u2212)",
            "Hydrogen trioxide (H2O3)",
            "Nitrous oxide (N2O)",
            "Nitric dioxide (NO2)",
            "Dioxygenyl cation (O2+)",
            "Chlorine monoxide (ClO)",
            "Chlorine dioxide anion (ClO2\u2212)",
            "Peroxynitrous acid (ONOOH)",
            "Dichlorine monoxide (Cl2O)",
            "Dinitrogen tetroxide (N2O4)",
            "Dinitrogen trioxide (N2O3)",
            "Oxygen difluoride (OF2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Singlet oxygen (1O2)",
                "Dinitrogen tetroxide (N2O4)"
            ],
            "mismatches": [
                "Superoxide (O2\u2212)",
                "Hypochlorous acid (HOCl)",
                "Nitric oxide (NO)",
                "Nitrosyl cation (NO+)",
                "Peroxynitrite (ONOO\u2212)",
                "Hydroxyl radical (\u00b7OH)",
                "Chlorine dioxide (ClO2)",
                "Chlorine (Cl2)",
                "Oxygen (O2)",
                "Peroxide anion (O22\u2212)",
                "Hydrogen trioxide (H2O3)",
                "Nitrous oxide (N2O)",
                "Nitric dioxide (NO2)",
                "Dioxygenyl cation (O2+)",
                "Chlorine monoxide (ClO)",
                "Chlorine dioxide anion (ClO2\u2212)",
                "Peroxynitrous acid (ONOOH)",
                "Dichlorine monoxide (Cl2O)",
                "Dinitrogen trioxide (N2O3)",
                "Oxygen difluoride (OF2)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromyl dichloride",
                "diethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "nitryl chloride",
                "ozone",
                "peroxides",
                "singlet dioxygen",
                "sodium chlorite",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H\u2082O\u2082)",
            "Superoxide Radical (O\u2082\u207b)",
            "Hydroxyl Radical (\u2022OH)",
            "Singlet Oxygen (\u00b9O\u2082)",
            "Peroxynitrite (ONOO\u207b)",
            "Hypochlorous Acid (HOCl)",
            "Nitric Oxide (NO)",
            "Nitrogen Dioxide (NO\u2082)",
            "Ozone (O\u2083)",
            "Peroxynitrite Anion (ONOO\u207b)",
            "Glutathione Disulfide (GSSG)",
            "Advanced Oxidation Protein Products (AOPP)",
            "Reactive Carbonyl Species (RCS)",
            "Myeloperoxidase-derived oxidants",
            "Fenton Reaction generated \u2022OH",
            "Metal Ions (Fe\u00b2\u207a, Cu\u207a)",
            "Semiquinone Radical",
            "Quinone",
            "Lipid Peroxyl Radical (LOO\u2022)",
            "Lipid Hydroperoxide (LOOH)",
            "4-Hydroxynonenal (4-HNE)",
            "Malondialdehyde (MDA)",
            "Prostaglandin Endoperoxides",
            "Activated Oxygen Species (ROS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H\u2082O\u2082)",
                "Singlet Oxygen (\u00b9O\u2082)",
                "Ozone (O\u2083)",
                "Prostaglandin Endoperoxides"
            ],
            "mismatches": [
                "Superoxide Radical (O\u2082\u207b)",
                "Hydroxyl Radical (\u2022OH)",
                "Peroxynitrite (ONOO\u207b)",
                "Hypochlorous Acid (HOCl)",
                "Nitric Oxide (NO)",
                "Nitrogen Dioxide (NO\u2082)",
                "Peroxynitrite Anion (ONOO\u207b)",
                "Glutathione Disulfide (GSSG)",
                "Advanced Oxidation Protein Products (AOPP)",
                "Reactive Carbonyl Species (RCS)",
                "Myeloperoxidase-derived oxidants",
                "Fenton Reaction generated \u2022OH",
                "Metal Ions (Fe\u00b2\u207a, Cu\u207a)",
                "Semiquinone Radical",
                "Quinone",
                "Lipid Peroxyl Radical (LOO\u2022)",
                "Lipid Hydroperoxide (LOOH)",
                "4-Hydroxynonenal (4-HNE)",
                "Malondialdehyde (MDA)",
                "Activated Oxygen Species (ROS)"
            ],
            "true_referents": [
                "(R)-alpha-campholenaldehyde",
                "(methylsulfanyl)acetaldehyde",
                "5alpha,8alpha-epidioxysterol",
                "9(11)-dehydroaxinysterol",
                "acetaldehyde",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "cumene hydroperoxide",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peroxides",
                "prostaglandin G2",
                "prostaglandin H3",
                "prostaglandins G",
                "prostaglandins H",
                "singlet dioxygen",
                "tert-butyl hydroperoxide",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Ozone (O3)",
            "Hydrogen Peroxide (H2O2)",
            "Nitric Oxide (NO)",
            "Nitrogen Dioxide (NO2)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Fluorine (F2)",
            "Peroxynitrite (ONOO-)",
            "Singlet Oxygen (1O2)",
            "Superoxide (O2-)",
            "Hypochlorous Acid (HOCl)",
            "Hypobromous Acid (HOBr)",
            "Nitrous Oxide (N2O)",
            "Peracetic Acid (CH3CO3H)",
            "Potassium Permanganate (KMnO4)",
            "Chromium Trioxide (CrO3)",
            "Sodium Hypochlorite (NaClO)",
            "Sodium Perborate (NaBO3)",
            "Osmium Tetroxide (OsO4)",
            "Potassium Dichromate (K2Cr2O7)",
            "Lead(IV) Oxide (PbO2)",
            "Iodine (I2)",
            "Ferrate (FeO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ozone (O3)",
                "Hydrogen Peroxide (H2O2)",
                "Singlet Oxygen (1O2)",
                "Peracetic Acid (CH3CO3H)",
                "Osmium Tetroxide (OsO4)",
                "Potassium Dichromate (K2Cr2O7)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Nitric Oxide (NO)",
                "Nitrogen Dioxide (NO2)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Fluorine (F2)",
                "Peroxynitrite (ONOO-)",
                "Superoxide (O2-)",
                "Hypochlorous Acid (HOCl)",
                "Hypobromous Acid (HOBr)",
                "Nitrous Oxide (N2O)",
                "Potassium Permanganate (KMnO4)",
                "Chromium Trioxide (CrO3)",
                "Sodium Hypochlorite (NaClO)",
                "Sodium Perborate (NaBO3)",
                "Lead(IV) Oxide (PbO2)",
                "Iodine (I2)",
                "Ferrate (FeO4^2-)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "lead tetraacetate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate",
                "triplet dioxygen"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Hydrogen peroxide (H2O2)",
            "Superoxide anion (O2-)",
            "Ozone (O3)",
            "Nitric oxide (NO)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Potassium permanganate (KMnO4)",
            "Ferric ion (Fe3+)",
            "Copper(II) ion (Cu2+)",
            "Selenium dioxide (SeO2)",
            "Manganese dioxide (MnO2)",
            "Nitrogen dioxide (NO2)",
            "Peracetic acid (C2H4O3)",
            "Benzoyl peroxide (C14H10O4)",
            "Iodine (I2)",
            "Hydrochloric acid (HCl)",
            "Trichloroacetic acid (CCl3COOH)",
            "Chromic acid (H2CrO4)",
            "Sodium hypochlorite (NaClO)",
            "Calcium hypochlorite (Ca(OCl)2)",
            "Sodium dichromate (Na2Cr2O7)",
            "Arsenic trioxide (As2O3)",
            "Vanadium pentoxide (V2O5)",
            "Lead(IV) oxide (PbO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Peracetic acid (C2H4O3)",
                "Chromic acid (H2CrO4)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Superoxide anion (O2-)",
                "Nitric oxide (NO)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Potassium permanganate (KMnO4)",
                "Ferric ion (Fe3+)",
                "Copper(II) ion (Cu2+)",
                "Selenium dioxide (SeO2)",
                "Manganese dioxide (MnO2)",
                "Nitrogen dioxide (NO2)",
                "Benzoyl peroxide (C14H10O4)",
                "Iodine (I2)",
                "Hydrochloric acid (HCl)",
                "Trichloroacetic acid (CCl3COOH)",
                "Sodium hypochlorite (NaClO)",
                "Calcium hypochlorite (Ca(OCl)2)",
                "Sodium dichromate (Na2Cr2O7)",
                "Arsenic trioxide (As2O3)",
                "Vanadium pentoxide (V2O5)",
                "Lead(IV) oxide (PbO2)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "trichloroacetaldehyde",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H2O2)",
            "Ozone (O3)",
            "Sodium Hypochlorite (NaClO)",
            "Potassium Permanganate (KMnO4)",
            "Nitric Acid (HNO3)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Oxygen (O2)",
            "Sulfuric Acid (H2SO4)",
            "Nitrogen Dioxide (NO2)",
            "Chlorine Dioxide (ClO2)",
            "Peroxynitrite (ONOO-)",
            "Superoxide (O2-)",
            "Hydroxyl Radical (\u2022OH)",
            "Sodium Chlorate (NaClO3)",
            "Potassium Dichromate (K2Cr2O7)",
            "Sodium Persulfate (Na2S2O8)",
            "Ammonium Persulfate ((NH4)2S2O8)",
            "Bromine Trifluoride (BrF3)",
            "Chromium Trioxide (CrO3)",
            "Potassium Chlorate (KClO3)",
            "Lead Dioxide (PbO2)",
            "Selenium Dioxide (SeO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H2O2)",
                "Ozone (O3)",
                "Potassium Dichromate (K2Cr2O7)",
                "Ammonium Persulfate ((NH4)2S2O8)"
            ],
            "mismatches": [
                "Sodium Hypochlorite (NaClO)",
                "Potassium Permanganate (KMnO4)",
                "Nitric Acid (HNO3)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Oxygen (O2)",
                "Sulfuric Acid (H2SO4)",
                "Nitrogen Dioxide (NO2)",
                "Chlorine Dioxide (ClO2)",
                "Peroxynitrite (ONOO-)",
                "Superoxide (O2-)",
                "Hydroxyl Radical (\u2022OH)",
                "Sodium Chlorate (NaClO3)",
                "Sodium Persulfate (Na2S2O8)",
                "Bromine Trifluoride (BrF3)",
                "Chromium Trioxide (CrO3)",
                "Potassium Chlorate (KClO3)",
                "Lead Dioxide (PbO2)",
                "Selenium Dioxide (SeO2)"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde oxime",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromic acid",
                "diethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "lead tetraacetate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Hydrogen peroxide (H2O2)",
            "Ozone (O3)",
            "Nitric oxide (NO)",
            "Hydroxyl radical (OH)",
            "Superoxide anion (O2-)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Fluorine (F2)",
            "Permanganate ion (MnO4-)",
            "Chromate ion (CrO4^2-)",
            "Dichromate ion (Cr2O7^2-)",
            "Hypochlorite ion (ClO-)",
            "Hypobromite ion (BrO-)",
            "Hypoiodite ion (IO-)",
            "Hydrogen peroxide radical (HO2)",
            "Singlet oxygen (^1O2)",
            "Peroxynitrite (ONOO-)",
            "Ferric ion (Fe3+)",
            "Copper ion (Cu2+)",
            "Manganese ion (Mn2+)",
            "Lead ion (Pb2+)",
            "Mercury ion (Hg2+)",
            "Silver ion (Ag+)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide",
                "Ozone",
                "chromate(2-)",
                "singlet dioxygen"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Nitric oxide (NO)",
                "Hydroxyl radical (OH)",
                "Superoxide anion (O2-)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Fluorine (F2)",
                "Permanganate ion (MnO4-)",
                "Dichromate ion (Cr2O7^2-)",
                "Hypochlorite ion (ClO-)",
                "Hypobromite ion (BrO-)",
                "Hypoiodite ion (IO-)",
                "Hydrogen peroxide radical (HO2)",
                "Peroxynitrite (ONOO-)",
                "Ferric ion (Fe3+)",
                "Copper ion (Cu2+)",
                "Manganese ion (Mn2+)",
                "Lead ion (Pb2+)",
                "Mercury ion (Hg2+)",
                "Silver ion (Ag+)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "isonordoperoxide",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H\u2082O\u2082)",
            "Superoxide anion (O\u2082\u207b)",
            "Hydroxyl radical (\u2022OH)",
            "Ozone (O\u2083)",
            "Nitric oxide (NO)",
            "Singlet oxygen (\u00b9O\u2082)",
            "Ferric ion (Fe\u00b3\u207a)",
            "Permanganate ion (MnO\u2084\u207b)",
            "Chlorine (Cl\u2082)",
            "Hypochlorous acid (HOCl)",
            "Peroxynitrite (ONOO\u207b)",
            "Dioxygen (O\u2082)",
            "Nitrogen dioxide (NO\u2082)",
            "Chromate ion (CrO\u2084\u00b2\u207b)",
            "Permanganic acid (HMnO\u2084)",
            "Peroxymonosulfate (HSO\u2085\u207b)",
            "Persulfate ion (S\u2082O\u2088\u00b2\u207b)",
            "Iodine (I\u2082)",
            "Nitric acid (HNO\u2083)",
            "Potassium dichromate (K\u2082Cr\u2082O\u2087)",
            "Potassium permanganate (KMnO\u2084)",
            "Sulfur trioxide (SO\u2083)",
            "Chlorine dioxide (ClO\u2082)",
            "Bromine (Br\u2082)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H\u2082O\u2082)",
                "Ozone (O\u2083)",
                "Singlet oxygen (\u00b9O\u2082)",
                "Dioxygen (O\u2082)",
                "Potassium dichromate (K\u2082Cr\u2082O\u2087)"
            ],
            "mismatches": [
                "Superoxide anion (O\u2082\u207b)",
                "Hydroxyl radical (\u2022OH)",
                "Nitric oxide (NO)",
                "Ferric ion (Fe\u00b3\u207a)",
                "Permanganate ion (MnO\u2084\u207b)",
                "Chlorine (Cl\u2082)",
                "Hypochlorous acid (HOCl)",
                "Peroxynitrite (ONOO\u207b)",
                "Nitrogen dioxide (NO\u2082)",
                "Chromate ion (CrO\u2084\u00b2\u207b)",
                "Permanganic acid (HMnO\u2084)",
                "Peroxymonosulfate (HSO\u2085\u207b)",
                "Persulfate ion (S\u2082O\u2088\u00b2\u207b)",
                "Iodine (I\u2082)",
                "Nitric acid (HNO\u2083)",
                "Potassium permanganate (KMnO\u2084)",
                "Sulfur trioxide (SO\u2083)",
                "Chlorine dioxide (ClO\u2082)",
                "Bromine (Br\u2082)"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "peroxides",
                "peroxybis(sulfanide)",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Oxygen (O2)",
            "Ozone (O3)",
            "Hypochlorite ion (ClO-)",
            "Superoxide anion (O2\u2022-)",
            "Hydroxyl radical (\u2022OH)",
            "Singlet oxygen (1O2)",
            "Peroxynitrite (ONOO-)",
            "Nitric oxide (NO)",
            "Chlorine gas (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Permanganate ion (MnO4-)",
            "Dichromate ion (Cr2O7 2-)",
            "Nitrate ion (NO3-)",
            "Sulfate radical (SO4\u2022-)",
            "Peroxyl radical (ROO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Hypobromous acid (HOBr)",
            "Hypochlorous acid (HOCl)",
            "Chlorine dioxide (ClO2)",
            "Peracetic acid (CH3CO3H)",
            "Ferrate ion (FeO4 2-)",
            "tert-Butyl hydroperoxide (t-BuOOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Singlet oxygen (1O2)",
                "Peracetic acid (CH3CO3H)",
                "tert-Butyl hydroperoxide (t-BuOOH)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Hypochlorite ion (ClO-)",
                "Superoxide anion (O2\u2022-)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxynitrite (ONOO-)",
                "Nitric oxide (NO)",
                "Chlorine gas (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Permanganate ion (MnO4-)",
                "Dichromate ion (Cr2O7 2-)",
                "Nitrate ion (NO3-)",
                "Sulfate radical (SO4\u2022-)",
                "Peroxyl radical (ROO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Hypobromous acid (HOBr)",
                "Hypochlorous acid (HOCl)",
                "Chlorine dioxide (ClO2)",
                "Ferrate ion (FeO4 2-)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "peroxides",
                "potassium dichromate",
                "pyridinium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "tert-butyl hydroperoxide",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Ozone (O3)",
            "Hypochlorous acid (HClO)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Singlet oxygen (1O2)",
            "Superoxide anion radical (O2\u2022-)",
            "Hydroxyl radical (\u2022OH)",
            "Peroxyl radical (ROO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Peroxynitrite (ONOO-)",
            "Nitric oxide (NO)",
            "Nitrogen dioxide (NO2)",
            "Hypobromous acid (HBrO)",
            "Hypoiodous acid (HIO)",
            "Chlorine dioxide (ClO2)",
            "Peroxydisulfate (S2O82-)",
            "Peroxymonosulfate (HSO5-)",
            "Permanganate (MnO4-)",
            "Chromate (CrO42-)",
            "Dichromate (Cr2O72-)",
            "Periodate (IO4-)",
            "Persulfate (S2O82-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Singlet oxygen (1O2)",
                "Chromate (CrO42-)",
                "Dichromate (Cr2O72-)"
            ],
            "mismatches": [
                "Hypochlorous acid (HClO)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Superoxide anion radical (O2\u2022-)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxyl radical (ROO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Peroxynitrite (ONOO-)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Hypobromous acid (HBrO)",
                "Hypoiodous acid (HIO)",
                "Chlorine dioxide (ClO2)",
                "Peroxydisulfate (S2O82-)",
                "Peroxymonosulfate (HSO5-)",
                "Permanganate (MnO4-)",
                "Periodate (IO4-)",
                "Persulfate (S2O82-)"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde",
                "(methylsulfanyl)acetaldehyde oxime",
                "FINO2",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peroxides",
                "peroxybis(sulfanide)",
                "potassium dichromate",
                "pyridinium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Potassium permanganate (KMnO4)",
            "Sodium hypochlorite (NaClO)",
            "Ozone (O3)",
            "Chlorine (Cl2)",
            "Potassium dichromate (K2Cr2O7)",
            "Nitric acid (HNO3)",
            "Chromic acid (H2CrO4)",
            "Ferric chloride (FeCl3)",
            "Potassium bromate (KBrO3)",
            "Sodium perborate (NaBO3\u00b74H2O)",
            "Persulfates (S2O8^2-)",
            "Periodic acid (H5IO6)",
            "Lead dioxide (PbO2)",
            "Potassium ferricyanide (K3[Fe(CN)6])",
            "Potassium iodate (KIO3)",
            "Sodium persulfate (Na2S2O8)",
            "Iodine (I2)",
            "Benzoyl peroxide (C14H10O4)",
            "Potassium chlorate (KClO3)",
            "Calcium hypochlorite (Ca(ClO)2)",
            "Sodium perborate monohydrate (NaBO3\u00b7H2O)",
            "Potassium perchlorate (KClO4)",
            "Ammonium persulfate ((NH4)2S2O8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Potassium dichromate (K2Cr2O7)",
                "Chromic acid (H2CrO4)",
                "Ammonium persulfate ((NH4)2S2O8)"
            ],
            "mismatches": [
                "Potassium permanganate (KMnO4)",
                "Sodium hypochlorite (NaClO)",
                "Chlorine (Cl2)",
                "Nitric acid (HNO3)",
                "Ferric chloride (FeCl3)",
                "Potassium bromate (KBrO3)",
                "Sodium perborate (NaBO3\u00b74H2O)",
                "Persulfates (S2O8^2-)",
                "Periodic acid (H5IO6)",
                "Lead dioxide (PbO2)",
                "Potassium ferricyanide (K3[Fe(CN)6])",
                "Potassium iodate (KIO3)",
                "Sodium persulfate (Na2S2O8)",
                "Iodine (I2)",
                "Benzoyl peroxide (C14H10O4)",
                "Potassium chlorate (KClO3)",
                "Calcium hypochlorite (Ca(ClO)2)",
                "Sodium perborate monohydrate (NaBO3\u00b7H2O)",
                "Potassium perchlorate (KClO4)"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde",
                "(methylsulfanyl)acetaldehyde oxime",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "lead tetraacetate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peroxybis(sulfanide)",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Superoxide radical (O2\u2022-)",
            "Hydroxyl radical (\u2022OH)",
            "Hypochlorous acid (HOCl)",
            "Peroxynitrite (ONOO-)",
            "Ozone (O3)",
            "Singlet oxygen (1O2)",
            "Nitric oxide (NO\u2022)",
            "Nitrogen dioxide (NO2\u2022)",
            "Lipid peroxyl radical (LOO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Peroxyl radical (ROO\u2022)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Potassium permanganate (KMnO4)",
            "Sodium hypochlorite (NaOCl)",
            "Hydrogen sulfide (H2S)",
            "Sulfur dioxide (SO2)",
            "Nitrogen oxides (NOx)",
            "Organic hydroperoxides (ROOH)",
            "Quinones",
            "Flavins",
            "Metal ions (Fe3+, Cu2+, etc.)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Singlet oxygen (1O2)"
            ],
            "mismatches": [
                "Superoxide radical (O2\u2022-)",
                "Hydroxyl radical (\u2022OH)",
                "Hypochlorous acid (HOCl)",
                "Peroxynitrite (ONOO-)",
                "Nitric oxide (NO\u2022)",
                "Nitrogen dioxide (NO2\u2022)",
                "Lipid peroxyl radical (LOO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Potassium permanganate (KMnO4)",
                "Sodium hypochlorite (NaOCl)",
                "Hydrogen sulfide (H2S)",
                "Sulfur dioxide (SO2)",
                "Nitrogen oxides (NOx)",
                "Organic hydroperoxides (ROOH)",
                "Quinones",
                "Flavins",
                "Metal ions (Fe3+, Cu2+, etc.)"
            ],
            "true_referents": [
                "(R)-alpha-campholenaldehyde",
                "FINO2",
                "ammonium nitrate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "isonordoperoxide",
                "nitrosoperoxycarbonic acid",
                "organic peroxide",
                "ozone",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "singlet dioxygen",
                "sodium bromate",
                "sodium chlorite",
                "tert-butyl hydroperoxide",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Ozone (O3)",
            "Chlorine gas (Cl2)",
            "Bromine gas (Br2)",
            "Iodine (I2)",
            "Nitric oxide (NO)",
            "Nitrogen dioxide (NO2)",
            "Nitrogen trioxide (NO3)",
            "Oxalic acid",
            "Ferric chloride (FeCl3)",
            "Manganese dioxide (MnO2)",
            "Potassium permanganate (KMnO4)",
            "Sodium hypochlorite (NaOCl)",
            "Chloramine-T",
            "Oxone",
            "Oxygen (O2)",
            "Oxidizing agents in the Fenton reaction",
            "Oxidizing agents in the Haber-Weiss reaction",
            "Luminol",
            "Lucigenin",
            "Amplex UltraRed",
            "Dihydroxybenzoic acid (DHBA)",
            "2,7-Dichlorofluorescein diacetate (DCFH-DA)",
            "3,3'-Diaminobenzidine (DAB)",
            "Fluorescein",
            "Fluorescein diacetate (FDA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Oxygen (O2)"
            ],
            "mismatches": [
                "Chlorine gas (Cl2)",
                "Bromine gas (Br2)",
                "Iodine (I2)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen trioxide (NO3)",
                "Oxalic acid",
                "Ferric chloride (FeCl3)",
                "Manganese dioxide (MnO2)",
                "Potassium permanganate (KMnO4)",
                "Sodium hypochlorite (NaOCl)",
                "Chloramine-T",
                "Oxone",
                "Oxidizing agents in the Fenton reaction",
                "Oxidizing agents in the Haber-Weiss reaction",
                "Luminol",
                "Lucigenin",
                "Amplex UltraRed",
                "Dihydroxybenzoic acid (DHBA)",
                "2,7-Dichlorofluorescein diacetate (DCFH-DA)",
                "3,3'-Diaminobenzidine (DAB)",
                "Fluorescein",
                "Fluorescein diacetate (FDA)"
            ],
            "true_referents": [
                "(5-hydroxyindol-3-yl)acetaldehyde",
                "(methylsulfanyl)acetaldehyde oxime",
                "1-hydroxy-1,3-dioxobenziodoxole",
                "Dihydroartemisinin (DHA)",
                "FINO2",
                "acetaldehyde",
                "ammonium nitrate",
                "artemotil",
                "astropectenol B",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromic acid",
                "coelenterazine dioxetanone",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxidanedicarbonitrile",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "muqubilone",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peracetic acid",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen peroxide (H2O2)",
            "Oxygen (O2)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Fluorine (F2)",
            "Ozone (O3)",
            "Nitric oxide (NO)",
            "Nitrogen dioxide (NO2)",
            "Chlorine dioxide (ClO2)",
            "Hypochlorous acid (HOCl)",
            "Hypobromous acid (HOBr)",
            "Hypoiodous acid (HOI)",
            "Fenton's reagent (Fe2+/H2O2)",
            "Doxorubicin (DXR)",
            "Bleach (NaOCl)",
            "Potassium permanganate (KMnO4)",
            "Chlorhexidine",
            "Dehydroascorbic acid (DHA)",
            "Menadione (Vit K3)",
            "Platinum (Pt)",
            "Cerium(IV) oxide (CeO2)",
            "Ferric ion (Fe3+)",
            "Copper(II) ion (Cu2+)",
            "Manganese dioxide (MnO2)",
            "Chromate (CrO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Chromate (CrO4^2-)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Fluorine (F2)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Chlorine dioxide (ClO2)",
                "Hypochlorous acid (HOCl)",
                "Hypobromous acid (HOBr)",
                "Hypoiodous acid (HOI)",
                "Fenton's reagent (Fe2+/H2O2)",
                "Doxorubicin (DXR)",
                "Bleach (NaOCl)",
                "Potassium permanganate (KMnO4)",
                "Chlorhexidine",
                "Dehydroascorbic acid (DHA)",
                "Menadione (Vit K3)",
                "Platinum (Pt)",
                "Cerium(IV) oxide (CeO2)",
                "Ferric ion (Fe3+)",
                "Copper(II) ion (Cu2+)",
                "Manganese dioxide (MnO2)"
            ],
            "true_referents": [
                "(+)-artemisinin",
                "Dihydroartemisinin (DHA)",
                "FINO2",
                "adxanthromycin A",
                "adxanthromycin B",
                "ammonium nitrate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "lead tetraacetate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "potassium chromate",
                "potassium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": "[\n        {\n            \"Canonical name\": \"Peroxide\" (H2O2)\n        },\n        {\n            \"Canonical name\": \"Superoxide\" (O2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Singlet oxygen\" (1O2)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxide\" (H2O2)\n        },\n        {\n            \"Canonical name\": \"Superoxide\" (O2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Singlet oxygen\" (1O2)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxide\" (H2O2)\n        },\n        {\n            \"Canonical name\": \"Superoxide\" (O2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Singlet oxygen\" (1O2)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxide\" (H2O2)\n        },\n        {\n            \"Canonical name\": \"Superoxide\" (O2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Singlet oxygen\" (1O2)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        },\n        {\n            \"Canonical name\": \"Hypochlorite\" (ClO2-)\n        },\n        {\n            \"Canonical name\": \"Peroxynitrite\" (ONOO-)\n        },\n        {\n            \"Canonical name\": \"Nitrosonium\" (NO+)\n        },\n        {\n            \"Canonical name\": \"Nitric oxide\" (NO)\n        },\n        {\n            \"Canonical name\": \"Nitrite\" (NO2-)\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]