[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H2O2)",
            "Chlorine (Cl2)",
            "Oxygen (O2)",
            "Nitric Acid (HNO3)",
            "Sodium Chlorate (NaClO3)",
            "Chromate Ion (CrO4^2-)",
            "Potassium Permanganate (KMnO4)",
            "Sulfur Trioxide (SO3)",
            "Chlorine Dioxide (ClO2)",
            "Sulfuric Acid (H2SO4)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Chloramine (NH2Cl)",
            "Chlorine Monoxide (ClO)",
            "Nitrogen Dioxide (NO2)",
            "Chlorine Trifluoride (ClF3)",
            "Chlorine Pentafluoride (ClF5)",
            "Dichromate Ion (Cr2O7^2-)",
            "Chlorine Dioxide Radical (ClO2^+)",
            "Perchloric Acid (HClO4)",
            "Chlorine Dioxide Ion (ClO2^-)",
            "Chlorine Monoxide Radical (ClO^+)",
            "Chlorine Trioxide (ClO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H2O2)",
                "Chromate Ion (CrO4^2-)",
                "Dichromate Ion (Cr2O7^2-)"
            ],
            "mismatches": [
                "Chlorine (Cl2)",
                "Oxygen (O2)",
                "Nitric Acid (HNO3)",
                "Sodium Chlorate (NaClO3)",
                "Potassium Permanganate (KMnO4)",
                "Sulfur Trioxide (SO3)",
                "Chlorine Dioxide (ClO2)",
                "Sulfuric Acid (H2SO4)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Chloramine (NH2Cl)",
                "Chlorine Monoxide (ClO)",
                "Nitrogen Dioxide (NO2)",
                "Chlorine Trifluoride (ClF3)",
                "Chlorine Pentafluoride (ClF5)",
                "Chlorine Dioxide Radical (ClO2^+)",
                "Perchloric Acid (HClO4)",
                "Chlorine Dioxide Ion (ClO2^-)",
                "Chlorine Monoxide Radical (ClO^+)",
                "Chlorine Trioxide (ClO3)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromyl dichloride",
                "diethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "trichloroacetaldehyde",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H2O2)",
            "Chlorine (Cl2)",
            "Oxygen (O2)",
            "Nitric Acid (HNO3)",
            "Potassium Permanganate (KMnO4)",
            "Chromium Trioxide (CrO3)",
            "Ozone (O3)",
            "Sulfuric Acid (H2SO4)",
            "Nitrogen Dioxide (NO2)",
            "Ferric Ion (Fe3+)",
            "Manganate Ion (MnO4-)",
            "Dichromate Ion (Cr2O7^2-)",
            "Sodium Hypochlorite (NaOCl)",
            "Iodine (I2)",
            "Potassium Dichromate (K2Cr2O7)",
            "Hypochlorous Acid (HOCl)",
            "Hydrogen Fluoride (HF)",
            "Sodium Nitrate (NaNO3)",
            "Cerium(IV) Ion (Ce4+)",
            "Potassium Ferricyanide (K3[Fe(CN)6])",
            "Ammonium Nitrate (NH4NO3)",
            "Bromine (Br2)",
            "Iodine Pentafluoride (IF5)",
            "Oxygen Difluoride (OF2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H2O2)",
                "Ozone (O3)",
                "Potassium Dichromate (K2Cr2O7)",
                "Ammonium Nitrate (NH4NO3)"
            ],
            "mismatches": [
                "Chlorine (Cl2)",
                "Oxygen (O2)",
                "Nitric Acid (HNO3)",
                "Potassium Permanganate (KMnO4)",
                "Chromium Trioxide (CrO3)",
                "Sulfuric Acid (H2SO4)",
                "Nitrogen Dioxide (NO2)",
                "Ferric Ion (Fe3+)",
                "Manganate Ion (MnO4-)",
                "Dichromate Ion (Cr2O7^2-)",
                "Sodium Hypochlorite (NaOCl)",
                "Iodine (I2)",
                "Hypochlorous Acid (HOCl)",
                "Hydrogen Fluoride (HF)",
                "Sodium Nitrate (NaNO3)",
                "Cerium(IV) Ion (Ce4+)",
                "Potassium Ferricyanide (K3[Fe(CN)6])",
                "Bromine (Br2)",
                "Iodine Pentafluoride (IF5)",
                "Oxygen Difluoride (OF2)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Hydrogen peroxide (H2O2)",
            "Potassium permanganate (KMnO4)",
            "Chlorine (Cl2)",
            "Nitric acid (HNO3)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Manganese dioxide (MnO2)",
            "Potassium dichromate (K2Cr2O7)",
            "Iron(III) oxide (Fe2O3)",
            "Copper(II) sulfate (CuSO4)",
            "Silver nitrate (AgNO3)",
            "Perchloric acid (HClO4)",
            "Sulfuric acid (H2SO4)",
            "Chlorine dioxide (ClO2)",
            "Hydrogen peroxide (H2O2)",
            "Ozone (O3)",
            "Fluorine (F2)",
            "Chromic acid (H2CrO4)",
            "Manganese heptoxide (Mn2O7)",
            "Nitrous oxide (N2O)",
            "Sodium hypochlorite (NaOCl)",
            "Osmium tetroxide (OsO4)",
            "Sulfur trioxide (SO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Potassium dichromate (K2Cr2O7)",
                "Ozone (O3)",
                "Chromic acid (H2CrO4)",
                "Osmium tetroxide (OsO4)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Potassium permanganate (KMnO4)",
                "Chlorine (Cl2)",
                "Nitric acid (HNO3)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Manganese dioxide (MnO2)",
                "Iron(III) oxide (Fe2O3)",
                "Copper(II) sulfate (CuSO4)",
                "Silver nitrate (AgNO3)",
                "Perchloric acid (HClO4)",
                "Sulfuric acid (H2SO4)",
                "Chlorine dioxide (ClO2)",
                "Fluorine (F2)",
                "Manganese heptoxide (Mn2O7)",
                "Nitrous oxide (N2O)",
                "Sodium hypochlorite (NaOCl)",
                "Sulfur trioxide (SO3)"
            ],
            "true_referents": [
                "9-(2-carboxyethyl)-10-methylanthracene endoperoxide",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Fluorine (F2)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Potassium Permanganate (KMnO4)",
            "Potassium Dichromate (K2Cr2O7)",
            "Hydrogen Peroxide (H2O2)",
            "Nitric Acid (HNO3)",
            "Chromic Acid (H2CrO4)",
            "Osmium Tetroxide (OsO4)",
            "Peracetic Acid (CH3CO3H)",
            "m-Chloroperoxybenzoic Acid (mCPBA)",
            "Sodium Hypochlorite (NaClO)",
            "Silver Oxide (Ag2O)",
            "Iron(III) Chloride (FeCl3)",
            "Copper(II) Sulfate (CuSO4)",
            "Cerium(IV) Ammonium Nitrate (CAN)",
            "2,3-Dichloro-5,6-dicyano-1,4-benzoquinone (DDQ)",
            "Pyridinium Chlorochromate (PCC)",
            "Pyridinium Dichromate (PDC)",
            "Dess-Martin Periodinane (DMP)",
            "Manganese Dioxide (MnO2)",
            "Selectfluor (F-TEDA-BF4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Potassium Dichromate (K2Cr2O7)",
                "Hydrogen Peroxide (H2O2)",
                "Chromic Acid (H2CrO4)",
                "Osmium Tetroxide (OsO4)",
                "Peracetic Acid (CH3CO3H)",
                "Pyridinium Chlorochromate (PCC)",
                "Pyridinium Dichromate (PDC)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Fluorine (F2)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Potassium Permanganate (KMnO4)",
                "Nitric Acid (HNO3)",
                "m-Chloroperoxybenzoic Acid (mCPBA)",
                "Sodium Hypochlorite (NaClO)",
                "Silver Oxide (Ag2O)",
                "Iron(III) Chloride (FeCl3)",
                "Copper(II) Sulfate (CuSO4)",
                "Cerium(IV) Ammonium Nitrate (CAN)",
                "2,3-Dichloro-5,6-dicyano-1,4-benzoquinone (DDQ)",
                "Dess-Martin Periodinane (DMP)",
                "Manganese Dioxide (MnO2)",
                "Selectfluor (F-TEDA-BF4)"
            ],
            "true_referents": [
                "1-hydroxy-1,3-dioxobenziodoxole",
                "1R,4S,6R-1,4-endoperoxy-bisabola-2,10-diene",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxidanedicarbonitrile",
                "dioxygen",
                "fluoroacetaldehyde",
                "formylmethyl",
                "gyromitrin",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "plakortide F free acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium chlorochromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Hydrogen peroxide (H2O2)",
            "Potassium permanganate (KMnO4)",
            "Chlorine (Cl2)",
            "Nitric acid (HNO3)",
            "Sulfuric acid (H2SO4)",
            "Sodium hypochlorite (NaClO)",
            "Fluorine (F2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Ozone (O3)",
            "Chromium trioxide (CrO3)",
            "Potassium dichromate (K2Cr2O7)",
            "Ferric chloride (FeCl3)",
            "Copper(II) sulfate (CuSO4)",
            "Silver nitrate (AgNO3)",
            "Nitrogen dioxide (NO2)",
            "Peracetic acid (CH3CO3H)",
            "Benzoquinone (C6H4O2)",
            "Lead(IV) acetate (Pb(C2H3O2)4)",
            "Cerium(IV) ammonium nitrate (CAN)",
            "Iron(III) nitrate (Fe(NO3)3)",
            "Manganese dioxide (MnO2)",
            "Sodium percarbonate (Na2CO3\u00b71.5H2O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Peracetic acid (CH3CO3H)",
                "Potassium dichromate (K2Cr2O7)",
                "Lead(IV) acetate (Pb(C2H3O2)4)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Potassium permanganate (KMnO4)",
                "Chlorine (Cl2)",
                "Nitric acid (HNO3)",
                "Sulfuric acid (H2SO4)",
                "Sodium hypochlorite (NaClO)",
                "Fluorine (F2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Chromium trioxide (CrO3)",
                "Ferric chloride (FeCl3)",
                "Copper(II) sulfate (CuSO4)",
                "Silver nitrate (AgNO3)",
                "Nitrogen dioxide (NO2)",
                "Benzoquinone (C6H4O2)",
                "Cerium(IV) ammonium nitrate (CAN)",
                "Iron(III) nitrate (Fe(NO3)3)",
                "Manganese dioxide (MnO2)",
                "Sodium percarbonate (Na2CO3\u00b71.5H2O2)"
            ],
            "true_referents": [
                "(5-hydroxyindol-3-yl)acetaldehyde",
                "1-hydroxy-1,3-dioxobenziodoxole",
                "1S,4R,6R-1,4-endoperoxy-bisabola-2,10-diene",
                "9-(2-carboxyethyl)-10-methylanthracene endoperoxide",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H2O2)",
            "Potassium Permanganate (KMnO4)",
            "Chlorine Gas (Cl2)",
            "Nitric Acid (HNO3)",
            "Sodium Hypochlorite (NaOCl)",
            "Bromine (Br2)",
            "Ozone (O3)",
            "Ferric Chloride (FeCl3)",
            "Copper(II) Sulfate (CuSO4)",
            "Sodium Dichromate (Na2Cr2O7)",
            "Silver Nitrate (AgNO3)",
            "Hydrochloric Acid (HCl)",
            "Sodium Perborate (NaBO3)",
            "Calcium Hypochlorite (Ca(OCl)2)",
            "Magnesium Peroxide (MgO2)",
            "Lead(IV) Oxide (PbO2)",
            "Iodine (I2)",
            "Thallium(I) Chloride (TlCl)",
            "Titanium Dioxide (TiO2)",
            "Vanadium Pentoxide (V2O5)",
            "Arsenic Trioxide (As2O3)",
            "Barium Peroxide (BaO2)",
            "Cobalt(III) Chloride (CoCl3)",
            "Zinc Oxide (ZnO)",
            "Manganese Dioxide (MnO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H2O2)",
                "Ozone (O3)"
            ],
            "mismatches": [
                "Potassium Permanganate (KMnO4)",
                "Chlorine Gas (Cl2)",
                "Nitric Acid (HNO3)",
                "Sodium Hypochlorite (NaOCl)",
                "Bromine (Br2)",
                "Ferric Chloride (FeCl3)",
                "Copper(II) Sulfate (CuSO4)",
                "Sodium Dichromate (Na2Cr2O7)",
                "Silver Nitrate (AgNO3)",
                "Hydrochloric Acid (HCl)",
                "Sodium Perborate (NaBO3)",
                "Calcium Hypochlorite (Ca(OCl)2)",
                "Magnesium Peroxide (MgO2)",
                "Lead(IV) Oxide (PbO2)",
                "Iodine (I2)",
                "Thallium(I) Chloride (TlCl)",
                "Titanium Dioxide (TiO2)",
                "Vanadium Pentoxide (V2O5)",
                "Arsenic Trioxide (As2O3)",
                "Barium Peroxide (BaO2)",
                "Cobalt(III) Chloride (CoCl3)",
                "Zinc Oxide (ZnO)",
                "Manganese Dioxide (MnO2)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate",
                "thallium(III) nitrate"
            ],
            "TP": 2,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Chlorine (Cl)",
            "Hydrogen peroxide (H2O2)",
            "Iodine (I2)",
            "Bromine (Br2)",
            "Potassium permanganate (KMnO4)",
            "Hydrochloric acid (HCl)",
            "Sulfuric acid (H2SO4)",
            "Nitric acid (HNO3)",
            "Chromium trioxide (CrO3)",
            "Potassium dichromate (K2Cr2O7)",
            "Sodium hypochlorite (NaClO)",
            "Hydrogen fluoride (HF)",
            "Ozone (O3)",
            "Fluorine (F2)",
            "Lead(IV) oxide (PbO2)",
            "Hexavalent chromium (Cr(VI))",
            "Osmium tetroxide (OsO4)",
            "Perchloric acid (HClO4)",
            "Sodium chlorate (NaClO3)",
            "Sodium bromate (NaBrO3)",
            "Sodium iodate (NaIO3)",
            "Platinum(IV) chloride (PtCl4)",
            "Gold(III) chloride (AuCl3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Potassium dichromate (K2Cr2O7)",
                "Ozone (O3)",
                "Osmium tetroxide (OsO4)",
                "Sodium bromate (NaBrO3)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Chlorine (Cl)",
                "Iodine (I2)",
                "Bromine (Br2)",
                "Potassium permanganate (KMnO4)",
                "Hydrochloric acid (HCl)",
                "Sulfuric acid (H2SO4)",
                "Nitric acid (HNO3)",
                "Chromium trioxide (CrO3)",
                "Sodium hypochlorite (NaClO)",
                "Hydrogen fluoride (HF)",
                "Fluorine (F2)",
                "Lead(IV) oxide (PbO2)",
                "Hexavalent chromium (Cr(VI))",
                "Perchloric acid (HClO4)",
                "Sodium chlorate (NaClO3)",
                "Sodium iodate (NaIO3)",
                "Platinum(IV) chloride (PtCl4)",
                "Gold(III) chloride (AuCl3)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "lead tetraacetate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Hydrogen peroxide (H2O2)",
            "Potassium permanganate (KMnO4)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Fluorine (F2)",
            "Sodium hypochlorite (NaClO)",
            "Potassium dichromate (K2Cr2O7)",
            "Sulfuric acid (H2SO4)",
            "Nitric acid (HNO3)",
            "Permanganic acid (HMnO4)",
            "Chloric acid (HClO3)",
            "Hydrobromic acid (HBr)",
            "Hydroiodic acid (HI)",
            "Hydrofluoric acid (HF)",
            "Hydrochloric acid (HCl)",
            "Potassium iodide (KI)",
            "Potassium bromide (KBr)",
            "Potassium chloride (KCl)",
            "Sodium iodide (NaI)",
            "Sodium bromide (NaBr)",
            "Sodium chloride (NaCl)",
            "Iron(III) chloride (FeCl3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide",
                "Potassium dichromate"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Potassium permanganate (KMnO4)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Fluorine (F2)",
                "Sodium hypochlorite (NaClO)",
                "Sulfuric acid (H2SO4)",
                "Nitric acid (HNO3)",
                "Permanganic acid (HMnO4)",
                "Chloric acid (HClO3)",
                "Hydrobromic acid (HBr)",
                "Hydroiodic acid (HI)",
                "Hydrofluoric acid (HF)",
                "Hydrochloric acid (HCl)",
                "Potassium iodide (KI)",
                "Potassium bromide (KBr)",
                "Potassium chloride (KCl)",
                "Sodium iodide (NaI)",
                "Sodium bromide (NaBr)",
                "Sodium chloride (NaCl)",
                "Iron(III) chloride (FeCl3)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O\u2082)",
            "Hydrogen peroxide (H\u2082O\u2082)",
            "Potassium permanganate (KMnO\u2084)",
            "Chlorine (Cl\u2082)",
            "Nitric acid (HNO\u2083)",
            "Bromine (Br\u2082)",
            "Ozone (O\u2083)",
            "Sodium hypochlorite (NaOCl)",
            "Chromium trioxide (CrO\u2083)",
            "Ferric chloride (FeCl\u2083)",
            "Silver nitrate (AgNO\u2083)",
            "Iodine (I\u2082)",
            "Potassium dichromate (K\u2082Cr\u2082O\u2087)",
            "Hydrogen persulfate (H\u2082S\u2082O\u2088)",
            "Sodium chlorate (NaClO\u2083)",
            "Thionyl chloride (SOCl\u2082)",
            "Peroxomonosulfuric acid (Caro's acid)",
            "Peracetic acid (CH\u2083C(O)OOH)",
            "Dichromic acid (H\u2082Cr\u2082O\u2087)",
            "Potassium ferricyanide (K\u2083[Fe(CN)\u2086])",
            "Peroxydisulfate (S\u2082O\u2088\u00b2\u207b)",
            "Nitrogen dioxide (NO\u2082)",
            "Benzoyl peroxide (C\u2086H\u2085C(O)OOC\u2086H\u2085)",
            "Lead dioxide (PbO\u2082)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H\u2082O\u2082)",
                "Ozone (O\u2083)",
                "Peracetic acid (CH\u2083C(O)OOH)",
                "Potassium dichromate (K\u2082Cr\u2082O\u2087)"
            ],
            "mismatches": [
                "Oxygen (O\u2082)",
                "Potassium permanganate (KMnO\u2084)",
                "Chlorine (Cl\u2082)",
                "Nitric acid (HNO\u2083)",
                "Bromine (Br\u2082)",
                "Sodium hypochlorite (NaOCl)",
                "Chromium trioxide (CrO\u2083)",
                "Ferric chloride (FeCl\u2083)",
                "Silver nitrate (AgNO\u2083)",
                "Iodine (I\u2082)",
                "Hydrogen persulfate (H\u2082S\u2082O\u2088)",
                "Sodium chlorate (NaClO\u2083)",
                "Thionyl chloride (SOCl\u2082)",
                "Peroxomonosulfuric acid (Caro's acid)",
                "Dichromic acid (H\u2082Cr\u2082O\u2087)",
                "Potassium ferricyanide (K\u2083[Fe(CN)\u2086])",
                "Peroxydisulfate (S\u2082O\u2088\u00b2\u207b)",
                "Nitrogen dioxide (NO\u2082)",
                "Benzoyl peroxide (C\u2086H\u2085C(O)OOC\u2086H\u2085)",
                "Lead dioxide (PbO\u2082)"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde",
                "(methylsulfanyl)acetaldehyde oxime",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "organic peroxide",
                "ozone",
                "peracetic acid",
                "peroxybis(sulfanide)",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O\u2082)",
            "Hydrogen peroxide (H\u2082O\u2082)",
            "Chlorine (Cl\u2082)",
            "Potassium permanganate (KMnO\u2084)",
            "Hydrogen ion (H\u207a)",
            "Ferric ion (Fe\u00b3\u207a)",
            "Nitric acid (HNO\u2083)",
            "Ozone (O\u2083)",
            "Bromine (Br\u2082)",
            "Dichromate ion (Cr\u2082O\u2087\u00b2\u207b)",
            "Hypochlorite ion (ClO\u207b)",
            "Sulfuric acid (H\u2082SO\u2084)",
            "Nitrate ion (NO\u2083\u207b)",
            "Chromic acid (H\u2082CrO\u2084)",
            "Chlorate ion (ClO\u2083\u207b)",
            "Iodine (I\u2082)",
            "Perchloric acid (HClO\u2084)",
            "Cerium(IV) ion (Ce\u2074\u207a)",
            "Manganese dioxide (MnO\u2082)",
            "Persulfate ion (S\u2082O\u2088\u00b2\u207b)",
            "Fluorine (F\u2082)",
            "Lead dioxide (PbO\u2082)",
            "Peroxydisulfate ion (S\u2082O\u2088\u00b2\u207b)",
            "Silver ion (Ag\u207a)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide",
                "Ozone",
                "Chromic acid"
            ],
            "mismatches": [
                "Oxygen (O\u2082)",
                "Chlorine (Cl\u2082)",
                "Potassium permanganate (KMnO\u2084)",
                "Hydrogen ion (H\u207a)",
                "Ferric ion (Fe\u00b3\u207a)",
                "Nitric acid (HNO\u2083)",
                "Bromine (Br\u2082)",
                "Dichromate ion (Cr\u2082O\u2087\u00b2\u207b)",
                "Hypochlorite ion (ClO\u207b)",
                "Sulfuric acid (H\u2082SO\u2084)",
                "Nitrate ion (NO\u2083\u207b)",
                "Chlorate ion (ClO\u2083\u207b)",
                "Iodine (I\u2082)",
                "Perchloric acid (HClO\u2084)",
                "Cerium(IV) ion (Ce\u2074\u207a)",
                "Manganese dioxide (MnO\u2082)",
                "Persulfate ion (S\u2082O\u2088\u00b2\u207b)",
                "Fluorine (F\u2082)",
                "Lead dioxide (PbO\u2082)",
                "Peroxydisulfate ion (S\u2082O\u2088\u00b2\u207b)",
                "Silver ion (Ag\u207a)"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "peroxybis(sulfanide)",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O2)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Fluorine (F2)",
            "Hydrogen peroxide (H2O2)",
            "Potassium permanganate (KMnO4)",
            "Sodium hypochlorite (NaClO)",
            "Nitric acid (HNO3)",
            "Sulfuric acid (H2SO4)",
            "Chromic acid (H2CrO4)",
            "Osmium tetroxide (OsO4)",
            "Chlorine dioxide (ClO2)",
            "Bromine pentafluoride (BrF5)",
            "Xenon difluoride (XeF2)",
            "Cerium(IV) ammonium nitrate (CAN)",
            "2,3-Dichloro-5,6-dicyano-1,4-benzoquinone (DDQ)",
            "Pyridinium chlorochromate (PCC)",
            "Dess-Martin periodinane (DMP)",
            "Tetrabutylammonium periodate (TBAP)",
            "Chloramine-T",
            "N-Bromosuccinimide (NBS)",
            "Selectfluor",
            "Benzoquinone (BQ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen peroxide (H2O2)",
                "Chromic acid (H2CrO4)",
                "Osmium tetroxide (OsO4)",
                "Pyridinium chlorochromate (PCC)"
            ],
            "mismatches": [
                "Oxygen (O2)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Fluorine (F2)",
                "Potassium permanganate (KMnO4)",
                "Sodium hypochlorite (NaClO)",
                "Nitric acid (HNO3)",
                "Sulfuric acid (H2SO4)",
                "Chlorine dioxide (ClO2)",
                "Bromine pentafluoride (BrF5)",
                "Xenon difluoride (XeF2)",
                "Cerium(IV) ammonium nitrate (CAN)",
                "2,3-Dichloro-5,6-dicyano-1,4-benzoquinone (DDQ)",
                "Dess-Martin periodinane (DMP)",
                "Tetrabutylammonium periodate (TBAP)",
                "Chloramine-T",
                "N-Bromosuccinimide (NBS)",
                "Selectfluor",
                "Benzoquinone (BQ)"
            ],
            "true_referents": [
                "1-hydroxy-1,3-dioxobenziodoxole",
                "3H-1,2-benzodioxole",
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxidanedicarbonitrile",
                "dioxygen",
                "fluoroacetaldehyde",
                "gyromitrin",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "lead tetraacetate",
                "muqubilone",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peroxybis(sulfanide)",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium chlorochromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxygen (O\u2082)",
            "Chlorine (Cl\u2082)",
            "Bromine (Br\u2082)",
            "Iodine (I\u2082)",
            "Fluorine (F\u2082)",
            "Potassium Permanganate (KMnO\u2084)",
            "Potassium Dichromate (K\u2082Cr\u2082O\u2087)",
            "Sodium Dichromate (Na\u2082Cr\u2082O\u2087)",
            "Hydrogen Peroxide (H\u2082O\u2082)",
            "Ozone (O\u2083)",
            "Nitric Acid (HNO\u2083)",
            "Sulfuric Acid (H\u2082SO\u2084)",
            "Chromic Acid (H\u2082CrO\u2084)",
            "Perchloric Acid (HClO\u2084)",
            "Potassium Nitrate (KNO\u2083)",
            "Ammonium Nitrate (NH\u2084NO\u2083)",
            "Potassium Chlorate (KClO\u2083)",
            "Potassium Bromate (KBrO\u2083)",
            "Potassium Iodate (KIO\u2083)",
            "Copper(II) Sulfate (CuSO\u2084)",
            "Iron(III) Chloride (FeCl\u2083)",
            "Manganese(IV) Oxide (MnO\u2082)",
            "Lead(IV) Oxide (PbO\u2082)",
            "Cerium(IV) Sulfate (Ce(SO\u2084)\u2082)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Potassium Dichromate",
                "Hydrogen Peroxide",
                "Ozone",
                "Chromic Acid",
                "Ammonium Nitrate"
            ],
            "mismatches": [
                "Oxygen (O\u2082)",
                "Chlorine (Cl\u2082)",
                "Bromine (Br\u2082)",
                "Iodine (I\u2082)",
                "Fluorine (F\u2082)",
                "Potassium Permanganate (KMnO\u2084)",
                "Sodium Dichromate (Na\u2082Cr\u2082O\u2087)",
                "Nitric Acid (HNO\u2083)",
                "Sulfuric Acid (H\u2082SO\u2084)",
                "Perchloric Acid (HClO\u2084)",
                "Potassium Nitrate (KNO\u2083)",
                "Potassium Chlorate (KClO\u2083)",
                "Potassium Bromate (KBrO\u2083)",
                "Potassium Iodate (KIO\u2083)",
                "Copper(II) Sulfate (CuSO\u2084)",
                "Iron(III) Chloride (FeCl\u2083)",
                "Manganese(IV) Oxide (MnO\u2082)",
                "Lead(IV) Oxide (PbO\u2082)",
                "Cerium(IV) Sulfate (Ce(SO\u2084)\u2082)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dinitrogen tetraoxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "thallium(III) nitrate",
                "triplet dioxygen"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Hydrogen Peroxide (H2O2)",
            "Potassium Permanganate (KMnO4)",
            "Sodium Hypochlorite (NaOCl)",
            "Chlorine (Cl2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Nitric Acid (HNO3)",
            "Sulfuric Acid (H2SO4)",
            "Chromic Acid (H2CrO4)",
            "Perchloric Acid (HClO4)",
            "Peracetic Acid (CH3CO3H)",
            "Benzoyl Peroxide (C6H5COO)2",
            "Cumene Hydroperoxide (C6H5C(CH3)2OOH)",
            "Tert-Butyl Hydroperoxide ((CH3)3COOH)",
            "Lead(IV) Acetate (Pb(OAc)4)",
            "Cerium(IV) Sulfate (Ce(SO4)2)",
            "Ferric Chloride (FeCl3)",
            "Copper(II) Chloride (CuCl2)",
            "Silver Nitrate (AgNO3)",
            "Potassium Dichromate (K2Cr2O7)",
            "Sodium Perborate (NaBO3)",
            "Calcium Hypochlorite (Ca(OCl)2)",
            "Lithium Peroxide (Li2O2)",
            "Hydrogen Iodide (HI)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen Peroxide (H2O2)",
                "Chromic Acid (H2CrO4)",
                "Peracetic Acid (CH3CO3H)",
                "Cumene Hydroperoxide (C6H5C(CH3)2OOH)",
                "Tert-Butyl Hydroperoxide ((CH3)3COOH)",
                "Potassium Dichromate (K2Cr2O7)"
            ],
            "mismatches": [
                "Potassium Permanganate (KMnO4)",
                "Sodium Hypochlorite (NaOCl)",
                "Chlorine (Cl2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Nitric Acid (HNO3)",
                "Sulfuric Acid (H2SO4)",
                "Perchloric Acid (HClO4)",
                "Benzoyl Peroxide (C6H5COO)2",
                "Lead(IV) Acetate (Pb(OAc)4)",
                "Cerium(IV) Sulfate (Ce(SO4)2)",
                "Ferric Chloride (FeCl3)",
                "Copper(II) Chloride (CuCl2)",
                "Silver Nitrate (AgNO3)",
                "Sodium Perborate (NaBO3)",
                "Calcium Hypochlorite (Ca(OCl)2)",
                "Lithium Peroxide (Li2O2)",
                "Hydrogen Iodide (HI)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "cumene hydroperoxide",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "lead tetraacetate",
                "lithium nitrate",
                "nitrosoperoxycarbonic acid",
                "ozone",
                "peracetic acid",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "sodium periodate",
                "tert-butyl hydroperoxide",
                "thallium(III) nitrate"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxidizing agent (Oxidizing agent)",
            "Chlorine gas (Cl2)",
            "Nitric acid (HNO3)",
            "Ozone (O3)",
            "Potassium permanganate (KMnO4)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Chromium trioxide (CrO3)",
            "Manganese dioxide (MnO2)",
            "Oxygen (O2)",
            "Ferric chloride (FeCl3)",
            "Potassium dichromate (K2Cr2O7)",
            "Chlorine dioxide (ClO2)",
            "Benzoyl peroxide (BzO2)",
            "Hydrogen peroxide (H2O2)",
            "Ferrous sulfate (FeSO4)",
            "Cerium(IV) oxide (CeO2)",
            "Silver oxide (Ag2O)",
            "Manganese(IV) oxide (MnO4)",
            "Chromium(VI) oxide (CrO3)",
            "Bromine water (Br2/H2O)",
            "Iodine monochloride (ICl)",
            "Chlorine trifluoride (ClF3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ozone",
                "Potassium dichromate",
                "Hydrogen peroxide"
            ],
            "mismatches": [
                "Oxidizing agent (Oxidizing agent)",
                "Chlorine gas (Cl2)",
                "Nitric acid (HNO3)",
                "Potassium permanganate (KMnO4)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Chromium trioxide (CrO3)",
                "Manganese dioxide (MnO2)",
                "Oxygen (O2)",
                "Ferric chloride (FeCl3)",
                "Chlorine dioxide (ClO2)",
                "Benzoyl peroxide (BzO2)",
                "Ferrous sulfate (FeSO4)",
                "Cerium(IV) oxide (CeO2)",
                "Silver oxide (Ag2O)",
                "Manganese(IV) oxide (MnO4)",
                "Chromium(VI) oxide (CrO3)",
                "Bromine water (Br2/H2O)",
                "Iodine monochloride (ICl)",
                "Chlorine trifluoride (ClF3)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "diethyl peroxide",
                "dimethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "nitrosoperoxycarbonic acid",
                "organic peroxide",
                "osmium tetroxide",
                "ozone",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "trichloroacetaldehyde",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            "Oxidizing agent (OA)",
            "Chlorine (Cl2)",
            "Oxygen (O2)",
            "Bromine (Br2)",
            "Iodine (I2)",
            "Fluorine (F2)",
            "Chlorine dioxide (ClO2)",
            "Ozone (O3)",
            "Hydrogen peroxide (H2O2)",
            "Manganese dioxide (MnO2)",
            "Potassium permanganate (KMnO4)",
            "Sodium dichromate (Na2Cr2O7)",
            "Chromic acid (H2CrO4)",
            "Chromium trioxide (CrO3)",
            "Ferric chloride (FeCl3)",
            "Cerium(IV) sulfate (Ce(SO4)2)",
            "Lead dioxide (PbO2)",
            "Silver oxide (Ag2O)",
            "Barium peroxide (BaO2)",
            "Strontium peroxide (SrO2)",
            "Copper(II) oxide (CuO)",
            "Nickel oxide (NiO)",
            "Manganese(III) acetate (Mn(CH3COO)3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ozone",
                "Hydrogen peroxide",
                "Chromic acid"
            ],
            "mismatches": [
                "Oxidizing agent (OA)",
                "Chlorine (Cl2)",
                "Oxygen (O2)",
                "Bromine (Br2)",
                "Iodine (I2)",
                "Fluorine (F2)",
                "Chlorine dioxide (ClO2)",
                "Manganese dioxide (MnO2)",
                "Potassium permanganate (KMnO4)",
                "Sodium dichromate (Na2Cr2O7)",
                "Chromium trioxide (CrO3)",
                "Ferric chloride (FeCl3)",
                "Cerium(IV) sulfate (Ce(SO4)2)",
                "Lead dioxide (PbO2)",
                "Silver oxide (Ag2O)",
                "Barium peroxide (BaO2)",
                "Strontium peroxide (SrO2)",
                "Copper(II) oxide (CuO)",
                "Nickel oxide (NiO)",
                "Manganese(III) acetate (Mn(CH3COO)3)"
            ],
            "true_referents": [
                "FINO2",
                "ammonium nitrate",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "diethyl peroxide",
                "dioxygen",
                "fluoroacetaldehyde",
                "formylmethyl",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "inorganic peroxide",
                "lead tetraacetate",
                "osmium tetroxide",
                "ozone",
                "peracetic acid",
                "peroxides",
                "potassium chromate",
                "potassium dichromate",
                "pyridinium dichromate",
                "sodium bromate",
                "sodium chlorite",
                "sodium chromate",
                "triplet dioxygen"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "oxidant",
        "domain": "chemistry",
        "response": [
            [
                "Canonical name",
                "H2O2"
            ],
            [
                "Canonical name",
                "KMnO4"
            ],
            [
                "Canonical name",
                "O2"
            ],
            [
                "Canonical name",
                "NaClO2"
            ],
            [
                "Canonical name",
                "Fe2+"
            ],
            [
                "Canonical name",
                "Cu2+"
            ],
            [
                "Canonical name",
                "Cl2"
            ],
            [
                "Canonical name",
                "ClO2"
            ],
            [
                "Canonical name",
                "H2SO4"
            ],
            [
                "Canonical name",
                "H2O"
            ],
            [
                "Canonical name",
                "NaOH"
            ],
            [
                "Canonical name",
                "HCl"
            ],
            [
                "Canonical name",
                "HNO3"
            ],
            [
                "Canonical name",
                "H2"
            ],
            [
                "Canonical name",
                "F2"
            ],
            [
                "Canonical name",
                "O3"
            ],
            [
                "Canonical name",
                "Br2"
            ],
            [
                "Canonical name",
                "I2"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "H2O2",
                "O2",
                "NaClO2",
                "O3"
            ],
            "mismatches": [
                "KMnO4",
                "Fe2+",
                "Cu2+",
                "Cl2",
                "ClO2",
                "H2SO4",
                "H2O",
                "NaOH",
                "HCl",
                "HNO3",
                "H2",
                "F2",
                "Br2",
                "I2"
            ],
            "true_referents": [
                "(methylsulfanyl)acetaldehyde",
                "FINO2",
                "LSM-5859",
                "acetaldehyde (E)-hydrazone",
                "ammonium persulfate",
                "chlorine peroxide",
                "chloroacetaldehyde",
                "chromate(2-)",
                "chromic acid",
                "chromyl dichloride",
                "dioxygen",
                "fluoroacetaldehyde",
                "formylmethyl",
                "hydrogen peroxide",
                "hypothiocyanous acid",
                "ozone",
                "potassium chromate",
                "potassium dichromate",
                "prostaglandin H2",
                "sodium chlorite",
                "triplet dioxygen"
            ],
            "TP": 4,
            "FP": 14,
            "FN": 0
        }
    }
]