[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "superoxide anion (O2\u2022-)",
            "hydroxyl radical (\u2022OH)",
            "nitric oxide (NO\u2022)",
            "peroxynitrite anion (ONOO\u2022-)",
            "hypochlorous acid anion (HOCl\u2022-)",
            "singlet oxygen anion (1\u0394gO2\u2022-)",
            "methyl radical (\u2022CH3)",
            "ferryl ion (Fe4+=O\u2022-)",
            "chloramine anion (NH2Cl\u2022-)",
            "peroxyl radical (ROO\u2022-)",
            "alkoxyl radical (RO\u2022-)",
            "carbon-centered radical (\u2022CH2-)",
            "nitroxide anion (RNO\u2022-)",
            "hydroperoxyl radical (HO2\u2022-)",
            "thiyl radical (RS\u2022-)",
            "benzyl radical (\u2022C6H5CH2-)",
            "alkenyl radical (\u2022CH=CH2-)",
            "alkynyl radical (\u2022C\u2261CH-)",
            "phenoxyl radical (C6H5O\u2022-)",
            "semiquinone anion (ArO\u2022-)",
            "fatty acid radical (RCH=CHCOO\u2022-)",
            "carbonyl radical (RCO\u2022-)",
            "alkyl nitrite anion (RONO\u2022-)",
            "thiocarbonyl radical (RCS\u2022-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "superoxide anion (O2\u2022-)",
                "hydroxyl radical (\u2022OH)",
                "nitric oxide (NO\u2022)",
                "peroxynitrite anion (ONOO\u2022-)",
                "hypochlorous acid anion (HOCl\u2022-)",
                "singlet oxygen anion (1\u0394gO2\u2022-)",
                "methyl radical (\u2022CH3)",
                "ferryl ion (Fe4+=O\u2022-)",
                "chloramine anion (NH2Cl\u2022-)",
                "peroxyl radical (ROO\u2022-)",
                "alkoxyl radical (RO\u2022-)",
                "carbon-centered radical (\u2022CH2-)",
                "nitroxide anion (RNO\u2022-)",
                "hydroperoxyl radical (HO2\u2022-)",
                "thiyl radical (RS\u2022-)",
                "benzyl radical (\u2022C6H5CH2-)",
                "alkenyl radical (\u2022CH=CH2-)",
                "alkynyl radical (\u2022C\u2261CH-)",
                "phenoxyl radical (C6H5O\u2022-)",
                "semiquinone anion (ArO\u2022-)",
                "fatty acid radical (RCH=CHCOO\u2022-)",
                "carbonyl radical (RCO\u2022-)",
                "alkyl nitrite anion (RONO\u2022-)",
                "thiocarbonyl radical (RCS\u2022-)"
            ],
            "mismatches": [],
            "true_referents": [
                "alkenyl radical (\u2022CH=CH2-)",
                "alkoxyl radical (RO\u2022-)",
                "alkyl nitrite anion (RONO\u2022-)",
                "alkynyl radical (\u2022C\u2261CH-)",
                "benzyl radical (\u2022C6H5CH2-)",
                "carbon-centered radical (\u2022CH2-)",
                "carbonyl radical (RCO\u2022-)",
                "chloramine anion (NH2Cl\u2022-)",
                "fatty acid radical (RCH=CHCOO\u2022-)",
                "ferryl ion (Fe4+=O\u2022-)",
                "hydroperoxyl radical (HO2\u2022-)",
                "hydroxyl radical (\u2022OH)",
                "hypochlorous acid anion (HOCl\u2022-)",
                "methyl radical (\u2022CH3)",
                "nitric oxide (NO\u2022)",
                "nitroxide anion (RNO\u2022-)",
                "peroxyl radical (ROO\u2022-)",
                "peroxynitrite anion (ONOO\u2022-)",
                "phenoxyl radical (C6H5O\u2022-)",
                "semiquinone anion (ArO\u2022-)",
                "singlet oxygen anion (1\u0394gO2\u2022-)",
                "superoxide anion (O2\u2022-)",
                "thiocarbonyl radical (RCS\u2022-)",
                "thiyl radical (RS\u2022-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O2\u2022\u2212)",
            "Hydroxyl radical (\u2022OH)",
            "Peroxyl radical anion (ROO\u2022\u2212)",
            "Alkoxyl radical anion (RO\u2022\u2212)",
            "Nitrite radical anion (NO2\u2022\u2212)",
            "Nitrate radical anion (NO3\u2022\u2212)",
            "Azide radical anion (N3\u2022\u2212)",
            "Cyanide radical anion (CN\u2022\u2212)",
            "Thiolate anion (RS\u2022\u2212)",
            "Phenolate anion (PhO\u2022\u2212)",
            "Carboxylate radical anion (RCOO\u2022\u2212)",
            "Acetate radical anion (CH3COO\u2022\u2212)",
            "Formate radical anion (HCOO\u2022\u2212)",
            "Thiocyanate radical anion (SCN\u2022\u2212)",
            "Bromide radical anion (Br\u2022\u2212)",
            "Iodide radical anion (I\u2022\u2212)",
            "Chloride radical anion (Cl\u2022\u2212)",
            "Fluoride radical anion (F\u2022\u2212)",
            "Methyl radical anion (CH3\u2022\u2212)",
            "Ethyl radical anion (C2H5\u2022\u2212)",
            "Propyl radical anion (C3H7\u2022\u2212)",
            "Butyl radical anion (C4H9\u2022\u2212)",
            "Phenyl radical anion (Ph\u2022\u2212)",
            "Vinyl radical anion (CH2=CH\u2022\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O2\u2022\u2212)",
                "Hydroxyl radical (\u2022OH)",
                "Peroxyl radical anion (ROO\u2022\u2212)",
                "Alkoxyl radical anion (RO\u2022\u2212)",
                "Nitrite radical anion (NO2\u2022\u2212)",
                "Nitrate radical anion (NO3\u2022\u2212)",
                "Azide radical anion (N3\u2022\u2212)",
                "Cyanide radical anion (CN\u2022\u2212)",
                "Thiolate anion (RS\u2022\u2212)",
                "Phenolate anion (PhO\u2022\u2212)",
                "Carboxylate radical anion (RCOO\u2022\u2212)",
                "Acetate radical anion (CH3COO\u2022\u2212)",
                "Formate radical anion (HCOO\u2022\u2212)",
                "Thiocyanate radical anion (SCN\u2022\u2212)",
                "Bromide radical anion (Br\u2022\u2212)",
                "Iodide radical anion (I\u2022\u2212)",
                "Chloride radical anion (Cl\u2022\u2212)",
                "Fluoride radical anion (F\u2022\u2212)",
                "Methyl radical anion (CH3\u2022\u2212)",
                "Ethyl radical anion (C2H5\u2022\u2212)",
                "Propyl radical anion (C3H7\u2022\u2212)",
                "Butyl radical anion (C4H9\u2022\u2212)",
                "Phenyl radical anion (Ph\u2022\u2212)",
                "Vinyl radical anion (CH2=CH\u2022\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate radical anion (CH3COO\u2022\u2212)",
                "Alkoxyl radical anion (RO\u2022\u2212)",
                "Azide radical anion (N3\u2022\u2212)",
                "Bromide radical anion (Br\u2022\u2212)",
                "Butyl radical anion (C4H9\u2022\u2212)",
                "Carboxylate radical anion (RCOO\u2022\u2212)",
                "Chloride radical anion (Cl\u2022\u2212)",
                "Cyanide radical anion (CN\u2022\u2212)",
                "Ethyl radical anion (C2H5\u2022\u2212)",
                "Fluoride radical anion (F\u2022\u2212)",
                "Formate radical anion (HCOO\u2022\u2212)",
                "Hydroxyl radical (\u2022OH)",
                "Iodide radical anion (I\u2022\u2212)",
                "Methyl radical anion (CH3\u2022\u2212)",
                "Nitrate radical anion (NO3\u2022\u2212)",
                "Nitrite radical anion (NO2\u2022\u2212)",
                "Peroxyl radical anion (ROO\u2022\u2212)",
                "Phenolate anion (PhO\u2022\u2212)",
                "Phenyl radical anion (Ph\u2022\u2212)",
                "Propyl radical anion (C3H7\u2022\u2212)",
                "Superoxide anion (O2\u2022\u2212)",
                "Thiocyanate radical anion (SCN\u2022\u2212)",
                "Thiolate anion (RS\u2022\u2212)",
                "Vinyl radical anion (CH2=CH\u2022\u2212)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O2\u2212)",
            "Hydroxyl radical (\u00b7OH)",
            "Nitric oxide (NO)",
            "Nitric oxide anion (NO\u2212)",
            "Hydroperoxyl radical (HOO\u00b7)",
            "Peroxyl radical (ROO\u00b7)",
            "Alkoxy radical (RO\u00b7)",
            "Carbon-centered radical (R\u00b7)",
            "Sulfur-centered radical (RS\u00b7)",
            "Oxygen-centered radical (RO\u00b7)",
            "Thiyl radical (RS\u00b7)",
            "Carbonate radical (CO3\u2212\u00b7)",
            "Sulfate radical (SO4\u2212\u00b7)",
            "Peroxynitrite anion (ONOO\u2212)",
            "Thiyl radical anion (RS\u2212)",
            "Azide radical (N3\u00b7)",
            "Thiocyanate radical (SCN\u00b7)",
            "Cyanide radical (CN\u00b7)",
            "Nitrite radical (NO2\u00b7)",
            "Nitrate radical (NO3\u00b7)",
            "Cyanate radical (OCN\u00b7)",
            "Chlorine dioxide radical (ClO2\u00b7)",
            "Bromine dioxide radical (BrO2\u00b7)",
            "Iodine dioxide radical (IO2\u00b7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O2\u2212)",
                "Hydroxyl radical (\u00b7OH)",
                "Nitric oxide (NO)",
                "Nitric oxide anion (NO\u2212)",
                "Hydroperoxyl radical (HOO\u00b7)",
                "Peroxyl radical (ROO\u00b7)",
                "Alkoxy radical (RO\u00b7)",
                "Carbon-centered radical (R\u00b7)",
                "Sulfur-centered radical (RS\u00b7)",
                "Oxygen-centered radical (RO\u00b7)",
                "Thiyl radical (RS\u00b7)",
                "Carbonate radical (CO3\u2212\u00b7)",
                "Sulfate radical (SO4\u2212\u00b7)",
                "Peroxynitrite anion (ONOO\u2212)",
                "Thiyl radical anion (RS\u2212)",
                "Azide radical (N3\u00b7)",
                "Thiocyanate radical (SCN\u00b7)",
                "Cyanide radical (CN\u00b7)",
                "Nitrite radical (NO2\u00b7)",
                "Nitrate radical (NO3\u00b7)",
                "Cyanate radical (OCN\u00b7)",
                "Chlorine dioxide radical (ClO2\u00b7)",
                "Bromine dioxide radical (BrO2\u00b7)",
                "Iodine dioxide radical (IO2\u00b7)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxy radical (RO\u00b7)",
                "Azide radical (N3\u00b7)",
                "Bromine dioxide radical (BrO2\u00b7)",
                "Carbon-centered radical (R\u00b7)",
                "Carbonate radical (CO3\u2212\u00b7)",
                "Chlorine dioxide radical (ClO2\u00b7)",
                "Cyanate radical (OCN\u00b7)",
                "Cyanide radical (CN\u00b7)",
                "Hydroperoxyl radical (HOO\u00b7)",
                "Hydroxyl radical (\u00b7OH)",
                "Iodine dioxide radical (IO2\u00b7)",
                "Nitrate radical (NO3\u00b7)",
                "Nitric oxide (NO)",
                "Nitric oxide anion (NO\u2212)",
                "Nitrite radical (NO2\u00b7)",
                "Oxygen-centered radical (RO\u00b7)",
                "Peroxyl radical (ROO\u00b7)",
                "Peroxynitrite anion (ONOO\u2212)",
                "Sulfate radical (SO4\u2212\u00b7)",
                "Sulfur-centered radical (RS\u00b7)",
                "Superoxide anion (O2\u2212)",
                "Thiocyanate radical (SCN\u00b7)",
                "Thiyl radical (RS\u00b7)",
                "Thiyl radical anion (RS\u2212)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide radical anion (O\u2082\u207b\u2022)",
            "Hydroxyl radical (\u2022OH)",
            "Glutathione radical anion (GS\u207b\u2022)",
            "Semiquinone radical anion (Q\u207b\u2022)",
            "Nitric oxide radical (NO\u2022)",
            "Peroxyl radical (ROO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Carbonate radical anion (CO\u2083\u207b\u2022)",
            "Nitrite radical anion (NO\u2082\u207b\u2022)",
            "Cyanide radical anion (CN\u207b\u2022)",
            "Thiyl radical (RS\u2022)",
            "Phenoxyl radical (ArO\u2022)",
            "Methyl radical (CH\u2083\u2022)",
            "Ethyl radical (C\u2082H\u2085\u2022)",
            "Propyl radical (C\u2083H\u2087\u2022)",
            "Formyl radical (HCO\u2022)",
            "Acetyl radical (CH\u2083CO\u2022)",
            "Vinyl radical (CH\u2082=CH\u2022)",
            "Allyl radical (CH\u2082=CH-CH\u2082\u2022)",
            "Hydride ion (H\u207b)",
            "Fluoride ion (F\u207b)",
            "Chloride ion (Cl\u207b)",
            "Bromide ion (Br\u207b)",
            "Iodide ion (I\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide radical anion (O\u2082\u207b\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Glutathione radical anion (GS\u207b\u2022)",
                "Semiquinone radical anion (Q\u207b\u2022)",
                "Nitric oxide radical (NO\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Carbonate radical anion (CO\u2083\u207b\u2022)",
                "Nitrite radical anion (NO\u2082\u207b\u2022)",
                "Cyanide radical anion (CN\u207b\u2022)",
                "Thiyl radical (RS\u2022)",
                "Phenoxyl radical (ArO\u2022)",
                "Methyl radical (CH\u2083\u2022)",
                "Ethyl radical (C\u2082H\u2085\u2022)",
                "Propyl radical (C\u2083H\u2087\u2022)",
                "Formyl radical (HCO\u2022)",
                "Acetyl radical (CH\u2083CO\u2022)",
                "Vinyl radical (CH\u2082=CH\u2022)",
                "Allyl radical (CH\u2082=CH-CH\u2082\u2022)",
                "Hydride ion (H\u207b)",
                "Fluoride ion (F\u207b)",
                "Chloride ion (Cl\u207b)",
                "Bromide ion (Br\u207b)",
                "Iodide ion (I\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl radical (CH\u2083CO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Allyl radical (CH\u2082=CH-CH\u2082\u2022)",
                "Bromide ion (Br\u207b)",
                "Carbonate radical anion (CO\u2083\u207b\u2022)",
                "Chloride ion (Cl\u207b)",
                "Cyanide radical anion (CN\u207b\u2022)",
                "Ethyl radical (C\u2082H\u2085\u2022)",
                "Fluoride ion (F\u207b)",
                "Formyl radical (HCO\u2022)",
                "Glutathione radical anion (GS\u207b\u2022)",
                "Hydride ion (H\u207b)",
                "Hydroxyl radical (\u2022OH)",
                "Iodide ion (I\u207b)",
                "Methyl radical (CH\u2083\u2022)",
                "Nitric oxide radical (NO\u2022)",
                "Nitrite radical anion (NO\u2082\u207b\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Phenoxyl radical (ArO\u2022)",
                "Propyl radical (C\u2083H\u2087\u2022)",
                "Semiquinone radical anion (Q\u207b\u2022)",
                "Superoxide radical anion (O\u2082\u207b\u2022)",
                "Thiyl radical (RS\u2022)",
                "Vinyl radical (CH\u2082=CH\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2-)",
            "Nitric oxide anion (NO-)",
            "Hydroxyl radical anion (OH-)",
            "Chlorine dioxide anion (ClO2-)",
            "Peroxide anion (O2^2-)",
            "Thiyl radical anion (RS-)",
            "Phenolate radical anion (C6H5O-)",
            "Nitrogen dioxide anion (NO2-)",
            "Carbonate radical anion (CO3-)",
            "Hydrogen peroxide radical anion (HO2-)",
            "Acetate radical anion (CH3COO-)",
            "Sulfate radical anion (SO4-)",
            "Nitrate radical anion (NO3-)",
            "Peroxymonosulfate radical anion (HSO5-)",
            "Azide radical anion (N3-)",
            "Iodate radical anion (IO3-)",
            "Bromate radical anion (BrO3-)",
            "Chlorate radical anion (ClO3-)",
            "Formate radical anion (HCOO-)",
            "Cyanide radical anion (CN-)",
            "Bisulfite radical anion (HSO3-)",
            "Thiocyanate radical anion (SCN-)",
            "Hypochlorite radical anion (OCl-)",
            "Perchlorate radical anion (ClO4-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2-)",
                "Nitric oxide anion (NO-)",
                "Hydroxyl radical anion (OH-)",
                "Chlorine dioxide anion (ClO2-)",
                "Peroxide anion (O2^2-)",
                "Thiyl radical anion (RS-)",
                "Phenolate radical anion (C6H5O-)",
                "Nitrogen dioxide anion (NO2-)",
                "Carbonate radical anion (CO3-)",
                "Hydrogen peroxide radical anion (HO2-)",
                "Acetate radical anion (CH3COO-)",
                "Sulfate radical anion (SO4-)",
                "Nitrate radical anion (NO3-)",
                "Peroxymonosulfate radical anion (HSO5-)",
                "Azide radical anion (N3-)",
                "Iodate radical anion (IO3-)",
                "Bromate radical anion (BrO3-)",
                "Chlorate radical anion (ClO3-)",
                "Formate radical anion (HCOO-)",
                "Cyanide radical anion (CN-)",
                "Bisulfite radical anion (HSO3-)",
                "Thiocyanate radical anion (SCN-)",
                "Hypochlorite radical anion (OCl-)",
                "Perchlorate radical anion (ClO4-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate radical anion (CH3COO-)",
                "Azide radical anion (N3-)",
                "Bisulfite radical anion (HSO3-)",
                "Bromate radical anion (BrO3-)",
                "Carbonate radical anion (CO3-)",
                "Chlorate radical anion (ClO3-)",
                "Chlorine dioxide anion (ClO2-)",
                "Cyanide radical anion (CN-)",
                "Formate radical anion (HCOO-)",
                "Hydrogen peroxide radical anion (HO2-)",
                "Hydroxyl radical anion (OH-)",
                "Hypochlorite radical anion (OCl-)",
                "Iodate radical anion (IO3-)",
                "Nitrate radical anion (NO3-)",
                "Nitric oxide anion (NO-)",
                "Nitrogen dioxide anion (NO2-)",
                "Perchlorate radical anion (ClO4-)",
                "Peroxide anion (O2^2-)",
                "Peroxymonosulfate radical anion (HSO5-)",
                "Phenolate radical anion (C6H5O-)",
                "Sulfate radical anion (SO4-)",
                "Superoxide (O2-)",
                "Thiocyanate radical anion (SCN-)",
                "Thiyl radical anion (RS-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2-)",
            "Hydroxyl radical (\u2022OH)",
            "Alkyl radical (R\u2022)",
            "Nitric oxide (NO)",
            "Peroxyl radical (ROO\u2022)",
            "Aldehyde radical (RCHO\u2022)",
            "Phenoxyl radical (C6H5O\u2022)",
            "Carboxyl radical (RCOO\u2022)",
            "Thiyl radical (RS\u2022)",
            "Chloride ion (Cl-)",
            "Bromide ion (Br-)",
            "Iodide ion (I-)",
            "Sulfide radical (RS\u2022)",
            "Carbonate radical (CO3\u2022-)",
            "Nitrite radical (NO2\u2022-)",
            "Acetate radical (CH3COO\u2022)",
            "Methyl radical (CH3\u2022)",
            "Ethyl radical (C2H5\u2022)",
            "Vinyl radical (C2H3\u2022)",
            "Cyclopropyl radical (C3H5\u2022)",
            "Triphenylmethyl radical (C19H15\u2022)",
            "Dichloromethyl radical (CCl2H\u2022)",
            "Selenoate radical (RSe\u2022)",
            "Phosphoranyl radical (R3P\u2022)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2-)",
                "Hydroxyl radical (\u2022OH)",
                "Alkyl radical (R\u2022)",
                "Nitric oxide (NO)",
                "Peroxyl radical (ROO\u2022)",
                "Aldehyde radical (RCHO\u2022)",
                "Phenoxyl radical (C6H5O\u2022)",
                "Carboxyl radical (RCOO\u2022)",
                "Thiyl radical (RS\u2022)",
                "Chloride ion (Cl-)",
                "Bromide ion (Br-)",
                "Iodide ion (I-)",
                "Sulfide radical (RS\u2022)",
                "Carbonate radical (CO3\u2022-)",
                "Nitrite radical (NO2\u2022-)",
                "Acetate radical (CH3COO\u2022)",
                "Methyl radical (CH3\u2022)",
                "Ethyl radical (C2H5\u2022)",
                "Vinyl radical (C2H3\u2022)",
                "Cyclopropyl radical (C3H5\u2022)",
                "Triphenylmethyl radical (C19H15\u2022)",
                "Dichloromethyl radical (CCl2H\u2022)",
                "Selenoate radical (RSe\u2022)",
                "Phosphoranyl radical (R3P\u2022)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate radical (CH3COO\u2022)",
                "Aldehyde radical (RCHO\u2022)",
                "Alkyl radical (R\u2022)",
                "Bromide ion (Br-)",
                "Carbonate radical (CO3\u2022-)",
                "Carboxyl radical (RCOO\u2022)",
                "Chloride ion (Cl-)",
                "Cyclopropyl radical (C3H5\u2022)",
                "Dichloromethyl radical (CCl2H\u2022)",
                "Ethyl radical (C2H5\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Iodide ion (I-)",
                "Methyl radical (CH3\u2022)",
                "Nitric oxide (NO)",
                "Nitrite radical (NO2\u2022-)",
                "Peroxyl radical (ROO\u2022)",
                "Phenoxyl radical (C6H5O\u2022)",
                "Phosphoranyl radical (R3P\u2022)",
                "Selenoate radical (RSe\u2022)",
                "Sulfide radical (RS\u2022)",
                "Superoxide (O2-)",
                "Thiyl radical (RS\u2022)",
                "Triphenylmethyl radical (C19H15\u2022)",
                "Vinyl radical (C2H3\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide ion (O2-)",
            "Hydroxyl radical (OH-)",
            "Hydroperoxyl (HO2-)",
            "Alkoxide ion (RO-)",
            "Carboxylate ion (RCOO-)",
            "Phenoxide ion (C6H5O-)",
            "Hydrosulfide ion (HS-)",
            "Thiocyanate ion (SCN-)",
            "Nitrate radical (NO3-)",
            "Perchlorate radical (ClO4-)",
            "Nitrite radical (NO2-)",
            "Sulfite radical (SO3-)",
            "Phosphate radical (PO4-)",
            "Carbonate radical (CO3-)",
            "Bicarbonate radical (HCO3-)",
            "Hydrogen peroxide radical (HOO-)",
            "Sulfate radical (SO4-)",
            "Thiosulfate radical (S2O3-)",
            "Hydrogen sulfite radical (HSO3-)",
            "Hydrogen sulfate radical (HSO4-)",
            "Dihydrogen phosphate radical (H2PO4-)",
            "Hydrogen phosphate radical (HPO4-)",
            "Dihydrogen phosphite radical (H2PO3-)",
            "Hydrogen phosphite radical (HPO3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide ion (O2-)",
                "Hydroxyl radical (OH-)",
                "Hydroperoxyl (HO2-)",
                "Alkoxide ion (RO-)",
                "Carboxylate ion (RCOO-)",
                "Phenoxide ion (C6H5O-)",
                "Hydrosulfide ion (HS-)",
                "Thiocyanate ion (SCN-)",
                "Nitrate radical (NO3-)",
                "Perchlorate radical (ClO4-)",
                "Nitrite radical (NO2-)",
                "Sulfite radical (SO3-)",
                "Phosphate radical (PO4-)",
                "Carbonate radical (CO3-)",
                "Bicarbonate radical (HCO3-)",
                "Hydrogen peroxide radical (HOO-)",
                "Sulfate radical (SO4-)",
                "Thiosulfate radical (S2O3-)",
                "Hydrogen sulfite radical (HSO3-)",
                "Hydrogen sulfate radical (HSO4-)",
                "Dihydrogen phosphate radical (H2PO4-)",
                "Hydrogen phosphate radical (HPO4-)",
                "Dihydrogen phosphite radical (H2PO3-)",
                "Hydrogen phosphite radical (HPO3-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxide ion (RO-)",
                "Bicarbonate radical (HCO3-)",
                "Carbonate radical (CO3-)",
                "Carboxylate ion (RCOO-)",
                "Dihydrogen phosphate radical (H2PO4-)",
                "Dihydrogen phosphite radical (H2PO3-)",
                "Hydrogen peroxide radical (HOO-)",
                "Hydrogen phosphate radical (HPO4-)",
                "Hydrogen phosphite radical (HPO3-)",
                "Hydrogen sulfate radical (HSO4-)",
                "Hydrogen sulfite radical (HSO3-)",
                "Hydroperoxyl (HO2-)",
                "Hydrosulfide ion (HS-)",
                "Hydroxyl radical (OH-)",
                "Nitrate radical (NO3-)",
                "Nitrite radical (NO2-)",
                "Perchlorate radical (ClO4-)",
                "Phenoxide ion (C6H5O-)",
                "Phosphate radical (PO4-)",
                "Sulfate radical (SO4-)",
                "Sulfite radical (SO3-)",
                "Superoxide ion (O2-)",
                "Thiocyanate ion (SCN-)",
                "Thiosulfate radical (S2O3-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Nitric oxide (NO)",
            "Superoxide anion (O2-)",
            "Hydroxyl radical (OH)",
            "Peroxynitrite (ONOO-)",
            "Hydrogen peroxide (H2O2)",
            "Ozone (O3)",
            "Sulfur trioxide (SO3)",
            "Sulfuric acid (H2SO4)",
            "Phosphoric acid (H3PO4)",
            "Carbonate ion (CO3^2-)",
            "Sulfate ion (SO4^2-)",
            "Nitrate ion (NO3-)",
            "Phosphate ion (PO4^3-)",
            "Chlorate ion (ClO3-)",
            "Bromate ion (BrO3-)",
            "Iodate ion (IO3-)",
            "Perchlorate ion (ClO4-)",
            "Chromate ion (CrO4^2-)",
            "Dichromate ion (Cr2O7^2-)",
            "Permanganate ion (MnO4-)",
            "Sulfite ion (SO3^2-)",
            "Hyposulfite ion (S2O3^2-)",
            "Thiosulfate ion (S2O3^2-)",
            "Bisulfite ion (HSO3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitric oxide (NO)",
                "Superoxide anion (O2-)",
                "Hydroxyl radical (OH)",
                "Peroxynitrite (ONOO-)",
                "Hydrogen peroxide (H2O2)",
                "Ozone (O3)",
                "Sulfur trioxide (SO3)",
                "Sulfuric acid (H2SO4)",
                "Phosphoric acid (H3PO4)",
                "Carbonate ion (CO3^2-)",
                "Sulfate ion (SO4^2-)",
                "Nitrate ion (NO3-)",
                "Phosphate ion (PO4^3-)",
                "Chlorate ion (ClO3-)",
                "Bromate ion (BrO3-)",
                "Iodate ion (IO3-)",
                "Perchlorate ion (ClO4-)",
                "Chromate ion (CrO4^2-)",
                "Dichromate ion (Cr2O7^2-)",
                "Permanganate ion (MnO4-)",
                "Sulfite ion (SO3^2-)",
                "Thiosulfate ion (S2O3^2-)",
                "Bisulfite ion (HSO3-)"
            ],
            "mismatches": [
                "Hyposulfite ion (S2O3^2-)"
            ],
            "true_referents": [
                "Bisulfite ion (HSO3-)",
                "Bromate ion (BrO3-)",
                "Carbonate ion (CO3^2-)",
                "Chlorate ion (ClO3-)",
                "Chromate ion (CrO4^2-)",
                "Dichromate ion (Cr2O7^2-)",
                "Hydrogen peroxide (H2O2)",
                "Hydroxyl radical (OH)",
                "Hyposulfite ion (S2O3^2-)",
                "Iodate ion (IO3-)",
                "Nitrate ion (NO3-)",
                "Nitric oxide (NO)",
                "Ozone (O3)",
                "Perchlorate ion (ClO4-)",
                "Permanganate ion (MnO4-)",
                "Peroxynitrite (ONOO-)",
                "Phosphate ion (PO4^3-)",
                "Phosphoric acid (H3PO4)",
                "Sulfate ion (SO4^2-)",
                "Sulfite ion (SO3^2-)",
                "Sulfur trioxide (SO3)",
                "Sulfuric acid (H2SO4)",
                "Superoxide anion (O2-)",
                "Thiosulfate ion (S2O3^2-)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O\u2082\u207b)",
            "Hydroxyl radical anion (HO\u2022\u207b)",
            "Nitric oxide radical anion (NO\u207b\u2022)",
            "Azide radical anion (N\u2083\u207b\u2022)",
            "Sulfite radical anion (SO\u2083\u207b\u2022)",
            "Ascorbate radical anion (AscH\u207b\u2022)",
            "Phenoxyl radical anion (PhO\u207b\u2022)",
            "TEMPO radical anion (2,2,6,6-Tetramethylpiperidine 1-oxyl radical)",
            "Benzoate radical anion (C\u2086H\u2085COO\u207b\u2022)",
            "Pyridine radical anion (C\u2085H\u2085N\u207b\u2022)",
            "Thiophenolate radical anion (C\u2084H\u2084S\u207b\u2022)",
            "DPPH radical anion (2,2-diphenyl-1-picrylhydrazyl radical anion)",
            "Naphthoxyl radical anion (C\u2081\u2080H\u2087O\u207b\u2022)",
            "Pyrrole radical anion (C\u2084H\u2085N\u207b\u2022)",
            "Peroxyl radical anion (ROO\u207b\u2022)",
            "Diphenyl radical anion (C\u2081\u2080H\u2088\u207b\u2022)",
            "Glutathione radical anion (GSH\u207b\u2022)",
            "Quinone radical anion (C\u2086H\u2084O\u2082\u207b\u2022)",
            "EPR-detectable solvated electron radical anion",
            "Lithium anthracene radical anion (Li\u207a\u00b7C\u2081\u2084H\u2081\u2080\u207b\u2022)",
            "Anthraquinone radical anion (C\u2081\u2084H\u2088O\u2082\u207b\u2022)",
            "Triphenylmethyl radical anion (Ph\u2083C\u207b\u2022)",
            "Indole radical anion (C\u2088H\u2087N\u207b\u2022)",
            "Carbazole radical anion (C\u2081\u2082H\u2087N\u207b\u2022)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O\u2082\u207b)",
                "Hydroxyl radical anion (HO\u2022\u207b)",
                "Nitric oxide radical anion (NO\u207b\u2022)",
                "Azide radical anion (N\u2083\u207b\u2022)",
                "Sulfite radical anion (SO\u2083\u207b\u2022)",
                "Ascorbate radical anion (AscH\u207b\u2022)",
                "Phenoxyl radical anion (PhO\u207b\u2022)",
                "TEMPO radical anion (2,2,6,6-Tetramethylpiperidine 1-oxyl radical)",
                "Benzoate radical anion (C\u2086H\u2085COO\u207b\u2022)",
                "Pyridine radical anion (C\u2085H\u2085N\u207b\u2022)",
                "Thiophenolate radical anion (C\u2084H\u2084S\u207b\u2022)",
                "DPPH radical anion (2,2-diphenyl-1-picrylhydrazyl radical anion)",
                "Naphthoxyl radical anion (C\u2081\u2080H\u2087O\u207b\u2022)",
                "Pyrrole radical anion (C\u2084H\u2085N\u207b\u2022)",
                "Peroxyl radical anion (ROO\u207b\u2022)",
                "Diphenyl radical anion (C\u2081\u2080H\u2088\u207b\u2022)",
                "Glutathione radical anion (GSH\u207b\u2022)",
                "Quinone radical anion (C\u2086H\u2084O\u2082\u207b\u2022)",
                "EPR-detectable solvated electron radical anion",
                "Lithium anthracene radical anion (Li\u207a\u00b7C\u2081\u2084H\u2081\u2080\u207b\u2022)",
                "Anthraquinone radical anion (C\u2081\u2084H\u2088O\u2082\u207b\u2022)",
                "Triphenylmethyl radical anion (Ph\u2083C\u207b\u2022)",
                "Indole radical anion (C\u2088H\u2087N\u207b\u2022)",
                "Carbazole radical anion (C\u2081\u2082H\u2087N\u207b\u2022)"
            ],
            "mismatches": [],
            "true_referents": [
                "Anthraquinone radical anion (C\u2081\u2084H\u2088O\u2082\u207b\u2022)",
                "Ascorbate radical anion (AscH\u207b\u2022)",
                "Azide radical anion (N\u2083\u207b\u2022)",
                "Benzoate radical anion (C\u2086H\u2085COO\u207b\u2022)",
                "Carbazole radical anion (C\u2081\u2082H\u2087N\u207b\u2022)",
                "DPPH radical anion (2,2-diphenyl-1-picrylhydrazyl radical anion)",
                "Diphenyl radical anion (C\u2081\u2080H\u2088\u207b\u2022)",
                "EPR-detectable solvated electron radical anion",
                "Glutathione radical anion (GSH\u207b\u2022)",
                "Hydroxyl radical anion (HO\u2022\u207b)",
                "Indole radical anion (C\u2088H\u2087N\u207b\u2022)",
                "Lithium anthracene radical anion (Li\u207a\u00b7C\u2081\u2084H\u2081\u2080\u207b\u2022)",
                "Naphthoxyl radical anion (C\u2081\u2080H\u2087O\u207b\u2022)",
                "Nitric oxide radical anion (NO\u207b\u2022)",
                "Peroxyl radical anion (ROO\u207b\u2022)",
                "Phenoxyl radical anion (PhO\u207b\u2022)",
                "Pyridine radical anion (C\u2085H\u2085N\u207b\u2022)",
                "Pyrrole radical anion (C\u2084H\u2085N\u207b\u2022)",
                "Quinone radical anion (C\u2086H\u2084O\u2082\u207b\u2022)",
                "Sulfite radical anion (SO\u2083\u207b\u2022)",
                "Superoxide (O\u2082\u207b)",
                "TEMPO radical anion (2,2,6,6-Tetramethylpiperidine 1-oxyl radical)",
                "Thiophenolate radical anion (C\u2084H\u2084S\u207b\u2022)",
                "Triphenylmethyl radical anion (Ph\u2083C\u207b\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide anion (O2\u2022\u2212)",
            "Hydroxyl radical anion (OH\u2022\u2212)",
            "Nitric oxide anion (NO\u2022\u2212)",
            "Carbonate radical anion (CO3\u2022\u2212)",
            "Sulfite radical anion (SO3\u2022\u2212)",
            "Nitrogen dioxide anion (NO2\u2022\u2212)",
            "Phenoxyl radical anion (C6H5O\u2022\u2212)",
            "Semiquinone radical anion",
            "Ascorbate radical anion",
            "Urate radical anion",
            "Thiyl radical anion (RS\u2022\u2212)",
            "Disulfide radical anion (RSSR\u2022\u2212)",
            "Flavin semiquinone radical anion",
            "Porphyrin \u03c0-radical anion",
            "Fullerene radical anion (C60\u2022\u2212)",
            "Benzene radical anion (C6H6\u2022\u2212)",
            "Naphthalene radical anion (C10H8\u2022\u2212)",
            "Anthracene radical anion (C14H10\u2022\u2212)",
            "Pyrene radical anion (C16H10\u2022\u2212)",
            "Perylene radical anion (C20H12\u2022\u2212)",
            "Coronene radical anion (C24H12\u2022\u2212)",
            "Chlorophyll radical anion"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion (O2\u2022\u2212)",
                "Hydroxyl radical anion (OH\u2022\u2212)",
                "Nitric oxide anion (NO\u2022\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Nitrogen dioxide anion (NO2\u2022\u2212)",
                "Phenoxyl radical anion (C6H5O\u2022\u2212)",
                "Semiquinone radical anion",
                "Ascorbate radical anion",
                "Urate radical anion",
                "Thiyl radical anion (RS\u2022\u2212)",
                "Disulfide radical anion (RSSR\u2022\u2212)",
                "Flavin semiquinone radical anion",
                "Porphyrin \u03c0-radical anion",
                "Fullerene radical anion (C60\u2022\u2212)",
                "Benzene radical anion (C6H6\u2022\u2212)",
                "Naphthalene radical anion (C10H8\u2022\u2212)",
                "Anthracene radical anion (C14H10\u2022\u2212)",
                "Pyrene radical anion (C16H10\u2022\u2212)",
                "Perylene radical anion (C20H12\u2022\u2212)",
                "Coronene radical anion (C24H12\u2022\u2212)"
            ],
            "mismatches": [
                "Chlorophyll radical anion"
            ],
            "true_referents": [
                "Anthracene radical anion (C14H10\u2022\u2212)",
                "Ascorbate radical anion",
                "Benzene radical anion (C6H6\u2022\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Chlorophyll radical anion",
                "Coronene radical anion (C24H12\u2022\u2212)",
                "Disulfide radical anion (RSSR\u2022\u2212)",
                "Flavin semiquinone radical anion",
                "Fullerene radical anion (C60\u2022\u2212)",
                "Hydroxyl radical anion (OH\u2022\u2212)",
                "Naphthalene radical anion (C10H8\u2022\u2212)",
                "Nitric oxide anion (NO\u2022\u2212)",
                "Nitrogen dioxide anion (NO2\u2022\u2212)",
                "Perylene radical anion (C20H12\u2022\u2212)",
                "Phenoxyl radical anion (C6H5O\u2022\u2212)",
                "Porphyrin \u03c0-radical anion",
                "Pyrene radical anion (C16H10\u2022\u2212)",
                "Semiquinone radical anion",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Superoxide anion (O2\u2022\u2212)",
                "Thiyl radical anion (RS\u2022\u2212)",
                "Urate radical anion"
            ],
            "TP": 21,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide anion radical (O2\u2022\u2212)",
            "Hydroxyl radical (\u2022OH)",
            "Hydroperoxyl radical (HO2\u2022)",
            "Nitric oxide (NO\u2022)",
            "Nitrogen dioxide (NO2\u2022)",
            "Carbonate radical anion (CO3\u2022\u2212)",
            "Sulfite radical anion (SO3\u2022\u2212)",
            "Thiosulfate radical anion (S2O3\u2022\u2212)",
            "Peroxyl radical (ROO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Semiquinone radical anion (Q\u2022\u2212)",
            "Chlorine dioxide radical anion (ClO2\u2022\u2212)",
            "Bromine dioxide radical anion (BrO2\u2022\u2212)",
            "Iodine dioxide radical anion (IO2\u2022\u2212)",
            "Thiyl radical (RS\u2022)",
            "Disulfide radical anion (RSSR\u2022\u2212)",
            "Perthiyl radical (RSS\u2022)",
            "Nitroxyl radical (HNO\u2022)",
            "Azidyl radical (N3\u2022)",
            "Cyanate radical anion (OCN\u2022\u2212)",
            "Thiocyanate radical anion (SCN\u2022\u2212)",
            "Selenocyanate radical anion (SeCN\u2022\u2212)",
            "Tellurocyanate radical anion (TeCN\u2022\u2212)",
            "Cyanomethyl radical anion (\u2022CH2CN\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide anion radical (O2\u2022\u2212)",
                "Hydroxyl radical (\u2022OH)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Nitric oxide (NO\u2022)",
                "Nitrogen dioxide (NO2\u2022)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Thiosulfate radical anion (S2O3\u2022\u2212)",
                "Peroxyl radical (ROO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Semiquinone radical anion (Q\u2022\u2212)",
                "Chlorine dioxide radical anion (ClO2\u2022\u2212)",
                "Bromine dioxide radical anion (BrO2\u2022\u2212)",
                "Iodine dioxide radical anion (IO2\u2022\u2212)",
                "Thiyl radical (RS\u2022)",
                "Disulfide radical anion (RSSR\u2022\u2212)",
                "Perthiyl radical (RSS\u2022)",
                "Nitroxyl radical (HNO\u2022)",
                "Azidyl radical (N3\u2022)",
                "Cyanate radical anion (OCN\u2022\u2212)",
                "Thiocyanate radical anion (SCN\u2022\u2212)",
                "Selenocyanate radical anion (SeCN\u2022\u2212)",
                "Tellurocyanate radical anion (TeCN\u2022\u2212)",
                "Cyanomethyl radical anion (\u2022CH2CN\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxyl radical (RO\u2022)",
                "Azidyl radical (N3\u2022)",
                "Bromine dioxide radical anion (BrO2\u2022\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Chlorine dioxide radical anion (ClO2\u2022\u2212)",
                "Cyanate radical anion (OCN\u2022\u2212)",
                "Cyanomethyl radical anion (\u2022CH2CN\u2212)",
                "Disulfide radical anion (RSSR\u2022\u2212)",
                "Hydroperoxyl radical (HO2\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Iodine dioxide radical anion (IO2\u2022\u2212)",
                "Nitric oxide (NO\u2022)",
                "Nitrogen dioxide (NO2\u2022)",
                "Nitroxyl radical (HNO\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Perthiyl radical (RSS\u2022)",
                "Selenocyanate radical anion (SeCN\u2022\u2212)",
                "Semiquinone radical anion (Q\u2022\u2212)",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Superoxide anion radical (O2\u2022\u2212)",
                "Tellurocyanate radical anion (TeCN\u2022\u2212)",
                "Thiocyanate radical anion (SCN\u2022\u2212)",
                "Thiosulfate radical anion (S2O3\u2022\u2212)",
                "Thiyl radical (RS\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "superoxide radical (O2\u2022\u2212)",
            "hydroxyl radical (\u2022OH)",
            "nitric oxide (NO\u2022)",
            "nitrogen dioxide (NO2\u2022)",
            "peroxyl radical (ROO\u2022)",
            "alkoxyl radical (RO\u2022)",
            "hydroperoxyl radical (HO2\u2022)",
            "carbonate radical anion (CO3\u2022\u2212)",
            "trichloromethylperoxyl radical (CCl3OO\u2022)",
            "tert-butoxyl radical ((CH3)3CO\u2022)",
            "benzyl radical (C6H5CH2\u2022)",
            "methyl radical (\u2022CH3)",
            "ethyl radical (\u2022CH2CH3)",
            "isopropyl radical ((CH3)2CH\u2022)",
            "tert-butyl radical ((CH3)3C\u2022)",
            "phenyl radical (C6H5\u2022)",
            "cyclohexadienyl radical (C6H7\u2022)",
            "allyl radical (CH2=CHCH2\u2022)",
            "propargyl radical (HC\u2261CCH2\u2022)",
            "semiquinone radical anion (Q\u2022\u2212)",
            "galvinoxyl radical ((C6H4)2NO\u2022)",
            "TEMPO radical ((CH3)3C6H9NO\u2022)",
            "DPPH radical (C6H5N=NC6H4NO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "superoxide radical (O2\u2022\u2212)",
                "hydroxyl radical (\u2022OH)",
                "nitric oxide (NO\u2022)",
                "nitrogen dioxide (NO2\u2022)",
                "peroxyl radical (ROO\u2022)",
                "alkoxyl radical (RO\u2022)",
                "hydroperoxyl radical (HO2\u2022)",
                "carbonate radical anion (CO3\u2022\u2212)",
                "trichloromethylperoxyl radical (CCl3OO\u2022)",
                "tert-butoxyl radical ((CH3)3CO\u2022)",
                "benzyl radical (C6H5CH2\u2022)",
                "methyl radical (\u2022CH3)",
                "ethyl radical (\u2022CH2CH3)",
                "isopropyl radical ((CH3)2CH\u2022)",
                "tert-butyl radical ((CH3)3C\u2022)",
                "phenyl radical (C6H5\u2022)",
                "cyclohexadienyl radical (C6H7\u2022)",
                "allyl radical (CH2=CHCH2\u2022)",
                "propargyl radical (HC\u2261CCH2\u2022)",
                "semiquinone radical anion (Q\u2022\u2212)",
                "galvinoxyl radical ((C6H4)2NO\u2022)",
                "TEMPO radical ((CH3)3C6H9NO\u2022)",
                "DPPH radical (C6H5N=NC6H4NO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "DPPH radical (C6H5N=NC6H4NO2)",
                "TEMPO radical ((CH3)3C6H9NO\u2022)",
                "alkoxyl radical (RO\u2022)",
                "allyl radical (CH2=CHCH2\u2022)",
                "benzyl radical (C6H5CH2\u2022)",
                "carbonate radical anion (CO3\u2022\u2212)",
                "cyclohexadienyl radical (C6H7\u2022)",
                "ethyl radical (\u2022CH2CH3)",
                "galvinoxyl radical ((C6H4)2NO\u2022)",
                "hydroperoxyl radical (HO2\u2022)",
                "hydroxyl radical (\u2022OH)",
                "isopropyl radical ((CH3)2CH\u2022)",
                "methyl radical (\u2022CH3)",
                "nitric oxide (NO\u2022)",
                "nitrogen dioxide (NO2\u2022)",
                "peroxyl radical (ROO\u2022)",
                "phenyl radical (C6H5\u2022)",
                "propargyl radical (HC\u2261CCH2\u2022)",
                "semiquinone radical anion (Q\u2022\u2212)",
                "superoxide radical (O2\u2022\u2212)",
                "tert-butoxyl radical ((CH3)3CO\u2022)",
                "tert-butyl radical ((CH3)3C\u2022)",
                "trichloromethylperoxyl radical (CCl3OO\u2022)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Nitric oxide (NO)",
            "Superoxide radical (O2-)",
            "Hydroxyl radical (OH-)",
            "Peroxide radical (O2-)",
            "Peroxynitrite (ONOO-)",
            "Nitrite (NO2-)",
            "Nitrate (NO3-)",
            "Glutathione radical (GS-)",
            "Ascorbate radical (AscH-)",
            "Ubiquinone radical (CoQ-)",
            "Flavin radical (Flav-)",
            "Tyrosyl radical (Tyr-)",
            "Tryptophan radical (Trp-)",
            "Cysteine radical (Cys-)",
            "Semiquinone radical (SQ-)",
            "Cardiolipin radical (CL-)",
            "Phosphatidylserine radical (PS-)",
            "Phosphatidylethanolamine radical (PE-)",
            "Phosphatidylcholine radical (PC-)",
            "Phosphatidylinositol radical (PI-)",
            "Deoxyribose radical (dR-)",
            "Ribose radical (R-)",
            "Guanine radical (G-)",
            "Adenine radical (A-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitric oxide (NO)",
                "Superoxide radical (O2-)",
                "Hydroxyl radical (OH-)",
                "Peroxide radical (O2-)",
                "Peroxynitrite (ONOO-)",
                "Nitrite (NO2-)",
                "Nitrate (NO3-)",
                "Glutathione radical (GS-)",
                "Ascorbate radical (AscH-)",
                "Ubiquinone radical (CoQ-)",
                "Flavin radical (Flav-)",
                "Tyrosyl radical (Tyr-)",
                "Tryptophan radical (Trp-)",
                "Cysteine radical (Cys-)",
                "Semiquinone radical (SQ-)",
                "Cardiolipin radical (CL-)",
                "Phosphatidylserine radical (PS-)",
                "Phosphatidylethanolamine radical (PE-)",
                "Phosphatidylcholine radical (PC-)",
                "Phosphatidylinositol radical (PI-)",
                "Deoxyribose radical (dR-)",
                "Ribose radical (R-)",
                "Guanine radical (G-)",
                "Adenine radical (A-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adenine radical (A-)",
                "Ascorbate radical (AscH-)",
                "Cardiolipin radical (CL-)",
                "Cysteine radical (Cys-)",
                "Deoxyribose radical (dR-)",
                "Flavin radical (Flav-)",
                "Glutathione radical (GS-)",
                "Guanine radical (G-)",
                "Hydroxyl radical (OH-)",
                "Nitrate (NO3-)",
                "Nitric oxide (NO)",
                "Nitrite (NO2-)",
                "Peroxide radical (O2-)",
                "Peroxynitrite (ONOO-)",
                "Phosphatidylcholine radical (PC-)",
                "Phosphatidylethanolamine radical (PE-)",
                "Phosphatidylinositol radical (PI-)",
                "Phosphatidylserine radical (PS-)",
                "Ribose radical (R-)",
                "Semiquinone radical (SQ-)",
                "Superoxide radical (O2-)",
                "Tryptophan radical (Trp-)",
                "Tyrosyl radical (Tyr-)",
                "Ubiquinone radical (CoQ-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Radical anion (RA)",
            "Superoxide anion (O2-)",
            "Nitrite anion (NO2-)",
            "Nitrate anion (NO3-)",
            "Hydroxide anion (OH-)",
            "Fluoride anion (F-)",
            "Chloride anion (Cl-)",
            "Bromide anion (Br-)",
            "Iodide anion (I-)",
            "Peroxide anion (O2-2)",
            "Thiol anion (R-S-)",
            "Sulfide anion (S2-)",
            "Phenolate anion (C6H5O-)",
            "Benzene anion (C6H5-)",
            "Naphthalene anion (C10H7-)",
            "Porphyrin anion (C20H12N4-)",
            "Heme anion (C34H32FeN4O4-)",
            "Cytochrome anion (C55H64FeN4O4-)",
            "Flavin anion (C17H13N4O-)",
            "NADH anion (C21H29N7O14P-)",
            "NADPH anion (C21H31N7O17P-)",
            "FAD anion (C27H33N4O12-)",
            "Coenzyme anion (C27H33N4O12-)",
            "Lipoic anion (C8H12O2S2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Radical anion (RA)",
                "Superoxide anion (O2-)",
                "Nitrite anion (NO2-)",
                "Nitrate anion (NO3-)",
                "Hydroxide anion (OH-)",
                "Fluoride anion (F-)",
                "Chloride anion (Cl-)",
                "Bromide anion (Br-)",
                "Iodide anion (I-)",
                "Peroxide anion (O2-2)",
                "Thiol anion (R-S-)",
                "Sulfide anion (S2-)",
                "Phenolate anion (C6H5O-)",
                "Benzene anion (C6H5-)",
                "Naphthalene anion (C10H7-)",
                "Porphyrin anion (C20H12N4-)",
                "Heme anion (C34H32FeN4O4-)",
                "Cytochrome anion (C55H64FeN4O4-)",
                "Flavin anion (C17H13N4O-)",
                "NADH anion (C21H29N7O14P-)",
                "NADPH anion (C21H31N7O17P-)",
                "FAD anion (C27H33N4O12-)",
                "Coenzyme anion (C27H33N4O12-)",
                "Lipoic anion (C8H12O2S2-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Benzene anion (C6H5-)",
                "Bromide anion (Br-)",
                "Chloride anion (Cl-)",
                "Coenzyme anion (C27H33N4O12-)",
                "Cytochrome anion (C55H64FeN4O4-)",
                "FAD anion (C27H33N4O12-)",
                "Flavin anion (C17H13N4O-)",
                "Fluoride anion (F-)",
                "Heme anion (C34H32FeN4O4-)",
                "Hydroxide anion (OH-)",
                "Iodide anion (I-)",
                "Lipoic anion (C8H12O2S2-)",
                "NADH anion (C21H29N7O14P-)",
                "NADPH anion (C21H31N7O17P-)",
                "Naphthalene anion (C10H7-)",
                "Nitrate anion (NO3-)",
                "Nitrite anion (NO2-)",
                "Peroxide anion (O2-2)",
                "Phenolate anion (C6H5O-)",
                "Porphyrin anion (C20H12N4-)",
                "Radical anion (RA)",
                "Sulfide anion (S2-)",
                "Superoxide anion (O2-)",
                "Thiol anion (R-S-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2-)",
            "Nitric oxide (NO)",
            "Hydroxyl radical (OH)",
            "Oxidized flavin adenine dinucleotide (FAD+)",
            "Dehydroascorbic acid radical",
            "Semiquinone radical",
            "Phenoxyl radical",
            "Alkoxyl radical",
            "Peroxy radical",
            "Carbon-centered radical",
            "Nitrogen-centered radical",
            "Oxygen-centered radical",
            "Sulfur-centered radical",
            "Chlorophyll radical",
            "Pheophytin radical",
            "Plastoquinone radical",
            "Ubisemiquinone radical",
            "Coenzyme Q radical",
            "Flavin mononucleotide radical (FMN)",
            "Monohydroxybenzoquinone radical",
            "Dihydroxybenzoquinone radical",
            "Tocopherol radical",
            "Vitamin E radical",
            "Ascorbyl radical",
            "Menadione radical"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2-)",
                "Nitric oxide (NO)",
                "Hydroxyl radical (OH)",
                "Oxidized flavin adenine dinucleotide (FAD+)",
                "Dehydroascorbic acid radical",
                "Semiquinone radical",
                "Phenoxyl radical",
                "Alkoxyl radical",
                "Peroxy radical",
                "Carbon-centered radical",
                "Nitrogen-centered radical",
                "Oxygen-centered radical",
                "Sulfur-centered radical",
                "Chlorophyll radical",
                "Pheophytin radical",
                "Plastoquinone radical",
                "Ubisemiquinone radical",
                "Coenzyme Q radical",
                "Flavin mononucleotide radical (FMN)",
                "Monohydroxybenzoquinone radical",
                "Dihydroxybenzoquinone radical",
                "Tocopherol radical",
                "Vitamin E radical",
                "Ascorbyl radical"
            ],
            "mismatches": [
                "Menadione radical"
            ],
            "true_referents": [
                "Alkoxyl radical",
                "Ascorbyl radical",
                "Carbon-centered radical",
                "Chlorophyll radical",
                "Coenzyme Q radical",
                "Dehydroascorbic acid radical",
                "Dihydroxybenzoquinone radical",
                "Flavin mononucleotide radical (FMN)",
                "Hydroxyl radical (OH)",
                "Monohydroxybenzoquinone radical",
                "Nitric oxide (NO)",
                "Nitrogen-centered radical",
                "Oxidized flavin adenine dinucleotide (FAD+)",
                "Oxygen-centered radical",
                "Peroxy radical",
                "Phenoxyl radical",
                "Pheophytin radical",
                "Plastoquinone radical",
                "Semiquinone radical",
                "Sulfur-centered radical",
                "Superoxide (O2-)",
                "Tocopherol radical",
                "Ubisemiquinone radical",
                "Vitamin E radical"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]