[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Nitroxyl anion (HNO\u207b)",
            "Superoxide anion (O\u2082\u207b)",
            "Hydroperoxyl radical anion (HO\u2082\u207b)",
            "Alkoxyl radical anion (RO\u207b)",
            "Nitronyl nitroxide anion (NO\u207bNO\u207b)",
            "Tetrahydrobiopterin radical anion (BH\u2084\u207b\u2022)",
            "Flavin adenine dinucleotide anion radical (FADH\u207b\u2022)",
            "Flavin mononucleotide anion radical (FMNH\u207b\u2022)",
            "Phenoxyl radical anion (PhO\u207b\u2022)",
            "Nitroxide radical anion (RONO\u207b\u2022)",
            "Alkyl radical anion (R\u207b\u2022)",
            "Triphenylmethyl radical anion (Ph\u2083C\u207b\u2022)",
            "Nitric oxide anion (NO\u207b)",
            "Nitrite anion radical (NO\u2082\u207b\u2022)",
            "Nitroxide radical (RONO\u207b)",
            "Sulfenate anion radical (RSO\u2082\u207b\u2022)",
            "Thiolate radical anion (RS\u207b\u2022)",
            "Hydroxyl radical anion (HO\u207b\u2022)",
            "Alkoxy radical anion (RO\u207b\u2022)",
            "Nitrosothiol anion radical (RSNO\u207b\u2022)",
            "Sulfinamide anion radical (RSO\u2082NH\u207b\u2022)",
            "Nitrosyl anion radical (NO\u207a\u207b\u2022)",
            "Nitroxide anion radical (RONO\u207b\u2022)",
            "Nitroso anion radical (NO\u207a\u207b\u2022)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitroxyl anion (HNO\u207b)",
                "Superoxide anion (O\u2082\u207b)",
                "Hydroperoxyl radical anion (HO\u2082\u207b)",
                "Alkoxyl radical anion (RO\u207b)",
                "Nitronyl nitroxide anion (NO\u207bNO\u207b)",
                "Tetrahydrobiopterin radical anion (BH\u2084\u207b\u2022)",
                "Flavin adenine dinucleotide anion radical (FADH\u207b\u2022)",
                "Flavin mononucleotide anion radical (FMNH\u207b\u2022)",
                "Phenoxyl radical anion (PhO\u207b\u2022)",
                "Nitroxide radical anion (RONO\u207b\u2022)",
                "Alkyl radical anion (R\u207b\u2022)",
                "Triphenylmethyl radical anion (Ph\u2083C\u207b\u2022)",
                "Nitric oxide anion (NO\u207b)",
                "Nitrite anion radical (NO\u2082\u207b\u2022)",
                "Nitroxide radical (RONO\u207b)",
                "Sulfenate anion radical (RSO\u2082\u207b\u2022)",
                "Thiolate radical anion (RS\u207b\u2022)",
                "Hydroxyl radical anion (HO\u207b\u2022)",
                "Alkoxy radical anion (RO\u207b\u2022)",
                "Nitrosothiol anion radical (RSNO\u207b\u2022)",
                "Sulfinamide anion radical (RSO\u2082NH\u207b\u2022)",
                "Nitrosyl anion radical (NO\u207a\u207b\u2022)",
                "Nitroso anion radical (NO\u207a\u207b\u2022)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxy radical anion (RO\u207b\u2022)",
                "Alkoxyl radical anion (RO\u207b)",
                "Alkyl radical anion (R\u207b\u2022)",
                "Flavin adenine dinucleotide anion radical (FADH\u207b\u2022)",
                "Flavin mononucleotide anion radical (FMNH\u207b\u2022)",
                "Hydroperoxyl radical anion (HO\u2082\u207b)",
                "Hydroxyl radical anion (HO\u207b\u2022)",
                "Nitric oxide anion (NO\u207b)",
                "Nitrite anion radical (NO\u2082\u207b\u2022)",
                "Nitronyl nitroxide anion (NO\u207bNO\u207b)",
                "Nitroso anion radical (NO\u207a\u207b\u2022)",
                "Nitrosothiol anion radical (RSNO\u207b\u2022)",
                "Nitrosyl anion radical (NO\u207a\u207b\u2022)",
                "Nitroxide anion radical (RONO\u207b\u2022)",
                "Nitroxide radical (RONO\u207b)",
                "Nitroxide radical anion (RONO\u207b\u2022)",
                "Nitroxyl anion (HNO\u207b)",
                "Phenoxyl radical anion (PhO\u207b\u2022)",
                "Sulfenate anion radical (RSO\u2082\u207b\u2022)",
                "Sulfinamide anion radical (RSO\u2082NH\u207b\u2022)",
                "Superoxide anion (O\u2082\u207b)",
                "Tetrahydrobiopterin radical anion (BH\u2084\u207b\u2022)",
                "Thiolate radical anion (RS\u207b\u2022)",
                "Triphenylmethyl radical anion (Ph\u2083C\u207b\u2022)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide radical anion (O2\u2022\u2212)",
            "Hydroxyl radical anion (HO\u2022\u2212)",
            "Nitrate radical anion (NO3\u2022\u2212)",
            "Peroxide radical anion (O2^2\u2212)",
            "Dithionite radical anion (S2O4^2\u2212)",
            "Ferrocenyl radical anion (Fc\u2022\u2212)",
            "Nitroxyl radical anion (HNO\u2022\u2212)",
            "Azide radical anion (N3\u2022\u2212)",
            "Phenyl radical anion (C6H5\u2022\u2212)",
            "Tetrahydrofuran radical anion (THF\u2022\u2212)",
            "Tetrathiafulvalene radical anion (TTF\u2022\u2212)",
            "Tetracyanoethylene radical anion (TCNE\u2022\u2212)",
            "Porphyrin radical anion (Por\u2022\u2212)",
            "Fluoride radical anion (F\u2022\u2212)",
            "Thiolate radical anion (RS\u2022\u2212)",
            "Catecholate radical anion (C6H4O2\u2022\u2212)",
            "Chloride radical anion (Cl\u2022\u2212)",
            "Benzyl radical anion (C6H5CH2\u2022\u2212)",
            "Cyanide radical anion (CN\u2022\u2212)",
            "Acetate radical anion (CH3COO\u2022\u2212)",
            "Sulfite radical anion (SO3^2\u2212)",
            "Sulfide radical anion (S^2\u2212)",
            "Carboxylate radical anion (RCOO\u2022\u2212)",
            "Methoxide radical anion (CH3O\u2022\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide radical anion (O2\u2022\u2212)",
                "Hydroxyl radical anion (HO\u2022\u2212)",
                "Nitrate radical anion (NO3\u2022\u2212)",
                "Peroxide radical anion (O2^2\u2212)",
                "Dithionite radical anion (S2O4^2\u2212)",
                "Ferrocenyl radical anion (Fc\u2022\u2212)",
                "Nitroxyl radical anion (HNO\u2022\u2212)",
                "Azide radical anion (N3\u2022\u2212)",
                "Phenyl radical anion (C6H5\u2022\u2212)",
                "Tetrahydrofuran radical anion (THF\u2022\u2212)",
                "Tetrathiafulvalene radical anion (TTF\u2022\u2212)",
                "Tetracyanoethylene radical anion (TCNE\u2022\u2212)",
                "Porphyrin radical anion (Por\u2022\u2212)",
                "Fluoride radical anion (F\u2022\u2212)",
                "Thiolate radical anion (RS\u2022\u2212)",
                "Catecholate radical anion (C6H4O2\u2022\u2212)",
                "Chloride radical anion (Cl\u2022\u2212)",
                "Benzyl radical anion (C6H5CH2\u2022\u2212)",
                "Cyanide radical anion (CN\u2022\u2212)",
                "Acetate radical anion (CH3COO\u2022\u2212)",
                "Sulfite radical anion (SO3^2\u2212)",
                "Sulfide radical anion (S^2\u2212)",
                "Carboxylate radical anion (RCOO\u2022\u2212)",
                "Methoxide radical anion (CH3O\u2022\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate radical anion (CH3COO\u2022\u2212)",
                "Azide radical anion (N3\u2022\u2212)",
                "Benzyl radical anion (C6H5CH2\u2022\u2212)",
                "Carboxylate radical anion (RCOO\u2022\u2212)",
                "Catecholate radical anion (C6H4O2\u2022\u2212)",
                "Chloride radical anion (Cl\u2022\u2212)",
                "Cyanide radical anion (CN\u2022\u2212)",
                "Dithionite radical anion (S2O4^2\u2212)",
                "Ferrocenyl radical anion (Fc\u2022\u2212)",
                "Fluoride radical anion (F\u2022\u2212)",
                "Hydroxyl radical anion (HO\u2022\u2212)",
                "Methoxide radical anion (CH3O\u2022\u2212)",
                "Nitrate radical anion (NO3\u2022\u2212)",
                "Nitroxyl radical anion (HNO\u2022\u2212)",
                "Peroxide radical anion (O2^2\u2212)",
                "Phenyl radical anion (C6H5\u2022\u2212)",
                "Porphyrin radical anion (Por\u2022\u2212)",
                "Sulfide radical anion (S^2\u2212)",
                "Sulfite radical anion (SO3^2\u2212)",
                "Superoxide radical anion (O2\u2022\u2212)",
                "Tetracyanoethylene radical anion (TCNE\u2022\u2212)",
                "Tetrahydrofuran radical anion (THF\u2022\u2212)",
                "Tetrathiafulvalene radical anion (TTF\u2022\u2212)",
                "Thiolate radical anion (RS\u2022\u2212)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Benzene radical anion (C6H6\u2022\u2212)",
            "Naphthalene radical anion (C10H7\u2022\u2212)",
            "Anthracene radical anion (C14H9\u2022\u2212)",
            "Phenyl radical anion (C6H5\u2022\u2212)",
            "Fluoranthene radical anion (C16H9\u2022\u2212)",
            "Pyrene radical anion (C16H9\u2022\u2212)",
            "Perylene radical anion (C20H11\u2022\u2212)",
            "Nitrobenzene radical anion (C6H4NO2\u2022\u2212)",
            "Chlorobenzene radical anion (C6H4Cl\u2022\u2212)",
            "Bromobenzene radical anion (C6H4Br\u2022\u2212)",
            "Toluene radical anion (C7H7\u2022\u2212)",
            "Xylene radical anion (C8H9\u2022\u2212)",
            "Fluorobenzene radical anion (C6H4F\u2022\u2212)",
            "Iodobenzene radical anion (C6H4I\u2022\u2212)",
            "Aniline radical anion (C6H6N\u2022\u2212)",
            "Phenol radical anion (C6H5O\u2022\u2212)",
            "Benzoic acid radical anion (C7H5O2\u2022\u2212)",
            "Benzaldehyde radical anion (C7H5O\u2022\u2212)",
            "Acetophenone radical anion (C8H7O\u2022\u2212)",
            "Phenylacetylene radical anion (C8H5\u2022\u2212)",
            "Styrene radical anion (C8H7\u2022\u2212)",
            "Anisole radical anion (C7H7O\u2022\u2212)",
            "Nitroaniline radical anion (C6H6N2O2\u2022\u2212)",
            "Nitrotoluene radical anion (C7H6NO2\u2022\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzene radical anion (C6H6\u2022\u2212)",
                "Naphthalene radical anion (C10H7\u2022\u2212)",
                "Anthracene radical anion (C14H9\u2022\u2212)",
                "Phenyl radical anion (C6H5\u2022\u2212)",
                "Fluoranthene radical anion (C16H9\u2022\u2212)",
                "Pyrene radical anion (C16H9\u2022\u2212)",
                "Perylene radical anion (C20H11\u2022\u2212)",
                "Nitrobenzene radical anion (C6H4NO2\u2022\u2212)",
                "Chlorobenzene radical anion (C6H4Cl\u2022\u2212)",
                "Bromobenzene radical anion (C6H4Br\u2022\u2212)",
                "Toluene radical anion (C7H7\u2022\u2212)",
                "Xylene radical anion (C8H9\u2022\u2212)",
                "Fluorobenzene radical anion (C6H4F\u2022\u2212)",
                "Iodobenzene radical anion (C6H4I\u2022\u2212)",
                "Aniline radical anion (C6H6N\u2022\u2212)",
                "Phenol radical anion (C6H5O\u2022\u2212)",
                "Benzoic acid radical anion (C7H5O2\u2022\u2212)",
                "Benzaldehyde radical anion (C7H5O\u2022\u2212)",
                "Acetophenone radical anion (C8H7O\u2022\u2212)",
                "Phenylacetylene radical anion (C8H5\u2022\u2212)",
                "Styrene radical anion (C8H7\u2022\u2212)",
                "Anisole radical anion (C7H7O\u2022\u2212)",
                "Nitroaniline radical anion (C6H6N2O2\u2022\u2212)",
                "Nitrotoluene radical anion (C7H6NO2\u2022\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetophenone radical anion (C8H7O\u2022\u2212)",
                "Aniline radical anion (C6H6N\u2022\u2212)",
                "Anisole radical anion (C7H7O\u2022\u2212)",
                "Anthracene radical anion (C14H9\u2022\u2212)",
                "Benzaldehyde radical anion (C7H5O\u2022\u2212)",
                "Benzene radical anion (C6H6\u2022\u2212)",
                "Benzoic acid radical anion (C7H5O2\u2022\u2212)",
                "Bromobenzene radical anion (C6H4Br\u2022\u2212)",
                "Chlorobenzene radical anion (C6H4Cl\u2022\u2212)",
                "Fluoranthene radical anion (C16H9\u2022\u2212)",
                "Fluorobenzene radical anion (C6H4F\u2022\u2212)",
                "Iodobenzene radical anion (C6H4I\u2022\u2212)",
                "Naphthalene radical anion (C10H7\u2022\u2212)",
                "Nitroaniline radical anion (C6H6N2O2\u2022\u2212)",
                "Nitrobenzene radical anion (C6H4NO2\u2022\u2212)",
                "Nitrotoluene radical anion (C7H6NO2\u2022\u2212)",
                "Perylene radical anion (C20H11\u2022\u2212)",
                "Phenol radical anion (C6H5O\u2022\u2212)",
                "Phenyl radical anion (C6H5\u2022\u2212)",
                "Phenylacetylene radical anion (C8H5\u2022\u2212)",
                "Pyrene radical anion (C16H9\u2022\u2212)",
                "Styrene radical anion (C8H7\u2022\u2212)",
                "Toluene radical anion (C7H7\u2022\u2212)",
                "Xylene radical anion (C8H9\u2022\u2212)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Naphthoquinone Semiquinone Radical Anion (NQSQ\u207b)",
            "Anthraquinone-2-yl Radical Anion (AQ\u207b)",
            "Benzophenone Ketyl Radical Anion (BPK\u207b)",
            "Dibenzoyl Peroxide Radical Anion (DBPO\u207b)",
            "Flavins (Reduced Forms) (FADH\u207b/FMNH\u207b)",
            "Quinones (Semiquinone Forms) (Q\u207b)",
            "Tetramethyl-p-phenylenediamine Radical Anion (TMPD\u207b)",
            "1,1-Diphenyl-2-picrylhydrazyl Radical Anion (DPPH\u207b)",
            "Superoxide Radical Anion (O\u2082\u207b)",
            "Phenyl Radical Anion (Ph\u207b)",
            "Pyridinium Radical Anion (Py\u207b)",
            "Thiophenol Radical Anion (PhS\u207b)",
            "Catechol Radical Anion (Cat\u207b)",
            "Hydroquinone Radical Anion (HQ\u207b)",
            "Benzoquinone Radical Anion (BQ\u207b)",
            "Phenoxy Radical Anion (PhO\u207b)",
            "Indole-3-acetic acid Radical Anion (IAA\u207b)",
            "Luton Radical Anion (L\u207b)",
            "Melanin Radical Anion (Mel\u207b)",
            "Fullerene Radical Anion (C\u2086\u2080\u207b)",
            "Anthracene Radical Anion (Anth\u207b)",
            "Phenanthrene Radical Anion (Phen\u207b)",
            "Pyrene Radical Anion (Pyr\u207b)",
            "Triphenylmethyl Radical Anion (Tr\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Naphthoquinone Semiquinone Radical Anion (NQSQ\u207b)",
                "Anthraquinone-2-yl Radical Anion (AQ\u207b)",
                "Benzophenone Ketyl Radical Anion (BPK\u207b)",
                "Dibenzoyl Peroxide Radical Anion (DBPO\u207b)",
                "Flavins (Reduced Forms) (FADH\u207b/FMNH\u207b)",
                "Quinones (Semiquinone Forms) (Q\u207b)",
                "Tetramethyl-p-phenylenediamine Radical Anion (TMPD\u207b)",
                "1,1-Diphenyl-2-picrylhydrazyl Radical Anion (DPPH\u207b)",
                "Superoxide Radical Anion (O\u2082\u207b)",
                "Phenyl Radical Anion (Ph\u207b)",
                "Pyridinium Radical Anion (Py\u207b)",
                "Thiophenol Radical Anion (PhS\u207b)",
                "Catechol Radical Anion (Cat\u207b)",
                "Hydroquinone Radical Anion (HQ\u207b)",
                "Benzoquinone Radical Anion (BQ\u207b)",
                "Phenoxy Radical Anion (PhO\u207b)",
                "Indole-3-acetic acid Radical Anion (IAA\u207b)",
                "Luton Radical Anion (L\u207b)",
                "Melanin Radical Anion (Mel\u207b)",
                "Fullerene Radical Anion (C\u2086\u2080\u207b)",
                "Anthracene Radical Anion (Anth\u207b)",
                "Phenanthrene Radical Anion (Phen\u207b)",
                "Pyrene Radical Anion (Pyr\u207b)",
                "Triphenylmethyl Radical Anion (Tr\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1-Diphenyl-2-picrylhydrazyl Radical Anion (DPPH\u207b)",
                "Anthracene Radical Anion (Anth\u207b)",
                "Anthraquinone-2-yl Radical Anion (AQ\u207b)",
                "Benzophenone Ketyl Radical Anion (BPK\u207b)",
                "Benzoquinone Radical Anion (BQ\u207b)",
                "Catechol Radical Anion (Cat\u207b)",
                "Dibenzoyl Peroxide Radical Anion (DBPO\u207b)",
                "Flavins (Reduced Forms) (FADH\u207b/FMNH\u207b)",
                "Fullerene Radical Anion (C\u2086\u2080\u207b)",
                "Hydroquinone Radical Anion (HQ\u207b)",
                "Indole-3-acetic acid Radical Anion (IAA\u207b)",
                "Luton Radical Anion (L\u207b)",
                "Melanin Radical Anion (Mel\u207b)",
                "Naphthoquinone Semiquinone Radical Anion (NQSQ\u207b)",
                "Phenanthrene Radical Anion (Phen\u207b)",
                "Phenoxy Radical Anion (PhO\u207b)",
                "Phenyl Radical Anion (Ph\u207b)",
                "Pyrene Radical Anion (Pyr\u207b)",
                "Pyridinium Radical Anion (Py\u207b)",
                "Quinones (Semiquinone Forms) (Q\u207b)",
                "Superoxide Radical Anion (O\u2082\u207b)",
                "Tetramethyl-p-phenylenediamine Radical Anion (TMPD\u207b)",
                "Thiophenol Radical Anion (PhS\u207b)",
                "Triphenylmethyl Radical Anion (Tr\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2*-)",
            "Nitrogen dioxide anion (NO2*-)",
            "Hydroxyl radical anion (HO*-)",
            "Trichloromethyl anion (CCl3*-)",
            "Peroxyl radical anion (ROO*-)",
            "Phenoxyl radical anion (C6H5O*-)",
            "Nitrosyl anion (NO*-)",
            "Anthraquinone radical anion (AQ*-)",
            "Biphenyl radical anion (C12H9*-)",
            "Benzophenone radical anion (C13H10O*-)",
            "Tetracyanoethylene radical anion (TCNE*-)",
            "Fluorenone radical anion (C13H9O*-)",
            "Azobenzene radical anion (C12H10N2*-)",
            "Tetramethylammonium radical anion (TMA*-)",
            "Chloranil radical anion (C6Cl4O2*-)",
            "Naphthalene radical anion (C10H8*-)",
            "Viologen radical anion (C12H12N2*-)",
            "Dicyanomethylene radical anion (DCM*-)",
            "Tropylium radical anion (C7H7*-)",
            "Fullerene radical anion (C60*-)",
            "Carbazole radical anion (C12H9N*-)",
            "Quinone radical anion (Q*-)",
            "Nitrobenzene radical anion (C6H5NO2*-)",
            "Tetrathiafulvalene radical anion (TTF*-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2*-)",
                "Nitrogen dioxide anion (NO2*-)",
                "Hydroxyl radical anion (HO*-)",
                "Trichloromethyl anion (CCl3*-)",
                "Peroxyl radical anion (ROO*-)",
                "Phenoxyl radical anion (C6H5O*-)",
                "Nitrosyl anion (NO*-)",
                "Anthraquinone radical anion (AQ*-)",
                "Biphenyl radical anion (C12H9*-)",
                "Benzophenone radical anion (C13H10O*-)",
                "Tetracyanoethylene radical anion (TCNE*-)",
                "Fluorenone radical anion (C13H9O*-)",
                "Azobenzene radical anion (C12H10N2*-)",
                "Tetramethylammonium radical anion (TMA*-)",
                "Chloranil radical anion (C6Cl4O2*-)",
                "Naphthalene radical anion (C10H8*-)",
                "Viologen radical anion (C12H12N2*-)",
                "Dicyanomethylene radical anion (DCM*-)",
                "Tropylium radical anion (C7H7*-)",
                "Fullerene radical anion (C60*-)",
                "Carbazole radical anion (C12H9N*-)",
                "Quinone radical anion (Q*-)",
                "Nitrobenzene radical anion (C6H5NO2*-)",
                "Tetrathiafulvalene radical anion (TTF*-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Anthraquinone radical anion (AQ*-)",
                "Azobenzene radical anion (C12H10N2*-)",
                "Benzophenone radical anion (C13H10O*-)",
                "Biphenyl radical anion (C12H9*-)",
                "Carbazole radical anion (C12H9N*-)",
                "Chloranil radical anion (C6Cl4O2*-)",
                "Dicyanomethylene radical anion (DCM*-)",
                "Fluorenone radical anion (C13H9O*-)",
                "Fullerene radical anion (C60*-)",
                "Hydroxyl radical anion (HO*-)",
                "Naphthalene radical anion (C10H8*-)",
                "Nitrobenzene radical anion (C6H5NO2*-)",
                "Nitrogen dioxide anion (NO2*-)",
                "Nitrosyl anion (NO*-)",
                "Peroxyl radical anion (ROO*-)",
                "Phenoxyl radical anion (C6H5O*-)",
                "Quinone radical anion (Q*-)",
                "Superoxide (O2*-)",
                "Tetracyanoethylene radical anion (TCNE*-)",
                "Tetramethylammonium radical anion (TMA*-)",
                "Tetrathiafulvalene radical anion (TTF*-)",
                "Trichloromethyl anion (CCl3*-)",
                "Tropylium radical anion (C7H7*-)",
                "Viologen radical anion (C12H12N2*-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2022-)",
            "Nitrate radical (NO3\u2022-)",
            "Nitric oxide anion (NO\u2022-)",
            "Adenosine triphosphate radical anion (ATP\u2022-)",
            "Dopamine radical anion (C8H11NO\u2022-)",
            "Lipid peroxyl radical anion (ROO\u2022-)",
            "Phenoxyl radical anion (C6H5O\u2022-)",
            "Hydroxyl radical anion (HO\u2022-)",
            "Benzyl radical anion (C7H7\u2022-)",
            "Chlorophyll radical anion (C55H72N4Mg\u2022-)",
            "Carboxylate radical anion (RCOO\u2022-)",
            "Tryptophan radical anion (C11H10N2O\u2022-)",
            "Thymine radical anion (C5H6N2O2\u2022-)",
            "Amino acid radical anion (RNH2\u2022-)",
            "Flavin radical anion (C17H17N4O9\u2022-)",
            "Ubiquinone radical anion (C59H88O4\u2022-)",
            "Ascorbate radical anion (C6H7O6\u2022-)",
            "Cysteine radical anion (C3H7NO2S\u2022-)",
            "Glutathione radical anion (C10H17N3O6S\u2022-)",
            "Acetyl radical anion (C2H3O\u2022-)",
            "Cyclic peroxyl radical anion (C4H6O2\u2022-)",
            "Sulfate radical anion (SO4\u2022-)",
            "Carbon dioxide radical anion (CO2\u2022-)",
            "Vinyl radical anion (C2H3\u2022-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2022-)",
                "Nitrate radical (NO3\u2022-)",
                "Nitric oxide anion (NO\u2022-)",
                "Adenosine triphosphate radical anion (ATP\u2022-)",
                "Dopamine radical anion (C8H11NO\u2022-)",
                "Lipid peroxyl radical anion (ROO\u2022-)",
                "Phenoxyl radical anion (C6H5O\u2022-)",
                "Hydroxyl radical anion (HO\u2022-)",
                "Benzyl radical anion (C7H7\u2022-)",
                "Chlorophyll radical anion (C55H72N4Mg\u2022-)",
                "Carboxylate radical anion (RCOO\u2022-)",
                "Tryptophan radical anion (C11H10N2O\u2022-)",
                "Thymine radical anion (C5H6N2O2\u2022-)",
                "Amino acid radical anion (RNH2\u2022-)",
                "Flavin radical anion (C17H17N4O9\u2022-)",
                "Ubiquinone radical anion (C59H88O4\u2022-)",
                "Ascorbate radical anion (C6H7O6\u2022-)",
                "Cysteine radical anion (C3H7NO2S\u2022-)",
                "Glutathione radical anion (C10H17N3O6S\u2022-)",
                "Acetyl radical anion (C2H3O\u2022-)",
                "Cyclic peroxyl radical anion (C4H6O2\u2022-)",
                "Sulfate radical anion (SO4\u2022-)",
                "Carbon dioxide radical anion (CO2\u2022-)",
                "Vinyl radical anion (C2H3\u2022-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl radical anion (C2H3O\u2022-)",
                "Adenosine triphosphate radical anion (ATP\u2022-)",
                "Amino acid radical anion (RNH2\u2022-)",
                "Ascorbate radical anion (C6H7O6\u2022-)",
                "Benzyl radical anion (C7H7\u2022-)",
                "Carbon dioxide radical anion (CO2\u2022-)",
                "Carboxylate radical anion (RCOO\u2022-)",
                "Chlorophyll radical anion (C55H72N4Mg\u2022-)",
                "Cyclic peroxyl radical anion (C4H6O2\u2022-)",
                "Cysteine radical anion (C3H7NO2S\u2022-)",
                "Dopamine radical anion (C8H11NO\u2022-)",
                "Flavin radical anion (C17H17N4O9\u2022-)",
                "Glutathione radical anion (C10H17N3O6S\u2022-)",
                "Hydroxyl radical anion (HO\u2022-)",
                "Lipid peroxyl radical anion (ROO\u2022-)",
                "Nitrate radical (NO3\u2022-)",
                "Nitric oxide anion (NO\u2022-)",
                "Phenoxyl radical anion (C6H5O\u2022-)",
                "Sulfate radical anion (SO4\u2022-)",
                "Superoxide (O2\u2022-)",
                "Thymine radical anion (C5H6N2O2\u2022-)",
                "Tryptophan radical anion (C11H10N2O\u2022-)",
                "Ubiquinone radical anion (C59H88O4\u2022-)",
                "Vinyl radical anion (C2H3\u2022-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide Radical Anion (O2-)",
            "Hydroxyl Radical Anion (OH-)",
            "Nitric Oxide Radical Anion (NO-)",
            "Peroxynitrite Radical Anion (ONOO-)",
            "Chlorine Radical Anion (Cl-)",
            "Bromine Radical Anion (Br-)",
            "Iodine Radical Anion (I-)",
            "Sulfur Dioxide Radical Anion (SO2-)",
            "Nitrogen Dioxide Radical Anion (NO2-)",
            "Carbon Dioxide Radical Anion (CO2-)",
            "Methane Radical Anion (CH4-)",
            "Ethane Radical Anion (C2H6-)",
            "Propane Radical Anion (C3H8-)",
            "Butane Radical Anion (C4H10-)",
            "Pentane Radical Anion (C5H12-)",
            "Hexane Radical Anion (C6H14-)",
            "Heptane Radical Anion (C7H16-)",
            "Octane Radical Anion (C8H18-)",
            "Nonane Radical Anion (C9H20-)",
            "Decane Radical Anion (C10H22-)",
            "Benzene Radical Anion (C6H6-)",
            "Toluene Radical Anion (C7H8-)",
            "Naphthalene Radical Anion (C10H8-)",
            "Anthracene Radical Anion (C14H10-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide Radical Anion (O2-)",
                "Hydroxyl Radical Anion (OH-)",
                "Nitric Oxide Radical Anion (NO-)",
                "Peroxynitrite Radical Anion (ONOO-)",
                "Chlorine Radical Anion (Cl-)",
                "Bromine Radical Anion (Br-)",
                "Iodine Radical Anion (I-)",
                "Sulfur Dioxide Radical Anion (SO2-)",
                "Nitrogen Dioxide Radical Anion (NO2-)",
                "Carbon Dioxide Radical Anion (CO2-)",
                "Methane Radical Anion (CH4-)",
                "Ethane Radical Anion (C2H6-)",
                "Propane Radical Anion (C3H8-)",
                "Butane Radical Anion (C4H10-)",
                "Pentane Radical Anion (C5H12-)",
                "Hexane Radical Anion (C6H14-)",
                "Heptane Radical Anion (C7H16-)",
                "Octane Radical Anion (C8H18-)",
                "Nonane Radical Anion (C9H20-)",
                "Decane Radical Anion (C10H22-)",
                "Benzene Radical Anion (C6H6-)",
                "Toluene Radical Anion (C7H8-)",
                "Naphthalene Radical Anion (C10H8-)",
                "Anthracene Radical Anion (C14H10-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Anthracene Radical Anion (C14H10-)",
                "Benzene Radical Anion (C6H6-)",
                "Bromine Radical Anion (Br-)",
                "Butane Radical Anion (C4H10-)",
                "Carbon Dioxide Radical Anion (CO2-)",
                "Chlorine Radical Anion (Cl-)",
                "Decane Radical Anion (C10H22-)",
                "Ethane Radical Anion (C2H6-)",
                "Heptane Radical Anion (C7H16-)",
                "Hexane Radical Anion (C6H14-)",
                "Hydroxyl Radical Anion (OH-)",
                "Iodine Radical Anion (I-)",
                "Methane Radical Anion (CH4-)",
                "Naphthalene Radical Anion (C10H8-)",
                "Nitric Oxide Radical Anion (NO-)",
                "Nitrogen Dioxide Radical Anion (NO2-)",
                "Nonane Radical Anion (C9H20-)",
                "Octane Radical Anion (C8H18-)",
                "Pentane Radical Anion (C5H12-)",
                "Peroxynitrite Radical Anion (ONOO-)",
                "Propane Radical Anion (C3H8-)",
                "Sulfur Dioxide Radical Anion (SO2-)",
                "Superoxide Radical Anion (O2-)",
                "Toluene Radical Anion (C7H8-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Hydroxyl radical anion (\u2022OH-)",
            "Methyl radical anion (\u2022CH3-)",
            "Phenyl radical anion (\u2022C6H5-)",
            "Benzyl radical anion (\u2022C6H5CH2-)",
            "Allyl radical anion (\u2022CH2CH=CH2-)",
            "Carbonate radical anion (\u2022CO3-)",
            "Nitrate radical anion (\u2022NO3-)",
            "Sulfate radical anion (\u2022SO4-)",
            "Acetate radical anion (\u2022CH3COO-)",
            "Formate radical anion (\u2022HCOO-)",
            "Ethyl radical anion (\u2022C2H5-)",
            "Tert-butyl radical anion (\u2022C(CH3)3-)",
            "Peroxynitrite radical anion (\u2022ONOO-)",
            "Cyanide radical anion (\u2022CN-)",
            "Acetyl radical anion (\u2022CH3CO-)",
            "Propionate radical anion (\u2022CH3CH2COO-)",
            "Hydroperoxyl radical anion (\u2022HO2-)",
            "Phosphite radical anion (\u2022PO3-)",
            "Hydrogen sulfide radical anion (\u2022HS-)",
            "Phosphinate radical anion (\u2022PO2-)",
            "Hydrosulfide radical anion (\u2022HS2-)",
            "Propargyl radical anion (\u2022C3H3-)",
            "Sulfite radical anion (\u2022SO3-)",
            "Thiophenolate radical anion (\u2022C6H5S-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl radical anion (\u2022OH-)",
                "Methyl radical anion (\u2022CH3-)",
                "Phenyl radical anion (\u2022C6H5-)",
                "Benzyl radical anion (\u2022C6H5CH2-)",
                "Allyl radical anion (\u2022CH2CH=CH2-)",
                "Carbonate radical anion (\u2022CO3-)",
                "Nitrate radical anion (\u2022NO3-)",
                "Sulfate radical anion (\u2022SO4-)",
                "Acetate radical anion (\u2022CH3COO-)",
                "Formate radical anion (\u2022HCOO-)",
                "Ethyl radical anion (\u2022C2H5-)",
                "Tert-butyl radical anion (\u2022C(CH3)3-)",
                "Peroxynitrite radical anion (\u2022ONOO-)",
                "Cyanide radical anion (\u2022CN-)",
                "Acetyl radical anion (\u2022CH3CO-)",
                "Propionate radical anion (\u2022CH3CH2COO-)",
                "Hydroperoxyl radical anion (\u2022HO2-)",
                "Phosphite radical anion (\u2022PO3-)",
                "Hydrogen sulfide radical anion (\u2022HS-)",
                "Phosphinate radical anion (\u2022PO2-)",
                "Hydrosulfide radical anion (\u2022HS2-)",
                "Propargyl radical anion (\u2022C3H3-)",
                "Sulfite radical anion (\u2022SO3-)",
                "Thiophenolate radical anion (\u2022C6H5S-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate radical anion (\u2022CH3COO-)",
                "Acetyl radical anion (\u2022CH3CO-)",
                "Allyl radical anion (\u2022CH2CH=CH2-)",
                "Benzyl radical anion (\u2022C6H5CH2-)",
                "Carbonate radical anion (\u2022CO3-)",
                "Cyanide radical anion (\u2022CN-)",
                "Ethyl radical anion (\u2022C2H5-)",
                "Formate radical anion (\u2022HCOO-)",
                "Hydrogen sulfide radical anion (\u2022HS-)",
                "Hydroperoxyl radical anion (\u2022HO2-)",
                "Hydrosulfide radical anion (\u2022HS2-)",
                "Hydroxyl radical anion (\u2022OH-)",
                "Methyl radical anion (\u2022CH3-)",
                "Nitrate radical anion (\u2022NO3-)",
                "Peroxynitrite radical anion (\u2022ONOO-)",
                "Phenyl radical anion (\u2022C6H5-)",
                "Phosphinate radical anion (\u2022PO2-)",
                "Phosphite radical anion (\u2022PO3-)",
                "Propargyl radical anion (\u2022C3H3-)",
                "Propionate radical anion (\u2022CH3CH2COO-)",
                "Sulfate radical anion (\u2022SO4-)",
                "Sulfite radical anion (\u2022SO3-)",
                "Tert-butyl radical anion (\u2022C(CH3)3-)",
                "Thiophenolate radical anion (\u2022C6H5S-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O\u2082\u207b\u2022)",
            "Hydroquinone Radical Anion",
            "Semiquinone Radical Anion",
            "Anthraquinone Radical Anion",
            "Phenoxyl Radical Anion",
            "TEMPO Radical Anion",
            "Resorcinol Radical Anion",
            "Pyridine Radical Anion",
            "Tetrathiafulvalene Radical Anion (TTF\u2022\u2013)",
            "Naphthoquinone Radical Anion",
            "Azide Radical Anion (N\u2083\u207b\u2022)",
            "Sulfonium Radical Anion",
            "Tetrazine Radical Anion",
            "Ascorbate Radical Anion (Vitamin C Radical Anion)",
            "Fullerene Radical Anion (C\u2086\u2080\u2022\u2013)",
            "Oxidized Flavin Radical Anion",
            "NADH Radical Anion",
            "Pyrroloquinoline Quinone Radical Anion",
            "Benzoquinone Radical Anion",
            "TEMPOL Radical Anion",
            "Dithionaphthoquinone Radical Anion",
            "Ruthenium Complex Radical Anion",
            "Iron-Sulfur Cluster Radical Anion",
            "DNA Radical Anion"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O\u2082\u207b\u2022)",
                "Hydroquinone Radical Anion",
                "Semiquinone Radical Anion",
                "Anthraquinone Radical Anion",
                "Phenoxyl Radical Anion",
                "TEMPO Radical Anion",
                "Resorcinol Radical Anion",
                "Pyridine Radical Anion",
                "Tetrathiafulvalene Radical Anion (TTF\u2022\u2013)",
                "Naphthoquinone Radical Anion",
                "Azide Radical Anion (N\u2083\u207b\u2022)",
                "Sulfonium Radical Anion",
                "Tetrazine Radical Anion",
                "Ascorbate Radical Anion (Vitamin C Radical Anion)",
                "Fullerene Radical Anion (C\u2086\u2080\u2022\u2013)",
                "Oxidized Flavin Radical Anion",
                "NADH Radical Anion",
                "Pyrroloquinoline Quinone Radical Anion",
                "Benzoquinone Radical Anion",
                "TEMPOL Radical Anion",
                "Dithionaphthoquinone Radical Anion",
                "Ruthenium Complex Radical Anion",
                "Iron-Sulfur Cluster Radical Anion",
                "DNA Radical Anion"
            ],
            "mismatches": [],
            "true_referents": [
                "Anthraquinone Radical Anion",
                "Ascorbate Radical Anion (Vitamin C Radical Anion)",
                "Azide Radical Anion (N\u2083\u207b\u2022)",
                "Benzoquinone Radical Anion",
                "DNA Radical Anion",
                "Dithionaphthoquinone Radical Anion",
                "Fullerene Radical Anion (C\u2086\u2080\u2022\u2013)",
                "Hydroquinone Radical Anion",
                "Iron-Sulfur Cluster Radical Anion",
                "NADH Radical Anion",
                "Naphthoquinone Radical Anion",
                "Oxidized Flavin Radical Anion",
                "Phenoxyl Radical Anion",
                "Pyridine Radical Anion",
                "Pyrroloquinoline Quinone Radical Anion",
                "Resorcinol Radical Anion",
                "Ruthenium Complex Radical Anion",
                "Semiquinone Radical Anion",
                "Sulfonium Radical Anion",
                "Superoxide (O\u2082\u207b\u2022)",
                "TEMPO Radical Anion",
                "TEMPOL Radical Anion",
                "Tetrathiafulvalene Radical Anion (TTF\u2022\u2013)",
                "Tetrazine Radical Anion"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2022\u2212)",
            "Nitric oxide (NO\u2022)",
            "Semiquinone radical",
            "Benzene radical anion",
            "Naphthalene radical anion",
            "Anthracene radical anion",
            "Fullerene radical anion (C60\u2022\u2212)",
            "Phthalocyanine radical anion",
            "Flavin semiquinone radical",
            "Ubisemiquinone radical",
            "Phenoxyl radical anion",
            "Viologen radical anion",
            "Tetracyanoethylene radical anion (TCNE\u2022\u2212)",
            "7,7,8,8-Tetracyanoquinodimethane radical anion (TCNQ\u2022\u2212)",
            "Nitrobenzene radical anion",
            "Azobenzene radical anion",
            "Pyridine radical anion",
            "Pyrimidine radical anion",
            "Tetrazolium radical",
            "Nitroxide radical anion",
            "Peroxyl radical anion (ROO\u2022\u2212)",
            "Hydroxyl radical anion (HO\u2022\u2212)",
            "Carbonate radical anion (CO3\u2022\u2212)",
            "Sulfite radical anion (SO3\u2022\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2022\u2212)",
                "Nitric oxide (NO\u2022)",
                "Semiquinone radical",
                "Benzene radical anion",
                "Naphthalene radical anion",
                "Anthracene radical anion",
                "Fullerene radical anion (C60\u2022\u2212)",
                "Phthalocyanine radical anion",
                "Flavin semiquinone radical",
                "Ubisemiquinone radical",
                "Phenoxyl radical anion",
                "Viologen radical anion",
                "Tetracyanoethylene radical anion (TCNE\u2022\u2212)",
                "7,7,8,8-Tetracyanoquinodimethane radical anion (TCNQ\u2022\u2212)",
                "Nitrobenzene radical anion",
                "Azobenzene radical anion",
                "Pyridine radical anion",
                "Pyrimidine radical anion",
                "Tetrazolium radical",
                "Nitroxide radical anion",
                "Peroxyl radical anion (ROO\u2022\u2212)",
                "Hydroxyl radical anion (HO\u2022\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Sulfite radical anion (SO3\u2022\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "7,7,8,8-Tetracyanoquinodimethane radical anion (TCNQ\u2022\u2212)",
                "Anthracene radical anion",
                "Azobenzene radical anion",
                "Benzene radical anion",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Flavin semiquinone radical",
                "Fullerene radical anion (C60\u2022\u2212)",
                "Hydroxyl radical anion (HO\u2022\u2212)",
                "Naphthalene radical anion",
                "Nitric oxide (NO\u2022)",
                "Nitrobenzene radical anion",
                "Nitroxide radical anion",
                "Peroxyl radical anion (ROO\u2022\u2212)",
                "Phenoxyl radical anion",
                "Phthalocyanine radical anion",
                "Pyridine radical anion",
                "Pyrimidine radical anion",
                "Semiquinone radical",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Superoxide (O2\u2022\u2212)",
                "Tetracyanoethylene radical anion (TCNE\u2022\u2212)",
                "Tetrazolium radical",
                "Ubisemiquinone radical",
                "Viologen radical anion"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide radical anion (O2\u2022\u2212)",
            "Peroxide dianion (O22\u2212)",
            "Semiquinone radical anion (SQ\u2022\u2212)",
            "Benzoquinone radical anion (BQ\u2022\u2212)",
            "Naphthoquinone radical anion (NQ\u2022\u2212)",
            "Flavin semiquinone radical anion (FADH\u2022)",
            "Phenoxide radical anion (PhO\u2022\u2212)",
            "Nitric oxide radical anion (NO\u2022\u2212)",
            "Nitroxyl anion (NO\u2212)",
            "Azide radical anion (N3\u2022\u2212)",
            "Cyanate radical anion (OCN\u2022\u2212)",
            "Thiocyanate radical anion (SCN\u2022\u2212)",
            "Thiolate radical anion (RS\u2022\u2212)",
            "Disulfide radical anion (RSSR\u2022\u2212)",
            "Sulfite radical anion (SO3\u2022\u2212)",
            "Sulfate radical anion (SO4\u2022\u2212)",
            "Phosphate radical anion (PO4\u20222\u2212)",
            "Pyrophosphate radical anion (P2O7\u20223\u2212)",
            "Carbonate radical anion (CO3\u2022\u2212)",
            "Carboxylate radical anion (RCO2\u2022\u2212)",
            "Acetylacetonate radical anion (acac\u2022\u2212)",
            "Bipyridine radical anion (bpy\u2022\u2212)",
            "Phenanthroline radical anion (phen\u2022\u2212)",
            "Terpyridine radical anion (terpy\u2022\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide radical anion (O2\u2022\u2212)",
                "Peroxide dianion (O22\u2212)",
                "Semiquinone radical anion (SQ\u2022\u2212)",
                "Benzoquinone radical anion (BQ\u2022\u2212)",
                "Naphthoquinone radical anion (NQ\u2022\u2212)",
                "Flavin semiquinone radical anion (FADH\u2022)",
                "Phenoxide radical anion (PhO\u2022\u2212)",
                "Nitric oxide radical anion (NO\u2022\u2212)",
                "Nitroxyl anion (NO\u2212)",
                "Azide radical anion (N3\u2022\u2212)",
                "Cyanate radical anion (OCN\u2022\u2212)",
                "Thiocyanate radical anion (SCN\u2022\u2212)",
                "Thiolate radical anion (RS\u2022\u2212)",
                "Disulfide radical anion (RSSR\u2022\u2212)",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Sulfate radical anion (SO4\u2022\u2212)",
                "Phosphate radical anion (PO4\u20222\u2212)",
                "Pyrophosphate radical anion (P2O7\u20223\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Carboxylate radical anion (RCO2\u2022\u2212)",
                "Acetylacetonate radical anion (acac\u2022\u2212)",
                "Bipyridine radical anion (bpy\u2022\u2212)",
                "Phenanthroline radical anion (phen\u2022\u2212)",
                "Terpyridine radical anion (terpy\u2022\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetylacetonate radical anion (acac\u2022\u2212)",
                "Azide radical anion (N3\u2022\u2212)",
                "Benzoquinone radical anion (BQ\u2022\u2212)",
                "Bipyridine radical anion (bpy\u2022\u2212)",
                "Carbonate radical anion (CO3\u2022\u2212)",
                "Carboxylate radical anion (RCO2\u2022\u2212)",
                "Cyanate radical anion (OCN\u2022\u2212)",
                "Disulfide radical anion (RSSR\u2022\u2212)",
                "Flavin semiquinone radical anion (FADH\u2022)",
                "Naphthoquinone radical anion (NQ\u2022\u2212)",
                "Nitric oxide radical anion (NO\u2022\u2212)",
                "Nitroxyl anion (NO\u2212)",
                "Peroxide dianion (O22\u2212)",
                "Phenanthroline radical anion (phen\u2022\u2212)",
                "Phenoxide radical anion (PhO\u2022\u2212)",
                "Phosphate radical anion (PO4\u20222\u2212)",
                "Pyrophosphate radical anion (P2O7\u20223\u2212)",
                "Semiquinone radical anion (SQ\u2022\u2212)",
                "Sulfate radical anion (SO4\u2022\u2212)",
                "Sulfite radical anion (SO3\u2022\u2212)",
                "Superoxide radical anion (O2\u2022\u2212)",
                "Terpyridine radical anion (terpy\u2022\u2212)",
                "Thiocyanate radical anion (SCN\u2022\u2212)",
                "Thiolate radical anion (RS\u2022\u2212)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Superoxide (O2\u2022\u2212)",
            "Hydroxyl radical (\u2022OH)",
            "Tert-butoxy radical ((CH3)3CO\u2022)",
            "Phenoxy radical (C6H5O\u2022)",
            "Trichloromethyl radical (\u2022CCl3)",
            "Nitric oxide (NO\u2022)",
            "Benzyl radical (C6H5CH2\u2022)",
            "Methyl radical (\u2022CH3)",
            "Ethyl radical (CH3CH2\u2022)",
            "Isopropyl radical ((CH3)2CH\u2022)",
            "Cyclohexadienyl radical (C6H7\u2022)",
            "Triphenylmethyl radical ((C6H5)3C\u2022)",
            "Galvinoxyl radical ((C6H4)2NO\u2022)",
            "Semiquinone radical (C6H4O2\u2022\u2212)",
            "Nitroxide radical (>N\u2013O\u2022)",
            "Aminoxyl radical (>N\u2013O\u2022)",
            "Peroxyl radical (ROO\u2022)",
            "Alkoxyl radical (RO\u2022)",
            "Aryloxyl radical (ArO\u2022)",
            "Acyloxyl radical (RC(O)O\u2022)",
            "Phosphoryl radical (PO2\u2022\u2212)",
            "Thiyl radical (RS\u2022)",
            "Sulfinyl radical (RSO\u2022)",
            "Sulfonyl radical (RSO2\u2022)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Superoxide (O2\u2022\u2212)",
                "Hydroxyl radical (\u2022OH)",
                "Tert-butoxy radical ((CH3)3CO\u2022)",
                "Phenoxy radical (C6H5O\u2022)",
                "Trichloromethyl radical (\u2022CCl3)",
                "Nitric oxide (NO\u2022)",
                "Benzyl radical (C6H5CH2\u2022)",
                "Methyl radical (\u2022CH3)",
                "Ethyl radical (CH3CH2\u2022)",
                "Isopropyl radical ((CH3)2CH\u2022)",
                "Cyclohexadienyl radical (C6H7\u2022)",
                "Triphenylmethyl radical ((C6H5)3C\u2022)",
                "Galvinoxyl radical ((C6H4)2NO\u2022)",
                "Semiquinone radical (C6H4O2\u2022\u2212)",
                "Nitroxide radical (>N\u2013O\u2022)",
                "Aminoxyl radical (>N\u2013O\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Aryloxyl radical (ArO\u2022)",
                "Acyloxyl radical (RC(O)O\u2022)",
                "Phosphoryl radical (PO2\u2022\u2212)",
                "Thiyl radical (RS\u2022)",
                "Sulfinyl radical (RSO\u2022)",
                "Sulfonyl radical (RSO2\u2022)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyloxyl radical (RC(O)O\u2022)",
                "Alkoxyl radical (RO\u2022)",
                "Aminoxyl radical (>N\u2013O\u2022)",
                "Aryloxyl radical (ArO\u2022)",
                "Benzyl radical (C6H5CH2\u2022)",
                "Cyclohexadienyl radical (C6H7\u2022)",
                "Ethyl radical (CH3CH2\u2022)",
                "Galvinoxyl radical ((C6H4)2NO\u2022)",
                "Hydroxyl radical (\u2022OH)",
                "Isopropyl radical ((CH3)2CH\u2022)",
                "Methyl radical (\u2022CH3)",
                "Nitric oxide (NO\u2022)",
                "Nitroxide radical (>N\u2013O\u2022)",
                "Peroxyl radical (ROO\u2022)",
                "Phenoxy radical (C6H5O\u2022)",
                "Phosphoryl radical (PO2\u2022\u2212)",
                "Semiquinone radical (C6H4O2\u2022\u2212)",
                "Sulfinyl radical (RSO\u2022)",
                "Sulfonyl radical (RSO2\u2022)",
                "Superoxide (O2\u2022\u2212)",
                "Tert-butoxy radical ((CH3)3CO\u2022)",
                "Thiyl radical (RS\u2022)",
                "Trichloromethyl radical (\u2022CCl3)",
                "Triphenylmethyl radical ((C6H5)3C\u2022)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Hydroxide Ion (OH-)",
            "Superoxide Radical Anion (O2-)",
            "Peroxide Radical Anion (O2-2)",
            "Nitrite Radical Anion (NO2-)",
            "Nitrate Radical Anion (NO3-)",
            "Sulfite Radical Anion (SO3-)",
            "Sulfate Radical Anion (SO4-)",
            "Phosphite Radical Anion (PO3-)",
            "Phosphate Radical Anion (PO4-)",
            "Acetate Radical Anion (CH3COO-)",
            "Formate Radical Anion (HCOO-)",
            "Oxalate Radical Anion (C2O4-2)",
            "Malonate Radical Anion (CH2(COO-)2)",
            "Succinate Radical Anion (C2H4(COO-)2)",
            "Glutarate Radical Anion (C3H6(COO-)2)",
            "Adipate Radical Anion (C4H8(COO-)2)",
            "Phthalate Radical Anion (C6H4(COO-)2)",
            "Benzoate Radical Anion (C6H5COO-)",
            "Phenoxide Radical Anion (C6H5O-)",
            "Phenolate Radical Anion (C6H5O-)",
            "Thiolate Radical Anion (RS-)",
            "Enolate Radical Anion (R2C=CR-O-)",
            "Carboxylate Radical Anion (R-COO-)",
            "Alkoxide Radical Anion (R-O-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxide Ion (OH-)",
                "Superoxide Radical Anion (O2-)",
                "Peroxide Radical Anion (O2-2)",
                "Nitrite Radical Anion (NO2-)",
                "Nitrate Radical Anion (NO3-)",
                "Sulfite Radical Anion (SO3-)",
                "Sulfate Radical Anion (SO4-)",
                "Phosphite Radical Anion (PO3-)",
                "Phosphate Radical Anion (PO4-)",
                "Acetate Radical Anion (CH3COO-)",
                "Formate Radical Anion (HCOO-)",
                "Oxalate Radical Anion (C2O4-2)",
                "Malonate Radical Anion (CH2(COO-)2)",
                "Succinate Radical Anion (C2H4(COO-)2)",
                "Glutarate Radical Anion (C3H6(COO-)2)",
                "Adipate Radical Anion (C4H8(COO-)2)",
                "Phthalate Radical Anion (C6H4(COO-)2)",
                "Benzoate Radical Anion (C6H5COO-)",
                "Phenoxide Radical Anion (C6H5O-)",
                "Phenolate Radical Anion (C6H5O-)",
                "Thiolate Radical Anion (RS-)",
                "Enolate Radical Anion (R2C=CR-O-)",
                "Carboxylate Radical Anion (R-COO-)",
                "Alkoxide Radical Anion (R-O-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate Radical Anion (CH3COO-)",
                "Adipate Radical Anion (C4H8(COO-)2)",
                "Alkoxide Radical Anion (R-O-)",
                "Benzoate Radical Anion (C6H5COO-)",
                "Carboxylate Radical Anion (R-COO-)",
                "Enolate Radical Anion (R2C=CR-O-)",
                "Formate Radical Anion (HCOO-)",
                "Glutarate Radical Anion (C3H6(COO-)2)",
                "Hydroxide Ion (OH-)",
                "Malonate Radical Anion (CH2(COO-)2)",
                "Nitrate Radical Anion (NO3-)",
                "Nitrite Radical Anion (NO2-)",
                "Oxalate Radical Anion (C2O4-2)",
                "Peroxide Radical Anion (O2-2)",
                "Phenolate Radical Anion (C6H5O-)",
                "Phenoxide Radical Anion (C6H5O-)",
                "Phosphate Radical Anion (PO4-)",
                "Phosphite Radical Anion (PO3-)",
                "Phthalate Radical Anion (C6H4(COO-)2)",
                "Succinate Radical Anion (C2H4(COO-)2)",
                "Sulfate Radical Anion (SO4-)",
                "Sulfite Radical Anion (SO3-)",
                "Superoxide Radical Anion (O2-)",
                "Thiolate Radical Anion (RS-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": "[\n\"Phenolate anion (PhO-)\" ,\n\"Benzoate radical anion (BzO-)\" ,\n\"Hydroquinone radical anion (HQ-)\" ,\n\"Semiquinone radical anion (SQ-)\" ,\n\"Phenoxyl radical anion (PhO-)\" ,\n\"Superoxide radical anion (O2-)\" ,\n\"Hydroxyl radical anion (HO-)\" ,\n\"Alkyl radical anion (R-)\" ,\n\"Carbonyl radical anion (RCO-)\" ,\n\"Alkoxyl radical anion (RO-)\" ,\n\"Acetylcholine radical anion (ACh-)\" ,\n\"Glutathione radical anion (GSH-)\" ,\n\"Ubiquinol radical anion (UQH2-)\" ,\n\"Coenzyme Q radical anion (CoQ-)\" ,\n\"Vitamin C radical anion (Ascorbate-)\" ,\n\"Flavonoid radical anion (Flav-)\" ,\n\"Anthocyanin radical anion (Anth-)\" ,\n\"Quinone radical anion (Q-)\" ,\n\"Anthraquinone radical anion (AQ-)\" ,\n\"Phenothiazine radical anion (PTZ-)\" ,\n\"Flavonoid radical anion (Flav-)\" ,\n\"Phenolic radical anion (PhOH-)\" ,\n\"Thiol radical anion (RSH-)\" ,\n\"Thiyl radical anion (RS-)\" ,\n\"Thiolate radical anion (RS-)\" ,\n\"Thiolate radical anion (RS-)\"",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            "Fluorophenyl anion (FPh-)\"",
            "Chlorophenyl anion (ClPh-)\"",
            "Phenyl anion (Ph-)\"",
            "Benzyl anion (Bn-)\"",
            "4-Nitrophenyl anion (4-NO2Ph-)\"",
            "2-Carboxyphenyl anion (2-CO2Ph-)\"",
            "4-Carboxyphenyl anion (4-CO2Ph-)\"",
            "2-Nitrophenyl anion (2-NO2Ph-)\"",
            "4-Methylphenyl anion (4-CH3Ph-)\"",
            "2-Methylphenyl anion (2-CH3Ph-)\"",
            "4-Methoxyphenyl anion (4-MeOPh-)\"",
            "2-Methoxyphenyl anion (2-MeOPh-)\"",
            "4-Cyanophenyl anion (4-CNPh-)\"",
            "2-Cyanophenyl anion (2-CNPh-)\"",
            "4-Fluorophenyl anion (4-FPh-)\"",
            "2-Fluorophenyl anion (2-FPh-)\"",
            "4-Chlorophenyl anion (4-ClPh-)\"",
            "2-Chlorophenyl anion (2-ClPh-)\"",
            "1-Naphthyl anion (1-Np-)\"",
            "2-Naphthyl anion (2-Np-)\"",
            "9-Anthryl anion (9-Anth-)\"",
            "1-Pyrenyl anion (1-Pyr-)\"",
            "Quinoxaline radical anion (Qx-)\"",
            "Phenanthridine radical anion (Phd-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluorophenyl anion (FPh-)\"",
                "Chlorophenyl anion (ClPh-)\"",
                "Phenyl anion (Ph-)\"",
                "Benzyl anion (Bn-)\"",
                "4-Nitrophenyl anion (4-NO2Ph-)\"",
                "2-Carboxyphenyl anion (2-CO2Ph-)\"",
                "4-Carboxyphenyl anion (4-CO2Ph-)\"",
                "2-Nitrophenyl anion (2-NO2Ph-)\"",
                "4-Methylphenyl anion (4-CH3Ph-)\"",
                "2-Methylphenyl anion (2-CH3Ph-)\"",
                "4-Methoxyphenyl anion (4-MeOPh-)\"",
                "2-Methoxyphenyl anion (2-MeOPh-)\"",
                "4-Cyanophenyl anion (4-CNPh-)\"",
                "2-Cyanophenyl anion (2-CNPh-)\"",
                "4-Fluorophenyl anion (4-FPh-)\"",
                "2-Fluorophenyl anion (2-FPh-)\"",
                "4-Chlorophenyl anion (4-ClPh-)\"",
                "2-Chlorophenyl anion (2-ClPh-)\"",
                "1-Naphthyl anion (1-Np-)\"",
                "2-Naphthyl anion (2-Np-)\"",
                "9-Anthryl anion (9-Anth-)\"",
                "1-Pyrenyl anion (1-Pyr-)\"",
                "Quinoxaline radical anion (Qx-)\"",
                "Phenanthridine radical anion (Phd-)"
            ],
            "mismatches": [],
            "true_referents": [
                "1-Naphthyl anion (1-Np-)\"",
                "1-Pyrenyl anion (1-Pyr-)\"",
                "2-Carboxyphenyl anion (2-CO2Ph-)\"",
                "2-Chlorophenyl anion (2-ClPh-)\"",
                "2-Cyanophenyl anion (2-CNPh-)\"",
                "2-Fluorophenyl anion (2-FPh-)\"",
                "2-Methoxyphenyl anion (2-MeOPh-)\"",
                "2-Methylphenyl anion (2-CH3Ph-)\"",
                "2-Naphthyl anion (2-Np-)\"",
                "2-Nitrophenyl anion (2-NO2Ph-)\"",
                "4-Carboxyphenyl anion (4-CO2Ph-)\"",
                "4-Chlorophenyl anion (4-ClPh-)\"",
                "4-Cyanophenyl anion (4-CNPh-)\"",
                "4-Fluorophenyl anion (4-FPh-)\"",
                "4-Methoxyphenyl anion (4-MeOPh-)\"",
                "4-Methylphenyl anion (4-CH3Ph-)\"",
                "4-Nitrophenyl anion (4-NO2Ph-)\"",
                "9-Anthryl anion (9-Anth-)\"",
                "Benzyl anion (Bn-)\"",
                "Chlorophenyl anion (ClPh-)\"",
                "Fluorophenyl anion (FPh-)\"",
                "Phenanthridine radical anion (Phd-)",
                "Phenyl anion (Ph-)\"",
                "Quinoxaline radical anion (Qx-)\""
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "radical anion",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Benzene",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Anthracenyl",
                "Canonical Name": "(C14H10)\u2212"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            },
            {
                "Referent": "Phenyl radical anion",
                "Canonical Name": "(C6H5)\u2212"
            },
            {
                "Referent": "Benzene radical anion",
                "Canonical Name": "(C6H6)\u2212"
            },
            {
                "Referent": "Phenyl radical cation",
                "Canonical Name": "(C6H5)2+"
            },
            {
                "Referent": "Benzene radical cation",
                "Canonical Name": "(C6H6)2+"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzene",
                "Phenyl",
                "Anthracenyl",
                "Phenyl radical anion",
                "Benzene radical anion",
                "Phenyl radical cation",
                "Benzene radical cation"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Anthracenyl\", \"Canonical Name\": \"(C14H10)\\u2212\"}",
                "{\"Referent\": \"Benzene radical anion\", \"Canonical Name\": \"(C6H6)\\u2212\"}",
                "{\"Referent\": \"Benzene radical cation\", \"Canonical Name\": \"(C6H6)2+\"}",
                "{\"Referent\": \"Benzene\", \"Canonical Name\": \"(C6H6)\\u2212\"}",
                "{\"Referent\": \"Phenyl radical anion\", \"Canonical Name\": \"(C6H5)\\u2212\"}",
                "{\"Referent\": \"Phenyl radical cation\", \"Canonical Name\": \"(C6H5)2+\"}",
                "{\"Referent\": \"Phenyl\", \"Canonical Name\": \"(C6H5)\\u2212\"}"
            ],
            "TP": 7,
            "FP": 0,
            "FN": 0
        }
    }
]