[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "sulfite (SO3^2-)",
            "carbonate (CO3^2-)",
            "sulfide (S^2-)",
            "dithionite (S2O4^2-)",
            "oxalate (C2O4^2-)",
            "permanganate (MnO4^2-)",
            "chromate (CrO4^2-)",
            "disulfite (SO2^2-)",
            "thiosulfate (S2O3^2-)",
            "arsenite (AsO3^2-)",
            "phosphate (PO4^3-, with dianion HPO4^2-)",
            "selenite (SeO3^2-)",
            "tellurite (TeO3^2-)",
            "borate (BO3^3-, with dianion B4O5^2-)",
            "cyanate (OCN^-, with dianion NCO^2-)",
            "perchlorate (ClO4^-, with dianion ClO3^2-)",
            "nitrite (NO2^- with dianion N2O4^2-)",
            "hydrogen sulfite (HSO3^- with dianion SO3^2-)",
            "hydrogen phosphate (H2PO4^- with dianion HPO4^2-)",
            "hydrogen arsenite (HAsO3^- with dianion AsO3^2-)",
            "hydrogen selenite (HSeO3^- with dianion SeO3^2-)",
            "hydrogen tellurite (HTeO3^- with dianion TeO3^2-)",
            "hydrogen borate (HBO3^- with dianion B4O5^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfite (SO3^2-)",
                "sulfide (S^2-)",
                "chromate (CrO4^2-)",
                "thiosulfate (S2O3^2-)",
                "arsenite (AsO3^2-)",
                "hydrogen phosphate (H2PO4^- with dianion HPO4^2-)"
            ],
            "mismatches": [
                "carbonate (CO3^2-)",
                "dithionite (S2O4^2-)",
                "oxalate (C2O4^2-)",
                "permanganate (MnO4^2-)",
                "disulfite (SO2^2-)",
                "selenite (SeO3^2-)",
                "tellurite (TeO3^2-)",
                "borate (BO3^3-, with dianion B4O5^2-)",
                "cyanate (OCN^-, with dianion NCO^2-)",
                "perchlorate (ClO4^-, with dianion ClO3^2-)",
                "nitrite (NO2^- with dianion N2O4^2-)",
                "hydrogen sulfite (HSO3^- with dianion SO3^2-)",
                "hydrogen arsenite (HAsO3^- with dianion AsO3^2-)",
                "hydrogen selenite (HSeO3^- with dianion SeO3^2-)",
                "hydrogen tellurite (HTeO3^- with dianion TeO3^2-)",
                "hydrogen borate (HBO3^- with dianion B4O5^2-)"
            ],
            "true_referents": [
                "(3E)-dec-3-en-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dithiophosphate(2-)",
                "dodecaboride(2-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 6,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Oxalate (C2O4^2-)",
            "Sulfate (SO4^2-)",
            "Sulfite (SO3^2-)",
            "Carbonate (CO3^2-)",
            "Bicarbonate (HCO3^-)",
            "Acetate (C2H3O2^-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Permanganate (MnO4^-)",
            "Phosphate (PO4^3-)",
            "Phosphite (PO3^3-)",
            "Arsenate (AsO4^3-)",
            "Arsenite (AsO3^3-)",
            "Borate (BO3^3-)",
            "Nitrate (NO3^-)",
            "Nitrite (NO2^-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Hydrogen sulfide (HS^-)",
            "Thiosulfate (S2O3^2-)",
            "Thiocyanate (SCN^-)",
            "Fumarate (C4H2O4^2-)",
            "Malonate (C3H2O4^2-)",
            "Tartrate (C4H4O6^2-)",
            "Orotate (C5H3N2O4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Sulfite (SO3^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Arsenite (AsO3^3-)",
                "Hydrogen phosphate (HPO4^2-)",
                "Thiosulfate (S2O3^2-)"
            ],
            "mismatches": [
                "Oxalate (C2O4^2-)",
                "Carbonate (CO3^2-)",
                "Bicarbonate (HCO3^-)",
                "Acetate (C2H3O2^-)",
                "Permanganate (MnO4^-)",
                "Phosphate (PO4^3-)",
                "Phosphite (PO3^3-)",
                "Arsenate (AsO4^3-)",
                "Borate (BO3^3-)",
                "Nitrate (NO3^-)",
                "Nitrite (NO2^-)",
                "Hydrogen sulfide (HS^-)",
                "Thiocyanate (SCN^-)",
                "Fumarate (C4H2O4^2-)",
                "Malonate (C3H2O4^2-)",
                "Tartrate (C4H4O6^2-)",
                "Orotate (C5H3N2O4^2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2',3'-dipalmitoyl-2-sulfo-alpha,alpha-trehalose(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3-(3-sulfooxyphenyl)propanoate(2-)",
                "4-methylumbelliferone sulfate(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Oxide ion (O^2-)",
            "Sulfide ion (S^2-)",
            "Selenide ion (Se^2-)",
            "Telluride ion (Te^2-)",
            "Sulfite ion (SO3^2-)",
            "Chlorite ion (ClO2^2-)",
            "Bromite ion (BrO2^2-)",
            "Iodite ion (IO2^2-)",
            "Carbonate ion (CO3^2-)",
            "Sulfate ion (SO4^2-)",
            "Chromate ion (CrO4^2-)",
            "Molybdate ion (MoO4^2-)",
            "Tungstate ion (WO4^2-)",
            "Phosphate ion (PO4^3-)",
            "Nitrate ion (NO3^-)",
            "Perchlorate ion (ClO4^-)",
            "Permanganate ion (MnO4^-)",
            "Thiosulfate ion (S2O3^2-)",
            "Dithionite ion (S2O4^2-)",
            "Hypochlorite ion (ClO^-)",
            "Hypobromite ion (BrO^-)",
            "Hypoiodite ion (IO^-)",
            "Hydroxide ion (OH^-)",
            "Peroxide ion (O2^2-)",
            "Ozonide ion (O3^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfide ion (S^2-)",
                "Sulfite ion (SO3^2-)",
                "Sulfate ion (SO4^2-)",
                "Chromate ion (CrO4^2-)",
                "Molybdate ion (MoO4^2-)",
                "Tungstate ion (WO4^2-)",
                "Thiosulfate ion (S2O3^2-)"
            ],
            "mismatches": [
                "Oxide ion (O^2-)",
                "Selenide ion (Se^2-)",
                "Telluride ion (Te^2-)",
                "Chlorite ion (ClO2^2-)",
                "Bromite ion (BrO2^2-)",
                "Iodite ion (IO2^2-)",
                "Carbonate ion (CO3^2-)",
                "Phosphate ion (PO4^3-)",
                "Nitrate ion (NO3^-)",
                "Perchlorate ion (ClO4^-)",
                "Permanganate ion (MnO4^-)",
                "Dithionite ion (S2O4^2-)",
                "Hypochlorite ion (ClO^-)",
                "Hypobromite ion (BrO^-)",
                "Hypoiodite ion (IO^-)",
                "Hydroxide ion (OH^-)",
                "Peroxide ion (O2^2-)",
                "Ozonide ion (O3^-)"
            ],
            "true_referents": [
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dithiophosphate(2-)",
                "hexyl sulfate(1-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 7,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Nitrate (NO\u2083\u00b2\u207b)",
            "Phosphate (PO\u2084\u00b3\u207b)",
            "Chromate (CrO\u2084\u00b2\u207b)",
            "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
            "Silicate (SiO\u2083\u00b2\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Hydrogen Carbonate/Bicarbonate (HCO\u2083\u207b)",
            "Hydrogen Sulfate/Bisulfate (HSO\u2084\u207b)",
            "Cyanide (CN\u207b)",
            "Oxalate (C\u2082O\u2084\u00b2\u207b)",
            "Tartrate (C\u2084H\u2084O\u2086\u00b2\u207b)",
            "Succinate (C\u2084H\u2084O\u2084\u00b2\u207b)",
            "Glutarate (C\u2085H\u2086O\u2084\u00b2\u207b)",
            "Adipate (C\u2086H\u2081\u2080O\u2084\u00b2\u207b)",
            "Maleate (C\u2084H\u2082O\u2084\u00b2\u207b)",
            "Fumarate (C\u2084H\u2082O\u2084\u00b2\u207b)",
            "Phthalate (C\u2088H\u2084O\u2084\u00b2\u207b)",
            "Isophthalate (C\u2088H\u2084O\u2084\u00b2\u207b)",
            "Terephthalate (C\u2088H\u2084O\u2084\u00b2\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Hypochlorite (ClO\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Chromate (CrO\u2084\u00b2\u207b)",
                "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)"
            ],
            "mismatches": [
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Nitrate (NO\u2083\u00b2\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)",
                "Silicate (SiO\u2083\u00b2\u207b)",
                "Hydrogen Carbonate/Bicarbonate (HCO\u2083\u207b)",
                "Hydrogen Sulfate/Bisulfate (HSO\u2084\u207b)",
                "Cyanide (CN\u207b)",
                "Oxalate (C\u2082O\u2084\u00b2\u207b)",
                "Tartrate (C\u2084H\u2084O\u2086\u00b2\u207b)",
                "Succinate (C\u2084H\u2084O\u2084\u00b2\u207b)",
                "Glutarate (C\u2085H\u2086O\u2084\u00b2\u207b)",
                "Adipate (C\u2086H\u2081\u2080O\u2084\u00b2\u207b)",
                "Maleate (C\u2084H\u2082O\u2084\u00b2\u207b)",
                "Fumarate (C\u2084H\u2082O\u2084\u00b2\u207b)",
                "Phthalate (C\u2088H\u2084O\u2084\u00b2\u207b)",
                "Isophthalate (C\u2088H\u2084O\u2084\u00b2\u207b)",
                "Terephthalate (C\u2088H\u2084O\u2084\u00b2\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Hypochlorite (ClO\u207b)"
            ],
            "true_referents": [
                "(2R)-2,6-dimethylheptyl sulfate",
                "(3Z,6Z)-dodeca-3,6-dien-1-yl sulfate",
                "(4R)-4,8-dimethylnonyl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "4-isopropylphenyl sulfate(1-)",
                "4-methylumbelliferone sulfate(1-)",
                "6-O-sulfonato-D-glucono-1,5-lactone(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "bisphenol A sulfate(1-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "methyl sulfate(1-)",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "propyl 4-hydroxybenzoate sulfate(1-)",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Silicate (SiO3^2-)",
            "Thiosulfate (S2O3^2-)",
            "Oxalate (C2O4^2-)",
            "Peroxide (O2^2-)",
            "Molybdate (MoO4^2-)",
            "Selenate (SeO4^2-)",
            "Tungstate (WO4^2-)",
            "Tellurate (TeO4^2-)",
            "Tartrate (C4H4O6^2-)",
            "Zincate (ZnO2^2-)",
            "Phthalate (C8H4O4^2-)",
            "Pyrophosphate (P2O7^2-)",
            "Borate (B4O7^2-)",
            "Selenite (SeO3^2-)",
            "Tellurite (TeO3^2-)",
            "Vanadate (VO4^2-)",
            "Sulfite (SO3^2-)",
            "Arsenate (AsO4^2-)",
            "Arsenite (AsO3^2-)",
            "Hydrogen Phosphate (HPO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Thiosulfate (S2O3^2-)",
                "Molybdate (MoO4^2-)",
                "Selenate (SeO4^2-)",
                "Tungstate (WO4^2-)",
                "Sulfite (SO3^2-)",
                "Arsenite (AsO3^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Silicate (SiO3^2-)",
                "Oxalate (C2O4^2-)",
                "Peroxide (O2^2-)",
                "Tellurate (TeO4^2-)",
                "Tartrate (C4H4O6^2-)",
                "Zincate (ZnO2^2-)",
                "Phthalate (C8H4O4^2-)",
                "Pyrophosphate (P2O7^2-)",
                "Borate (B4O7^2-)",
                "Selenite (SeO3^2-)",
                "Tellurite (TeO3^2-)",
                "Vanadate (VO4^2-)",
                "Arsenate (AsO4^2-)",
                "Hydrogen Phosphate (HPO4^2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "bisphenol A sulfate(1-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "propyl 4-hydroxybenzoate sulfate(1-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Phosphate (PO4^2-)",
            "Oxalate (C2O4^2-)",
            "Silicate (SiO3^2-)",
            "Chlorate (ClO3^2-)",
            "Arsenate (AsO4^2-)",
            "Boronate (B(OH)4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Cromate (CrO4^2-)",
            "Manganate (MnO4^2-)",
            "Vanadate (VO4^2-)",
            "Tungstate (WO4^2-)",
            "Zirconate (ZrO4^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Hydrosulfate (HSO4^2-)",
            "Germinate (GeO4^2-)",
            "Perchlorate (ClO4^2-)",
            "Nitrate (NO3^2-)",
            "Peroxide (O2^2-)",
            "Bromate (BrO3^2-)",
            "Iodate (IO3^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Thiosulfate (S2O3^2-)",
                "Manganate (MnO4^2-)",
                "Tungstate (WO4^2-)",
                "Selenate (SeO4^2-)",
                "Hydrogen phosphate (HPO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Phosphate (PO4^2-)",
                "Oxalate (C2O4^2-)",
                "Silicate (SiO3^2-)",
                "Chlorate (ClO3^2-)",
                "Arsenate (AsO4^2-)",
                "Boronate (B(OH)4^2-)",
                "Cromate (CrO4^2-)",
                "Vanadate (VO4^2-)",
                "Zirconate (ZrO4^2-)",
                "Tellurate (TeO4^2-)",
                "Hydrosulfate (HSO4^2-)",
                "Germinate (GeO4^2-)",
                "Perchlorate (ClO4^2-)",
                "Nitrate (NO3^2-)",
                "Peroxide (O2^2-)",
                "Bromate (BrO3^2-)",
                "Iodate (IO3^2-)"
            ],
            "true_referents": [
                "(3E)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "beta-D-GlcA3S-(1->3)-beta-D-Gal-OMe(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "orthoperiodate(2-)",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Dichromate (Cr2O7^2-)",
            "Oxalate (C2O4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Chromate (CrO4^2-)",
            "Perchlorate (ClO4^2-)",
            "Molybdate (MoO4^2-)",
            "Silicate (SiO3^2-)",
            "Phosphate (PO4^2-)",
            "Arsenate (AsO4^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Vanadate (VO4^2-)",
            "Antimonate (SbO4^2-)",
            "Stannate (SnO3^2-)",
            "Plumbate (PbO4^2-)",
            "Borate (BO3^2-)",
            "Wolframate (WO4^2-)",
            "Titanate (TiO3^2-)",
            "Zirconate (ZrO3^2-)",
            "Niobate (NbO3^2-)",
            "Tantalate (TaO3^2-)",
            "Germanate (GeO3^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Thiosulfate (S2O3^2-)",
                "Chromate (CrO4^2-)",
                "Molybdate (MoO4^2-)",
                "Selenate (SeO4^2-)",
                "Antimonate (SbO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Oxalate (C2O4^2-)",
                "Perchlorate (ClO4^2-)",
                "Silicate (SiO3^2-)",
                "Phosphate (PO4^2-)",
                "Arsenate (AsO4^2-)",
                "Tellurate (TeO4^2-)",
                "Vanadate (VO4^2-)",
                "Stannate (SnO3^2-)",
                "Plumbate (PbO4^2-)",
                "Borate (BO3^2-)",
                "Wolframate (WO4^2-)",
                "Titanate (TiO3^2-)",
                "Zirconate (ZrO3^2-)",
                "Niobate (NbO3^2-)",
                "Tantalate (TaO3^2-)",
                "Germanate (GeO3^2-)"
            ],
            "true_referents": [
                "(3E)-dec-3-en-1-yl sulfate",
                "(3Z)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "12-sulfojasmonate",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "Watasenia luciferin(2-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "tetrachlorozincate(2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4)",
            "Carbonate (CO3)",
            "Oxide (O2-)",
            "Nitrate (NO3)",
            "Phosphate (PO4)",
            "Chloride (Cl)",
            "Bromide (Br)",
            "Iodide (I)",
            "Fluoride (F)",
            "Selenide (Se2-)",
            "Telluride (Te2-)",
            "Sulfide (S2-)",
            "Oxysulfide (S2O2-)",
            "Nitrite (NO2-)",
            "Phosphite (PO3-)",
            "Hypochlorite (ClO-)",
            "Chlorite (ClO2-)",
            "Chlorate (ClO3-)",
            "Perchlorate (ClO4-)",
            "Bromate (BrO3-)",
            "Iodate (IO3-)",
            "Periodate (IO4-)",
            "Fluorosilicate (SiF6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4)",
                "Sulfide (S2-)"
            ],
            "mismatches": [
                "Carbonate (CO3)",
                "Oxide (O2-)",
                "Nitrate (NO3)",
                "Phosphate (PO4)",
                "Chloride (Cl)",
                "Bromide (Br)",
                "Iodide (I)",
                "Fluoride (F)",
                "Selenide (Se2-)",
                "Telluride (Te2-)",
                "Oxysulfide (S2O2-)",
                "Nitrite (NO2-)",
                "Phosphite (PO3-)",
                "Hypochlorite (ClO-)",
                "Chlorite (ClO2-)",
                "Chlorate (ClO3-)",
                "Perchlorate (ClO4-)",
                "Bromate (BrO3-)",
                "Iodate (IO3-)",
                "Periodate (IO4-)",
                "Fluorosilicate (SiF6)"
            ],
            "true_referents": [
                "(dioxido)trioxidophosphate(.2-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "bisphenol A sulfate(1-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "diphosphate(2-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "organosulfate oxoanion",
                "phosphonate(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)"
            ],
            "TP": 2,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Oxide (O\u00b2\u207b)",
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Chromate (CrO\u2084\u00b2\u207b)",
            "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
            "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
            "Phosphite (PO\u2083\u00b2\u207b)",
            "Selenate (SeO\u2084\u00b2\u207b)",
            "Selenite (SeO\u2083\u00b2\u207b)",
            "Tellurate (TeO\u2084\u00b2\u207b)",
            "Tellurite (TeO\u2083\u00b2\u207b)",
            "Peroxydisulfate (S\u2082O\u2088\u00b2\u207b)",
            "Tartrate (C\u2084H\u2084O\u2086\u00b2\u207b)",
            "Malonate (C\u2083H\u2082O\u2084\u00b2\u207b)",
            "Oxalate (C\u2082O\u2084\u00b2\u207b)",
            "Thiosulfate (S\u2082O\u2083\u00b2\u207b)",
            "Pyrosulfate (S\u2082O\u2087\u00b2\u207b)",
            "Peroxomonosulfate (HSO\u2085\u00b2\u207b)",
            "Dissulfate (S\u2082O\u2087\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Chromate (CrO\u2084\u00b2\u207b)",
                "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
                "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
                "Selenate (SeO\u2084\u00b2\u207b)",
                "Thiosulfate (S\u2082O\u2083\u00b2\u207b)"
            ],
            "mismatches": [
                "Oxide (O\u00b2\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Phosphite (PO\u2083\u00b2\u207b)",
                "Selenite (SeO\u2083\u00b2\u207b)",
                "Tellurate (TeO\u2084\u00b2\u207b)",
                "Tellurite (TeO\u2083\u00b2\u207b)",
                "Peroxydisulfate (S\u2082O\u2088\u00b2\u207b)",
                "Tartrate (C\u2084H\u2084O\u2086\u00b2\u207b)",
                "Malonate (C\u2083H\u2082O\u2084\u00b2\u207b)",
                "Oxalate (C\u2082O\u2084\u00b2\u207b)",
                "Pyrosulfate (S\u2082O\u2087\u00b2\u207b)",
                "Peroxomonosulfate (HSO\u2085\u00b2\u207b)",
                "Dissulfate (S\u2082O\u2087\u00b2\u207b)"
            ],
            "true_referents": [
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2',3'-dipalmitoyl-2-sulfo-alpha,alpha-trehalose(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "methyl sulfate(1-)",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "organosulfate oxoanion",
                "phosphonate(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "tungstate"
            ],
            "TP": 7,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Carbonate (CO3\u00b2\u207b)",
            "Sulfate (SO4\u00b2\u207b)",
            "Sulfite (SO3\u00b2\u207b)",
            "Chromate (CrO4\u00b2\u207b)",
            "Dichromate (Cr2O7\u00b2\u207b)",
            "Selenate (SeO4\u00b2\u207b)",
            "Selenite (SeO3\u00b2\u207b)",
            "Tellurate (TeO4\u00b2\u207b)",
            "Tellurite (TeO3\u00b2\u207b)",
            "Oxalate (C2O4\u00b2\u207b)",
            "Thiosulfate (S2O3\u00b2\u207b)",
            "Silicate (SiO3\u00b2\u207b)",
            "Molybdate (MoO4\u00b2\u207b)",
            "Tungstate (WO4\u00b2\u207b)",
            "Peroxide (O2\u00b2\u207b)",
            "Sulfide (S\u00b2\u207b)",
            "Selenide (Se\u00b2\u207b)",
            "Telluride (Te\u00b2\u207b)",
            "Oxide (O\u00b2\u207b)",
            "Hydroxide (OH\u207b)\u2082",
            "Phosphite (HPO3\u00b2\u207b)",
            "Hydrogen phosphate (HPO4\u00b2\u207b)",
            "Hydrogen arsenate (HAsO4\u00b2\u207b)",
            "Manganate (MnO4\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4\u00b2\u207b)",
                "Sulfite (SO3\u00b2\u207b)",
                "Chromate (CrO4\u00b2\u207b)",
                "Dichromate (Cr2O7\u00b2\u207b)",
                "Selenate (SeO4\u00b2\u207b)",
                "Thiosulfate (S2O3\u00b2\u207b)",
                "Molybdate (MoO4\u00b2\u207b)",
                "Tungstate (WO4\u00b2\u207b)",
                "Sulfide (S\u00b2\u207b)",
                "Manganate (MnO4\u00b2\u207b)",
                "Hydrogen phosphate (HPO4\u00b2\u207b)"
            ],
            "mismatches": [
                "Carbonate (CO3\u00b2\u207b)",
                "Selenite (SeO3\u00b2\u207b)",
                "Tellurate (TeO4\u00b2\u207b)",
                "Tellurite (TeO3\u00b2\u207b)",
                "Oxalate (C2O4\u00b2\u207b)",
                "Silicate (SiO3\u00b2\u207b)",
                "Peroxide (O2\u00b2\u207b)",
                "Selenide (Se\u00b2\u207b)",
                "Telluride (Te\u00b2\u207b)",
                "Oxide (O\u00b2\u207b)",
                "Hydroxide (OH\u207b)\u2082",
                "Phosphite (HPO3\u00b2\u207b)",
                "Hydrogen arsenate (HAsO4\u00b2\u207b)"
            ],
            "true_referents": [
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "carbonate (CO3 2-)",
            "sulfate (SO4 2-)",
            "sulfite (SO3 2-)",
            "thiosulfate (S2O3 2-)",
            "chromate (CrO4 2-)",
            "dichromate (Cr2O7 2-)",
            "molybdate (MoO4 2-)",
            "tungstate (WO4 2-)",
            "selenate (SeO4 2-)",
            "selenite (SeO3 2-)",
            "tellurate (TeO4 2-)",
            "tellurite (TeO3 2-)",
            "manganate (MnO4 2-)",
            "silicate (SiO4 2-)",
            "germanate (GeO4 2-)",
            "stannate (SnO3 2-)",
            "plumbate (PbO3 2-)",
            "titanate (TiO3 2-)",
            "zirconate (ZrO3 2-)",
            "hafnate (HfO3 2-)",
            "vanadate (VO4 2-)",
            "niobate (NbO4 2-)",
            "tantalate (TaO4 2-)",
            "chromite (CrO3 2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfate (SO4 2-)",
                "sulfite (SO3 2-)",
                "thiosulfate (S2O3 2-)",
                "chromate (CrO4 2-)",
                "dichromate (Cr2O7 2-)",
                "molybdate (MoO4 2-)",
                "tungstate (WO4 2-)",
                "selenate (SeO4 2-)",
                "manganate (MnO4 2-)"
            ],
            "mismatches": [
                "carbonate (CO3 2-)",
                "selenite (SeO3 2-)",
                "tellurate (TeO4 2-)",
                "tellurite (TeO3 2-)",
                "silicate (SiO4 2-)",
                "germanate (GeO4 2-)",
                "stannate (SnO3 2-)",
                "plumbate (PbO3 2-)",
                "titanate (TiO3 2-)",
                "zirconate (ZrO3 2-)",
                "hafnate (HfO3 2-)",
                "vanadate (VO4 2-)",
                "niobate (NbO4 2-)",
                "tantalate (TaO4 2-)",
                "chromite (CrO3 2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "halistanol sulfate F(3-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "sulfate (SO4^2-)",
            "sulfite (SO3^2-)",
            "carbonate (CO3^2-)",
            "chromate (CrO4^2-)",
            "oxalate (C2O4^2-)",
            "silicate (SiO4^4-)",
            "phosphate (PO4^3-)",
            "arsenate (AsO4^3-)",
            "selenate (SeO4^2-)",
            "molybdate (MoO4^2-)",
            "tungstate (WO4^2-)",
            "tellurate (TeO4^2-)",
            "stannate (SnO3^2-)",
            "germanate (GeO3^2-)",
            "plumbate (PbO3^2-)",
            "manganate (MnO4^2-)",
            "perrhenate (ReO4^-)",
            "dichromate (Cr2O7^2-)",
            "pyrophosphate (P2O7^4-)",
            "hypochlorite (ClO^-)",
            "chlorite (ClO2^-)",
            "chlorate (ClO3^-)",
            "perchlorate (ClO4^-)",
            "periodate (IO4^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfate (SO4^2-)",
                "sulfite (SO3^2-)",
                "chromate (CrO4^2-)",
                "selenate (SeO4^2-)",
                "molybdate (MoO4^2-)",
                "tungstate (WO4^2-)",
                "manganate (MnO4^2-)",
                "dichromate (Cr2O7^2-)"
            ],
            "mismatches": [
                "carbonate (CO3^2-)",
                "oxalate (C2O4^2-)",
                "silicate (SiO4^4-)",
                "phosphate (PO4^3-)",
                "arsenate (AsO4^3-)",
                "tellurate (TeO4^2-)",
                "stannate (SnO3^2-)",
                "germanate (GeO3^2-)",
                "plumbate (PbO3^2-)",
                "perrhenate (ReO4^-)",
                "pyrophosphate (P2O7^4-)",
                "hypochlorite (ClO^-)",
                "chlorite (ClO2^-)",
                "chlorate (ClO3^-)",
                "perchlorate (ClO4^-)",
                "periodate (IO4^-)"
            ],
            "true_referents": [
                "(3E)-dec-3-en-1-yl sulfate",
                "(3Z)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "tetraoxorhenate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Phosphate (PO4^3-)",
            "Oxide (O^2-)",
            "Nitrite (NO2^-)",
            "Nitrate (NO3^-)",
            "Hydroxide (OH^-)",
            "Peroxide (O2^2-)",
            "Thiosulfate (S2O3^2-)",
            "Pyrophosphate (P2O7^4-)",
            "Silicate (SiO3^2-)",
            "Borate (BO3^3-)",
            "Chromate (CrO4^2-)",
            "Manganate (MnO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Permanganate (MnO4^-)",
            "Arsenate (AsO4^3-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Vanadate (VO4^3-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Uranate (UO4^2-)",
            "Perchlorate (ClO4^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thiosulfate (S2O3^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Manganate (MnO4^2-)",
                "Selenate (SeO4^2-)",
                "Molybdate (MoO4^2-)",
                "Tungstate (WO4^2-)"
            ],
            "mismatches": [
                "Sulfate (SO4^2-)",
                "Carbonate (CO3^2-)",
                "Phosphate (PO4^3-)",
                "Oxide (O^2-)",
                "Nitrite (NO2^-)",
                "Nitrate (NO3^-)",
                "Hydroxide (OH^-)",
                "Peroxide (O2^2-)",
                "Pyrophosphate (P2O7^4-)",
                "Silicate (SiO3^2-)",
                "Borate (BO3^3-)",
                "Permanganate (MnO4^-)",
                "Arsenate (AsO4^3-)",
                "Tellurate (TeO4^2-)",
                "Vanadate (VO4^3-)",
                "Uranate (UO4^2-)",
                "Perchlorate (ClO4^-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Oxalate (Ox2-)",
            "Sulfate (SO42-)",
            "Phosphate (PO43-)",
            "Nitrite (NO2-)",
            "Carbonate (CO32-)",
            "Chlorate (ClO3-)",
            "Bromate (BrO3-)",
            "Iodate (IO3-)",
            "Perchlorate (ClO4-)",
            "Nitrate (NO3-)",
            "Selenate (SeO42-)",
            "Tellurate (TeO42-)",
            "Tungstate (WO42-)",
            "Molybdate (MoO42-)",
            "Vanadate (VO3-)",
            "Chromate (CrO42-)",
            "Silicate (SiO43-)",
            "Arsenate (AsO43-)",
            "Antimonate (SbO3-)",
            "Tantalate (TaO3-)",
            "Niobate (NbO3-)",
            "Tetrathionate (S4O62-)",
            "Dithionate (S2O62-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Selenate (SeO42-)",
                "Tungstate (WO42-)",
                "Molybdate (MoO42-)",
                "Chromate (CrO42-)"
            ],
            "mismatches": [
                "Oxalate (Ox2-)",
                "Sulfate (SO42-)",
                "Phosphate (PO43-)",
                "Nitrite (NO2-)",
                "Carbonate (CO32-)",
                "Chlorate (ClO3-)",
                "Bromate (BrO3-)",
                "Iodate (IO3-)",
                "Perchlorate (ClO4-)",
                "Nitrate (NO3-)",
                "Tellurate (TeO42-)",
                "Vanadate (VO3-)",
                "Silicate (SiO43-)",
                "Arsenate (AsO43-)",
                "Antimonate (SbO3-)",
                "Tantalate (TaO3-)",
                "Niobate (NbO3-)",
                "Tetrathionate (S4O62-)",
                "Dithionate (S2O62-)"
            ],
            "true_referents": [
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "12-sulfojasmonate",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dimolybdate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "dithiophosphate(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "manganate",
                "methyl sulfate(1-)",
                "molybdate",
                "phosphonate(2-)",
                "selenate",
                "sulfate",
                "tetrachlorozincate(2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 4,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Oxide (O\u00b2\u207b)",
            "Hydroxide (OH\u207b)",
            "Sulfide (S\u00b2\u207b)",
            "Chloride (Cl\u00b2\u207b)",
            "Bromide (Br\u00b2\u207b)",
            "Iodide (I\u00b2\u207b)",
            "Phosphide (P\u00b2\u207b)",
            "Arsonide (As\u00b2\u207b)",
            "Antimonide (Sb\u00b2\u207b)",
            "Bismuthide (Bi\u00b2\u207b)",
            "Selenide (Se\u00b2\u207b)",
            "Telluride (Te\u00b2\u207b)",
            "Polonide (Po\u00b2\u207b)",
            "Astatide (At\u00b2\u207b)",
            "Radonide (Rn\u00b2\u207b)",
            "Oxoanionsulfide (SO\u2083\u00b2\u207b)",
            "Oxoanionnitrite (NO\u2082\u207b)",
            "Oxoanionphosphate (PO\u2084\u00b2\u207b)",
            "Oxoanionsilicate (SiO\u2083\u00b2\u207b)",
            "Oxoanionborate (BO\u2083\u00b2\u207b)",
            "Oxoanionarsenate (AsO\u2083\u00b2\u207b)",
            "Oxoanionchromate (CrO\u2084\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfide (S\u00b2\u207b)"
            ],
            "mismatches": [
                "Oxide (O\u00b2\u207b)",
                "Hydroxide (OH\u207b)",
                "Chloride (Cl\u00b2\u207b)",
                "Bromide (Br\u00b2\u207b)",
                "Iodide (I\u00b2\u207b)",
                "Phosphide (P\u00b2\u207b)",
                "Arsonide (As\u00b2\u207b)",
                "Antimonide (Sb\u00b2\u207b)",
                "Bismuthide (Bi\u00b2\u207b)",
                "Selenide (Se\u00b2\u207b)",
                "Telluride (Te\u00b2\u207b)",
                "Polonide (Po\u00b2\u207b)",
                "Astatide (At\u00b2\u207b)",
                "Radonide (Rn\u00b2\u207b)",
                "Oxoanionsulfide (SO\u2083\u00b2\u207b)",
                "Oxoanionnitrite (NO\u2082\u207b)",
                "Oxoanionphosphate (PO\u2084\u00b2\u207b)",
                "Oxoanionsilicate (SiO\u2083\u00b2\u207b)",
                "Oxoanionborate (BO\u2083\u00b2\u207b)",
                "Oxoanionarsenate (AsO\u2083\u00b2\u207b)",
                "Oxoanionchromate (CrO\u2084\u00b2\u207b)"
            ],
            "true_referents": [
                "(R)-secondary-alkyl sulfate oxoanion",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "aryl sulfate oxoanion",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dithiophosphate(2-)",
                "dodecaboride(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "organosulfate oxoanion",
                "phenyl sulfate oxoanion",
                "phosphonate(2-)",
                "selenate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)"
            ],
            "TP": 1,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            {
                "Example": "nitrite",
                "Canonical name": "nitrite (NO2-)"
            },
            {
                "Example": "cyanide",
                "Canonical name": "cyanide (CN-)"
            },
            {
                "Example": "hydrogen sulfide",
                "Canonical name": "hydrogen sulfide (H2S)"
            },
            {
                "Example": "sulfite",
                "Canonical name": "sulfite (SO32-)"
            },
            {
                "Example": "acetate",
                "Canonical name": "acetate (CH3COO-)"
            },
            {
                "Example": "chlorate",
                "Canonical name": "chlorate (ClO3-)"
            },
            {
                "Example": "perchlorate",
                "Canonical name": "perchlorate (ClO4-)"
            },
            {
                "Example": "bromate",
                "Canonical name": "bromate (BrO3-)"
            },
            {
                "Example": "iodate",
                "Canonical name": "iodate (IO3-)"
            },
            {
                "Example": "periodate",
                "Canonical name": "periodate (IO4-)"
            },
            {
                "Example": "nitrate",
                "Canonical name": "nitrate (NO3-)"
            },
            {
                "Example": "sulfate",
                "Canonical name": "sulfate (SO42-)"
            },
            {
                "Example": "phosphate",
                "Canonical name": "phosphate (PO43-)"
            },
            {
                "Example": "carbonate",
                "Canonical name": "carbonate (CO32-)"
            },
            {
                "Example": "hydrogen carbonate",
                "Canonical name": "hydrogen carbonate (HCO3-)"
            },
            {
                "Example": "bicarbonate",
                "Canonical name": "bicarbonate (HCO3-)"
            },
            {
                "Example": "sulfide",
                "Canonical name": "sulfide (S2-)"
            },
            {
                "Example": "selenide",
                "Canonical name": "selenide (Se2-)"
            },
            {
                "Example": "telluride",
                "Canonical name": "telluride (Te2-)"
            },
            {
                "Example": "nitride",
                "Canonical name": "nitride (N3-)"
            },
            {
                "Example": "phosphide",
                "Canonical name": "phosphide (P3-)"
            },
            {
                "Example": "arsenide",
                "Canonical name": "arsenide (As3-)"
            },
            {
                "Example": "antimonide",
                "Canonical name": "antimonide (Sb3-)"
            },
            {
                "Example": "bismuthide",
                "Canonical name": "bismuthide (Bi3-)"
            },
            {
                "Example": "titanide",
                "Canonical name": "titanide (Ti3-)"
            },
            {
                "Example": "vanadate",
                "Canonical name": "vanadate (VO2-)"
            },
            {
                "Example": "chromate",
                "Canonical name": "chromate (CrO42-)"
            },
            {
                "Example": "manganate",
                "Canonical name": "manganate (MnO4-)"
            },
            {
                "Example": "molybdate",
                "Canonical name": "molybdate (MoO42-)"
            },
            {
                "Example": "tungstate",
                "Canonical name": "tungstate (WO42-)"
            },
            {
                "Example": "uranate",
                "Canonical name": "uranate (UO22+)"
            },
            {
                "Example": "oxalate",
                "Canonical name": "oxalate (C2O42-)"
            },
            {
                "Example": "formate",
                "Canonical name": "formate (HCOO-)"
            },
            {
                "Example": "acetate",
                "Canonical name": "acetate (CH3COO-)"
            },
            {
                "Example": "propionate",
                "Canonical name": "propionate (CH3CH2COO-)"
            },
            {
                "Example": "butyrate",
                "Canonical name": "butyrate (CH3CH2CH2COO-)"
            },
            {
                "Example": "valerate",
                "Canonical name": "valerate (CH3CH2CH2CH2COO-)"
            },
            {
                "Example": "heptanoate",
                "Canonical name": "heptanoate (CH3CH2CH2CH2CH2COO-)"
            },
            {
                "Example": "octanoate",
                "Canonical name": "octanoate (CH3CH2CH2CH2CH2CH2COO-)"
            },
            {
                "Example": "nonanoate",
                "Canonical name": "nonanoate (CH3CH2CH2CH2CH2CH2CH2COO-)"
            },
            {
                "Example": "decanoate",
                "Canonical name": "decanoate (CH3CH2CH2CH2CH2CH2CH2CH2COO-)"
            },
            {
                "Example": "undecanoate",
                "Canonical name": "undecanoate (CH3CH2CH2CH2CH2CH2CH2CH2CH2COO-)"
            },
            {
                "Example": "dodecanoate",
                "Canonical name": "dodecanoate (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2COO-)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfate",
                "chromate",
                "molybdate"
            ],
            "mismatches": [
                "nitrite",
                "cyanide",
                "hydrogen sulfide",
                "sulfite",
                "acetate",
                "chlorate",
                "perchlorate",
                "bromate",
                "iodate",
                "periodate",
                "nitrate",
                "phosphate",
                "carbonate",
                "hydrogen carbonate",
                "bicarbonate",
                "sulfide",
                "selenide",
                "telluride",
                "nitride",
                "phosphide",
                "arsenide",
                "antimonide",
                "bismuthide",
                "titanide",
                "vanadate",
                "manganate",
                "tungstate",
                "uranate",
                "oxalate",
                "formate",
                "propionate",
                "butyrate",
                "valerate",
                "heptanoate",
                "octanoate",
                "nonanoate",
                "decanoate",
                "undecanoate",
                "dodecanoate"
            ],
            "true_referents": [
                "(S)-2-O-sulfonatolactate(2-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydroxidotrioxidomanganate(2-)",
                "methyl sulfate(1-)",
                "molybdate",
                "orthoperiodate(2-)",
                "phosphonate(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "tetrachlorozincate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)"
            ],
            "TP": 3,
            "FP": 39,
            "FN": 0
        }
    }
]