[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Bicarbonate (HCO3^-)",
            "Phosphate (PO4^3-)",
            "Dihydrogen phosphate (H2PO4^-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Silicate (SiO3^2-)",
            "Oxalate (C2O4^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Arsenate (AsO4^3-)",
            "Vanadate (VO4^3-)",
            "Tungstate (WO4^2-)",
            "Molybdate (MoO4^2-)",
            "Nitrite (NO2^-)",
            "Nitrate (NO3^-)",
            "Chromate (CrO4^2-)",
            "Permanganate (MnO4^-)",
            "Chlorate (ClO3^-)",
            "Bromate (BrO3^-)",
            "Iodate (IO3^-)",
            "Thiosulfate (S2O3^2-)",
            "Fluoride (F^-)",
            "Sulfite (SO3^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Hydrogen phosphate (HPO4^2-)",
                "Selenate (SeO4^2-)",
                "Tungstate (WO4^2-)",
                "Molybdate (MoO4^2-)",
                "Chromate (CrO4^2-)",
                "Thiosulfate (S2O3^2-)",
                "Sulfite (SO3^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Bicarbonate (HCO3^-)",
                "Phosphate (PO4^3-)",
                "Dihydrogen phosphate (H2PO4^-)",
                "Silicate (SiO3^2-)",
                "Oxalate (C2O4^2-)",
                "Tellurate (TeO4^2-)",
                "Arsenate (AsO4^3-)",
                "Vanadate (VO4^3-)",
                "Nitrite (NO2^-)",
                "Nitrate (NO3^-)",
                "Permanganate (MnO4^-)",
                "Chlorate (ClO3^-)",
                "Bromate (BrO3^-)",
                "Iodate (IO3^-)",
                "Fluoride (F^-)"
            ],
            "true_referents": [
                "(3E)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Chloride (ClO4^2-)",
            "Nitrate (NO3^2-)",
            "Phosphate (PO4^3-)",
            "Acetate (C2H3O2^-)",
            "Bicarbonate (HCO3^-)",
            "Selenate (SeO4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Molybdate (MoO4^2-)",
            "Permanganate (MnO4^-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Arsenate (AsO4^3-)",
            "Cyanate (OCN^-)",
            "Oxalate (C2O4^2-)",
            "Tartrate (C4H4O6^2-)",
            "Fumarate (C4H2O4^2-)",
            "Malonate (C3H2O4^2-)",
            "Adeninate (Ade^2-)",
            "Formate (HCOO^-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Dihydrogen phosphate (H2PO4^-)",
            "Methanolate (CH3O^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Selenate (SeO4^2-)",
                "Thiosulfate (S2O3^2-)",
                "Molybdate (MoO4^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Hydrogen phosphate (HPO4^2-)"
            ],
            "mismatches": [
                "Sulfate (SO4^2-)",
                "Carbonate (CO3^2-)",
                "Chloride (ClO4^2-)",
                "Nitrate (NO3^2-)",
                "Phosphate (PO4^3-)",
                "Acetate (C2H3O2^-)",
                "Bicarbonate (HCO3^-)",
                "Permanganate (MnO4^-)",
                "Arsenate (AsO4^3-)",
                "Cyanate (OCN^-)",
                "Oxalate (C2O4^2-)",
                "Tartrate (C4H4O6^2-)",
                "Fumarate (C4H2O4^2-)",
                "Malonate (C3H2O4^2-)",
                "Adeninate (Ade^2-)",
                "Formate (HCOO^-)",
                "Dihydrogen phosphate (H2PO4^-)",
                "Methanolate (CH3O^-)"
            ],
            "true_referents": [
                "(4R)-4,8-dimethylnonyl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2',3'-dipalmitoyl-2-sulfo-alpha,alpha-trehalose(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3'-phosphonato-5'-adenylyl sulfate(4-)",
                "3-(3-sulfooxyphenyl)propanoate(2-)",
                "4-methylumbelliferone sulfate(1-)",
                "5'-adenylyl sulfate(2-)",
                "D-glucose 6-sulfate(1-)",
                "alkyl sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "indoxyl sulfate(1-)",
                "manganate",
                "methyl sulfate(1-)",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Carbonate (CO3^2-)",
            "Sulfate (SO4^2-)",
            "Phosphate (PO4^3-)",
            "Chromate (CrO4^2-)",
            "Oxalate (C2O4^2-)",
            "Molybdate (MoO4^2-)",
            "Selenite (SeO3^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Tellurite (TeO3^2-)",
            "Peroxide (O2^2-)",
            "Thiocyanate (SCN^-)",
            "Azide (N3^-)",
            "Cyanate (OCN^-)",
            "Dithionite (S2O4^2-)",
            "Dithionate (S2O6^2-)",
            "Hypochlorite (ClO^-)",
            "Hypobromite (BrO^-)",
            "Hypoiodite (IO^-)",
            "Perchlorate (ClO4^-)",
            "Permanganate (MnO4^-)",
            "Cyanide (CN^-)",
            "Chlorite (ClO2^-)",
            "Bromite (BrO2^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Chromate (CrO4^2-)",
                "Molybdate (MoO4^2-)",
                "Selenate (SeO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Phosphate (PO4^3-)",
                "Oxalate (C2O4^2-)",
                "Selenite (SeO3^2-)",
                "Tellurate (TeO4^2-)",
                "Tellurite (TeO3^2-)",
                "Peroxide (O2^2-)",
                "Thiocyanate (SCN^-)",
                "Azide (N3^-)",
                "Cyanate (OCN^-)",
                "Dithionite (S2O4^2-)",
                "Dithionate (S2O6^2-)",
                "Hypochlorite (ClO^-)",
                "Hypobromite (BrO^-)",
                "Hypoiodite (IO^-)",
                "Perchlorate (ClO4^-)",
                "Permanganate (MnO4^-)",
                "Cyanide (CN^-)",
                "Chlorite (ClO2^-)",
                "Bromite (BrO2^-)"
            ],
            "true_referents": [
                "(3Z)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "(dioxido)trioxidophosphate(.2-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dithiophosphate(2-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Chromate (CrO\u2084\u00b2\u207b)",
            "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Silicate (SiO\u2083\u00b2\u207b)",
            "Phosphate (PO\u2084\u00b3\u207b) - behaving as divalent under specific pH",
            "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
            "Hydrogen Carbonate (HCO\u2083\u207b) - behaving as divalent under specific pH",
            "Thiosulfate (S\u2082O\u2083\u00b2\u207b)",
            "Molybdate (MoO\u2084\u00b2\u207b)",
            "Tungstate (WO\u2084\u00b2\u207b)",
            "Vanadate (VO\u2084\u00b3\u207b) - behaving as divalent under specific pH",
            "Arsenate (AsO\u2084\u00b3\u207b) - behaving as divalent under specific pH",
            "Permanganate (MnO\u2084\u207b) - though often considered tetravalent, exhibits divalent characteristics in reactions",
            "Selenate (SeO\u2084\u00b2\u207b)",
            "Tellurate (TeO\u2084\u00b2\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Cyanide (CN\u207b) - coordinating as a divalent ligand",
            "Oxalate (C\u2082O\u2084\u00b2\u207b)",
            "Tartrate (C\u2084H\u2084O\u2086\u00b2\u207b)",
            "Malonate (C\u2083H\u2082O\u2084\u00b2\u207b)",
            "Succinate (C\u2084H\u2084O\u2084\u00b2\u207b)",
            "Adipate (C\u2086H\u2081\u2080O\u2084\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Chromate (CrO\u2084\u00b2\u207b)",
                "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
                "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
                "Thiosulfate (S\u2082O\u2083\u00b2\u207b)",
                "Molybdate (MoO\u2084\u00b2\u207b)",
                "Tungstate (WO\u2084\u00b2\u207b)",
                "Selenate (SeO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)"
            ],
            "mismatches": [
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Silicate (SiO\u2083\u00b2\u207b)",
                "Hydrogen Carbonate (HCO\u2083\u207b) - behaving as divalent under specific pH",
                "Vanadate (VO\u2084\u00b3\u207b) - behaving as divalent under specific pH",
                "Arsenate (AsO\u2084\u00b3\u207b) - behaving as divalent under specific pH",
                "Permanganate (MnO\u2084\u207b) - though often considered tetravalent, exhibits divalent characteristics in reactions",
                "Tellurate (TeO\u2084\u00b2\u207b)",
                "Cyanide (CN\u207b) - coordinating as a divalent ligand",
                "Oxalate (C\u2082O\u2084\u00b2\u207b)",
                "Tartrate (C\u2084H\u2084O\u2086\u00b2\u207b)",
                "Malonate (C\u2083H\u2082O\u2084\u00b2\u207b)",
                "Succinate (C\u2084H\u2084O\u2084\u00b2\u207b)",
                "Adipate (C\u2086H\u2081\u2080O\u2084\u00b2\u207b)"
            ],
            "true_referents": [
                "(2R)-2,6-dimethylheptyl sulfate",
                "(3Z,6Z)-dodeca-3,6-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2',3'-dipalmitoyl-2-sulfo-alpha,alpha-trehalose(1-)",
                "6-O-sulfonato-D-glucono-1,5-lactone(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "aryl sulfate oxoanion",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl sulfate(1-)",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "phenyl sulfate oxoanion",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate",
                "vanillyl alcohol monosulfate(1-)"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Oxalate (C2O4^2-)",
            "Peroxide (O2^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Silicate (SiO3^2-)",
            "Selenite (SeO3^2-)",
            "Tellurite (TeO3^2-)",
            "Tartrate (C4H4O6^2-)",
            "Phthalate (C8H4O4^2-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Pyrophosphate (P2O7^4-)",
            "Disulfide (S2^2-)",
            "Oxalate (C2O4^2-)",
            "Peroxodisulfate (S2O8^2-)",
            "Tetraborate (B4O7^2-)",
            "Citrate (C6H5O7^3-)",
            "Thiocyanate (SCN^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Molybdate (MoO4^2-)",
                "Tungstate (WO4^2-)",
                "Selenate (SeO4^2-)",
                "Thiosulfate (S2O3^2-)",
                "Hydrogen phosphate (HPO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Oxalate (C2O4^2-)",
                "Peroxide (O2^2-)",
                "Tellurate (TeO4^2-)",
                "Silicate (SiO3^2-)",
                "Selenite (SeO3^2-)",
                "Tellurite (TeO3^2-)",
                "Tartrate (C4H4O6^2-)",
                "Phthalate (C8H4O4^2-)",
                "Pyrophosphate (P2O7^4-)",
                "Disulfide (S2^2-)",
                "Peroxodisulfate (S2O8^2-)",
                "Tetraborate (B4O7^2-)",
                "Citrate (C6H5O7^3-)",
                "Thiocyanate (SCN^-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "bisphenol A sulfate(1-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dithiophosphate(2-)",
                "dodecaboride(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "propyl 4-hydroxybenzoate sulfate(1-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "tetraoxidophosphate(.2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 8,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Phosphate (PO4^3-)",
            "Nitrate (NO3^-)",
            "Sulfite (SO3^2-)",
            "Arsenate (AsO4^3-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Hydroxide (OH^-)",
            "Silicate (SiO3^2-)",
            "Vanadate (VO4^3-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Tellurate (TeO4^2-)",
            "Perchlorate (ClO4^-)",
            "Bicarbonate (HCO3^-)",
            "Selenate (SeO4^2-)",
            "Borate (BO3^3-)",
            "Oxalate (C2O4^2-)",
            "Cyanate (OCN^-)",
            "Thiosulfate (S2O3^2-)",
            "Phosphite (PO3^3-)",
            "Arsenite (AsO3^3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfate",
                "sulfite",
                "chromate(2-)",
                "dichromate(2-)",
                "hydrogenphosphate",
                "molybdate",
                "selenate",
                "thiosulfate(2-)",
                "arsenite(2-)"
            ],
            "mismatches": [
                "carbonate (CO3^2-)",
                "phosphate (PO4^3-)",
                "nitrate (NO3^-)",
                "arsenate (AsO4^3-)",
                "hydroxide (OH^-)",
                "silicate (SiO3^2-)",
                "vanadate (VO4^3-)",
                "tungstate (WO4^2-)",
                "tellurate (TeO4^2-)",
                "perchlorate (ClO4^-)",
                "bicarbonate (HCO3^-)",
                "borate (BO3^3-)",
                "oxalate (C2O4^2-)",
                "cyanate (OCN^-)",
                "phosphite (PO3^3-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Oxalate (C2O4^2-)",
            "Silicate (SiO3^2-)",
            "Phosphate (PO4^2-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Dihydrogen phosphate (H2PO4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Tartrate (C4H4O6^2-)",
            "Perchlorate (ClO4^2-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Tellurate (TeO4^2-)",
            "Selenate (SeO4^2-)",
            "Vanadate (VO4^2-)",
            "Niobate (NbO3^2-)",
            "Titanate (TiO3^2-)",
            "Zirconate (ZrO3^2-)",
            "Hafnate (HfO3^2-)",
            "Stannate (SnO3^2-)",
            "Plumbate (PbO3^2-)",
            "Bismuthate (BiO3^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Hydrogen phosphate (HPO4^2-)",
                "Thiosulfate (S2O3^2-)",
                "Molybdate (MoO4^2-)",
                "Tungstate (WO4^2-)",
                "Selenate (SeO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Oxalate (C2O4^2-)",
                "Silicate (SiO3^2-)",
                "Phosphate (PO4^2-)",
                "Dihydrogen phosphate (H2PO4^2-)",
                "Tartrate (C4H4O6^2-)",
                "Perchlorate (ClO4^2-)",
                "Tellurate (TeO4^2-)",
                "Vanadate (VO4^2-)",
                "Niobate (NbO3^2-)",
                "Titanate (TiO3^2-)",
                "Zirconate (ZrO3^2-)",
                "Hafnate (HfO3^2-)",
                "Stannate (SnO3^2-)",
                "Plumbate (PbO3^2-)",
                "Bismuthate (BiO3^2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "bisphenol A sulfate(1-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "halistanol sulfate F(3-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "tetrachlorozincate(2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Fluoride (F-)",
            "Hydroxide (OH-)",
            "Nitrate (NO3-)",
            "Nitrite (NO2-)",
            "Sulfate (SO4^2-)",
            "Sulfite (SO3^2-)",
            "Carbonate (CO3^2-)",
            "Phosphate (PO4^3-)",
            "Arsenate (AsO4^3-)",
            "Cyanide (CN-)",
            "Borate (BO3^3-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Permanganate (MnO4-)",
            "Peroxide (O2^2-)",
            "Thiocyanate (SCN-)",
            "Acetate (C2H3O2-)",
            "Oxalate (C2O4^2-)",
            "Silicate (SiO3^2-)",
            "Thiosulfate (S2O3^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Sulfite (SO3^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Thiosulfate (S2O3^2-)",
                "Selenate (SeO4^2-)"
            ],
            "mismatches": [
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Fluoride (F-)",
                "Hydroxide (OH-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Carbonate (CO3^2-)",
                "Phosphate (PO4^3-)",
                "Arsenate (AsO4^3-)",
                "Cyanide (CN-)",
                "Borate (BO3^3-)",
                "Permanganate (MnO4-)",
                "Peroxide (O2^2-)",
                "Thiocyanate (SCN-)",
                "Acetate (C2H3O2-)",
                "Oxalate (C2O4^2-)",
                "Silicate (SiO3^2-)",
                "Tellurate (TeO4^2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "3-(3-sulfooxyphenyl)propanoate(2-)",
                "3-hydroxypyridine sulfate(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Oxalate (C\u2082O\u2084\u00b2\u207b)",
            "Chromate (CrO\u2084\u00b2\u207b)",
            "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Thiosulfate (S\u2082O\u2083\u00b2\u207b)",
            "Peroxydisulfate (S\u2082O\u2088\u00b2\u207b)",
            "Manganate (MnO\u2084\u00b2\u207b)",
            "Molybdate (MoO\u2084\u00b2\u207b)",
            "Tungstate (WO\u2084\u00b2\u207b)",
            "Vanadate (VO\u2084\u00b2\u207b)",
            "Selenate (SeO\u2084\u00b2\u207b)",
            "Selenite (SeO\u2083\u00b2\u207b)",
            "Tellurate (TeO\u2084\u00b2\u207b)",
            "Tellurite (TeO\u2083\u00b2\u207b)",
            "Dithionate (S\u2082O\u2086\u00b2\u207b)",
            "Hydrogen phosphate (HPO\u2084\u00b2\u207b)",
            "Silicate (SiO\u2083\u00b2\u207b)",
            "Peroxomonosulfate (HSO\u2085\u00b2\u207b)",
            "Peroxotungstate (W\u2082O\u2087\u00b2\u207b)",
            "Peroxomanganate (MnO\u2085\u00b2\u207b)",
            "Peroxovanadate (VO\u2085\u00b2\u207b)",
            "Peroxomolybdate (MoO\u2085\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Chromate (CrO\u2084\u00b2\u207b)",
                "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Manganate (MnO\u2084\u00b2\u207b)",
                "Molybdate (MoO\u2084\u00b2\u207b)",
                "Tungstate (WO\u2084\u00b2\u207b)",
                "Selenate (SeO\u2084\u00b2\u207b)"
            ],
            "mismatches": [
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Oxalate (C\u2082O\u2084\u00b2\u207b)",
                "Thiosulfate (S\u2082O\u2083\u00b2\u207b)",
                "Peroxydisulfate (S\u2082O\u2088\u00b2\u207b)",
                "Vanadate (VO\u2084\u00b2\u207b)",
                "Selenite (SeO\u2083\u00b2\u207b)",
                "Tellurate (TeO\u2084\u00b2\u207b)",
                "Tellurite (TeO\u2083\u00b2\u207b)",
                "Dithionate (S\u2082O\u2086\u00b2\u207b)",
                "Hydrogen phosphate (HPO\u2084\u00b2\u207b)",
                "Silicate (SiO\u2083\u00b2\u207b)",
                "Peroxomonosulfate (HSO\u2085\u00b2\u207b)",
                "Peroxotungstate (W\u2082O\u2087\u00b2\u207b)",
                "Peroxomanganate (MnO\u2085\u00b2\u207b)",
                "Peroxovanadate (VO\u2085\u00b2\u207b)",
                "Peroxomolybdate (MoO\u2085\u00b2\u207b)"
            ],
            "true_referents": [
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dithiophosphate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl sulfate(1-)",
                "molybdate",
                "organosulfate oxoanion",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "tungstate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Oxide (O^2-)",
            "Sulfite (SO3^2-)",
            "Selenate (SeO4^2-)",
            "Chromate (CrO4^2-)",
            "Dichromate (Cr2O7^2-)",
            "Sulfide (S^2-)",
            "Selenite (SeO3^2-)",
            "Tellurite (TeO3^2-)",
            "Tellurate (TeO4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Silicate (SiO3^2-)",
            "Phosphite (HPO3^2-)",
            "Hydrogen phosphate (HPO4^2-)",
            "Peroxide (O2^2-)",
            "Manganate (MnO4^2-)",
            "Permanganate (MnO4^2-)",
            "Oxalate (C2O4^2-)",
            "Sulfamate (NH2SO3^2-)",
            "Periodate (IO4^2-)",
            "Borate (BO3^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Sulfite (SO3^2-)",
                "Selenate (SeO4^2-)",
                "Chromate (CrO4^2-)",
                "Dichromate (Cr2O7^2-)",
                "Sulfide (S^2-)",
                "Thiosulfate (S2O3^2-)",
                "Molybdate (MoO4^2-)",
                "Tungstate (WO4^2-)",
                "Hydrogen phosphate (HPO4^2-)",
                "Manganate (MnO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Oxide (O^2-)",
                "Selenite (SeO3^2-)",
                "Tellurite (TeO3^2-)",
                "Tellurate (TeO4^2-)",
                "Silicate (SiO3^2-)",
                "Phosphite (HPO3^2-)",
                "Peroxide (O2^2-)",
                "Permanganate (MnO4^2-)",
                "Oxalate (C2O4^2-)",
                "Sulfamate (NH2SO3^2-)",
                "Periodate (IO4^2-)",
                "Borate (BO3^2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "3-D-glucuronosyl-N(2),6-disulfonato-beta-D-glucosamine(3-)",
                "3-aminopropyl N-acetyl-6-O-sulfonato-beta-D-glucosaminide",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "dodecaboride(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "carbonate (CO3^2-)",
            "sulfate (SO4^2-)",
            "sulfite (SO3^2-)",
            "thiosulfate (S2O3^2-)",
            "chromate (CrO4^2-)",
            "dichromate (Cr2O7^2-)",
            "molybdate (MoO4^2-)",
            "tungstate (WO4^2-)",
            "selenate (SeO4^2-)",
            "selenite (SeO3^2-)",
            "tellurate (TeO4^2-)",
            "tellurite (TeO3^2-)",
            "manganate (MnO4^2-)",
            "silicate (SiO4^4-)",
            "germanate (GeO4^4-)",
            "stannate (SnO3^2-)",
            "plumbate (PbO3^2-)",
            "titanate (TiO3^2-)",
            "zirconate (ZrO3^2-)",
            "vanadate (VO4^3-)",
            "niobate (NbO4^3-)",
            "tantalate (TaO4^3-)",
            "phosphate (PO4^3-)",
            "arsenate (AsO4^3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfate (SO4^2-)",
                "sulfite (SO3^2-)",
                "thiosulfate (S2O3^2-)",
                "chromate (CrO4^2-)",
                "dichromate (Cr2O7^2-)",
                "molybdate (MoO4^2-)",
                "tungstate (WO4^2-)",
                "selenate (SeO4^2-)",
                "manganate (MnO4^2-)"
            ],
            "mismatches": [
                "carbonate (CO3^2-)",
                "selenite (SeO3^2-)",
                "tellurate (TeO4^2-)",
                "tellurite (TeO3^2-)",
                "silicate (SiO4^4-)",
                "germanate (GeO4^4-)",
                "stannate (SnO3^2-)",
                "plumbate (PbO3^2-)",
                "titanate (TiO3^2-)",
                "zirconate (ZrO3^2-)",
                "vanadate (VO4^3-)",
                "niobate (NbO4^3-)",
                "tantalate (TaO4^3-)",
                "phosphate (PO4^3-)",
                "arsenate (AsO4^3-)"
            ],
            "true_referents": [
                "(3Z)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Sulfate (SO4^2-)",
            "Carbonate (CO3^2-)",
            "Chromate (CrO4^2-)",
            "Oxalate (C2O4^2-)",
            "Selenate (SeO4^2-)",
            "Silicate (SiO3^2-)",
            "Phosphate (PO4^3-)",
            "Sulfite (SO3^2-)",
            "Thiosulfate (S2O3^2-)",
            "Dichromate (Cr2O7^2-)",
            "Molybdate (MoO4^2-)",
            "Pyrophosphate (P2O7^4-)",
            "Hypochlorite (ClO^-)",
            "Chlorite (ClO2^-)",
            "Chlorate (ClO3^-)",
            "Perchlorate (ClO4^-)",
            "Permanganate (MnO4^-)",
            "Arsenate (AsO4^3-)",
            "Borate (BO3^3-)",
            "Nitrite (NO2^-)",
            "Nitrate (NO3^-)",
            "Peroxide (O2^2-)",
            "Hydroxide (OH^-)",
            "Carbide (C^4-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Chromate (CrO4^2-)",
                "Selenate (SeO4^2-)",
                "Sulfite (SO3^2-)",
                "Thiosulfate (S2O3^2-)",
                "Dichromate (Cr2O7^2-)",
                "Molybdate (MoO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Oxalate (C2O4^2-)",
                "Silicate (SiO3^2-)",
                "Phosphate (PO4^3-)",
                "Pyrophosphate (P2O7^4-)",
                "Hypochlorite (ClO^-)",
                "Chlorite (ClO2^-)",
                "Chlorate (ClO3^-)",
                "Perchlorate (ClO4^-)",
                "Permanganate (MnO4^-)",
                "Arsenate (AsO4^3-)",
                "Borate (BO3^3-)",
                "Nitrite (NO2^-)",
                "Nitrate (NO3^-)",
                "Peroxide (O2^2-)",
                "Hydroxide (OH^-)",
                "Carbide (C^4-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "dodecaboride(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "oxidized Watasenia luciferin(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "tetraoxidophosphate(.2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Carbonate (CO3^2-)",
            "Sulfate (SO4^2-)",
            "Phosphate (PO4^3-)",
            "Oxalate (C2O4^2-)",
            "Chromate (CrO4^2-)",
            "Selenate (SeO4^2-)",
            "Tellurate (TeO4^2-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Permanganate (MnO4^2-)",
            "Thiosulfate (S2O3^2-)",
            "Dithionite (S2O4^2-)",
            "Diphosphate (P2O7^4-)",
            "Pyrophosphate (P2O7^4-)",
            "Silicate (SiO3^2-)",
            "Borate (BO3^3-)",
            "Vanadate (VO4^3-)",
            "Titanate (TiO3^2-)",
            "Zirconate (ZrO3^2-)",
            "Stannate (SnO3^2-)",
            "Plumbate (PbO3^2-)",
            "Manganate (MnO4^2-)",
            "Ferrate (FeO4^2-)",
            "Cobaltate (CoO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO4^2-)",
                "Chromate (CrO4^2-)",
                "Selenate (SeO4^2-)",
                "Molybdate (MoO4^2-)",
                "Tungstate (WO4^2-)",
                "Thiosulfate (S2O3^2-)",
                "Diphosphate (P2O7^4-)",
                "Manganate (MnO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Phosphate (PO4^3-)",
                "Oxalate (C2O4^2-)",
                "Tellurate (TeO4^2-)",
                "Permanganate (MnO4^2-)",
                "Dithionite (S2O4^2-)",
                "Pyrophosphate (P2O7^4-)",
                "Silicate (SiO3^2-)",
                "Borate (BO3^3-)",
                "Vanadate (VO4^3-)",
                "Titanate (TiO3^2-)",
                "Zirconate (ZrO3^2-)",
                "Stannate (SnO3^2-)",
                "Plumbate (PbO3^2-)",
                "Ferrate (FeO4^2-)",
                "Cobaltate (CoO4^2-)"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(dioxido)trioxidophosphate(.2-)",
                "1,2,3-benzenetriol monosulfate(1-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "4-vinylguaiacol sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "dithiophosphate(2-)",
                "dodecaboride(2-)",
                "hydrogenphosphate",
                "hydrogenselenophosphate",
                "hydrogenvanadate",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "tetraoxidophosphate(.2-)",
                "tetraoxorhenate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Carbonate (CO3^2-)",
            "Sulfate (SO4^2-)",
            "Phosphate (PO4^3-)",
            "Nitrite (NO2^-)",
            "Nitrate (NO3^-)",
            "Chloride (Cl^-)",
            "Bromide (Br^-)",
            "Iodide (I^-)",
            "Fluoride (F^-)",
            "Acetate (CH3COO^-)",
            "Citrate (C6H5O7^2-)",
            "Tartrate (C4H4O6^2-)",
            "Malate (C4H4O5^2-)",
            "Oxalate (C2O4^2-)",
            "Selenite (SeO3^2-)",
            "Selenate (SeO4^2-)",
            "Tellurite (TeO3^2-)",
            "Tellurate (TeO4^2-)",
            "Arsenate (AsO4^3-)",
            "Arsenite (AsO3^3-)",
            "Phosphite (PO3^3-)",
            "Phosphonate (PO3R^2-)",
            "Silicate (SiO4^4-)",
            "Germanate (GeO4^2-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Selenate (SeO4^2-)",
                "Arsenite (AsO3^3-)",
                "Phosphonate (PO3R^2-)",
                "Sulfate (SO4^2-)",
                "Tungstate (WO4^2-)"
            ],
            "mismatches": [
                "Carbonate (CO3^2-)",
                "Phosphate (PO4^3-)",
                "Nitrite (NO2^-)",
                "Nitrate (NO3^-)",
                "Chloride (Cl^-)",
                "Bromide (Br^-)",
                "Iodide (I^-)",
                "Fluoride (F^-)",
                "Acetate (CH3COO^-)",
                "Citrate (C6H5O7^2-)",
                "Tartrate (C4H4O6^2-)",
                "Malate (C4H4O5^2-)",
                "Oxalate (C2O4^2-)",
                "Selenite (SeO3^2-)",
                "Tellurite (TeO3^2-)",
                "Tellurate (TeO4^2-)",
                "Arsenate (AsO4^3-)",
                "Phosphite (PO3^3-)",
                "Silicate (SiO4^4-)",
                "Germanate (GeO4^2-)",
                "Molybdate (MoO4^2-)"
            ],
            "true_referents": [
                "(3Z)-dec-3-en-1-yl sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "(dioxido)trioxidophosphate(.2-)",
                "2-ethylhexyl sulfate(1-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "3-phosphonatopyruvate(3-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydrogenselenophosphate",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "phosphonate(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "tetrachlorozincate(2-)",
                "tetraoxorhenate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 5,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-) ",
            "Hydrogen carbonate (HCO3-) ",
            "Bicarbonate (HCO3-) ",
            "Sulfate (SO42-) ",
            "Thiosulfate (S2O32-) ",
            "Hydrogen sulfate (HSO4-) ",
            "Phosphate (PO43-) ",
            "Hydrogen phosphate (HPO42-) ",
            "Dihydrogen phosphate (H2PO4-) ",
            "Carbonate (CO32-) ",
            "Hydrogen carbonate (HCO3-) ",
            "Chromate (CrO42-) ",
            "Permanganate (MnO4-) ",
            "Ar\u0441\u0435\u043dite (AsO33-) ",
            "Antimonite (SbO33-) ",
            "Silicate (SiO44-) ",
            "Metasilicate (SiO32-) ",
            "Orthosilicate (SiO44-) ",
            "Metaborate (BO32-) ",
            "Orthoborate (BO33-) ",
            "Hydrogen oxalate (HC2O4-) ",
            "Oxalate (C2O42-) ",
            "Hydrogen citrate (HC6H5O7-) ",
            "Citrate (C6H5O73-) "
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfate (SO42-)",
                "Thiosulfate (S2O32-)",
                "Chromate (CrO42-)"
            ],
            "mismatches": [
                "Chloride (Cl-)",
                "Hydrogen carbonate (HCO3-)",
                "Bicarbonate (HCO3-)",
                "Hydrogen sulfate (HSO4-)",
                "Phosphate (PO43-)",
                "Hydrogen phosphate (HPO42-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Carbonate (CO32-)",
                "Permanganate (MnO4-)",
                "Ar\u0441enite (AsO33-)",
                "Antimonite (SbO33-)",
                "Silicate (SiO44-)",
                "Metasilicate (SiO32-)",
                "Orthosilicate (SiO44-)",
                "Metaborate (BO32-)",
                "Orthoborate (BO33-)",
                "Hydrogen oxalate (HC2O4-)",
                "Oxalate (C2O42-)",
                "Hydrogen citrate (HC6H5O7-)",
                "Citrate (C6H5O73-)"
            ],
            "true_referents": [
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "25-hydroxyvitamin D3 sulfate(1-)",
                "3-hydroxypyridine sulfate(1-)",
                "D-glucose 6-sulfate(1-)",
                "antimonate(2-)",
                "arsenite(2-)",
                "aryl sulfate oxoanion",
                "bisphenol A sulfate(1-)",
                "chromate(2-)",
                "dichromate(2-)",
                "dihydrogensilicate(2-)",
                "dioxidodiperoxidochromate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "dodecaboride(2-)",
                "ethyl 4-hydroxybenzoate sulfate(1-)",
                "hexyl sulfate(1-)",
                "holothurin A3(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "hydroxidotrioxidomanganate(2-)",
                "manganate",
                "methyl sulfate(1-)",
                "methyl-4-hydroxybenzoate O-sulfate(1-)",
                "molybdate",
                "phosphonate(2-)",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "thiophosphate(2-)",
                "thiosulfate(2-)",
                "triphosphate(2-)",
                "tungstate"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "divalent inorganic anion",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Ammonium",
                "Canonical name": "NH4+ (NH3)4"
            },
            {
                "Referent": "Bicarbonate",
                "Canonical name": "HCO3- (HCO3)3"
            },
            {
                "Referent": "Chloride",
                "Canonical name": "Cl- (Cl)2"
            },
            {
                "Referent": "Fluoride",
                "Canonical name": "F- (F)2"
            },
            {
                "Referent": "Hydrogen carbonate",
                "Canonical name": "HCO3- (HCO3)3"
            },
            {
                "Referent": "Hydrogen phosphate",
                "Canonical name": "HPO42- (HPO4)2"
            },
            {
                "Referent": "Hydroxide",
                "Canonical name": "OH- (OH)2"
            },
            {
                "Referent": "Nitrite",
                "Canonical name": "NO2- (NO2)3"
            },
            {
                "Referent": "Nitrate",
                "Canonical name": "NO3- (NO3)3"
            },
            {
                "Referent": "Phosphate",
                "Canonical name": "PO43- (PO4)2"
            },
            {
                "Referent": "Sulfate",
                "Canonical name": "SO42- (SO4)2"
            },
            {
                "Referent": "Sulfite",
                "Canonical name": "SO32- (SO3)2"
            },
            {
                "Referent": "Thiocyanate",
                "Canonical name": "SCN- (SCN)2"
            },
            {
                "Referent": "Acetate",
                "Canonical name": "CH3COO- (CH3COO)2"
            },
            {
                "Referent": "Bromide",
                "Canonical name": "Br- (Br)2"
            },
            {
                "Referent": "Iodide",
                "Canonical name": "I- (I)2"
            },
            {
                "Referent": "Perchlorate",
                "Canonical name": "ClO4- (ClO4)2"
            },
            {
                "Referent": "Selenite",
                "Canonical name": "SeO32- (SeO3)2"
            },
            {
                "Referent": "Tellurite",
                "Canonical name": "TeO3- (TeO3)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            },
            {
                "Referent": "Tetrafluoroborate",
                "Canonical name": "BF4- (BF4)2"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrogen phosphate",
                "Sulfate",
                "Sulfite"
            ],
            "mismatches": [
                "Ammonium",
                "Bicarbonate",
                "Chloride",
                "Fluoride",
                "Hydrogen carbonate",
                "Hydroxide",
                "Nitrite",
                "Nitrate",
                "Phosphate",
                "Thiocyanate",
                "Acetate",
                "Bromide",
                "Iodide",
                "Perchlorate",
                "Selenite",
                "Tellurite",
                "Tetrafluoroborate"
            ],
            "true_referents": [
                "(4Z,7Z)-deca-4,7-dien-1-yl sulfate",
                "(R)-2-O-sulfonatolactate(2-)",
                "(R)-secondary-alkyl sulfate oxoanion",
                "(S)-2-O-sulfonatolactate(2-)",
                "(dioxido)trioxidophosphate(.2-)",
                "3,3',5'-triiodo-L-thyronine sulfate(1-)",
                "3,3',5-triiodo-L-thyronine sulfate(1-)",
                "3,3'-diiodo-L-thyronine sulfate(1-)",
                "D-glucose 6-sulfate(1-)",
                "arsenite(2-)",
                "butyl sulfate(1-)",
                "dihydrogensilicate(2-)",
                "diphosphate(2-)",
                "diphosphonate(2-)",
                "dodecaboride(2-)",
                "hexyl sulfate(1-)",
                "hydridonitrate(2-)",
                "hydrogenphosphate",
                "hydrogenphosphite",
                "methyl sulfate(1-)",
                "molybdate",
                "selenate",
                "sulfate",
                "sulfide(2-)",
                "sulfite",
                "tetrachlorozincate(2-)",
                "thiosulfate(2-)",
                "trioxidophosphate(.2-)",
                "triphosphate(2-)"
            ],
            "TP": 3,
            "FP": 17,
            "FN": 0
        }
    }
]