[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Ethyl sulfate (EtOSO3H)",
            "Methyl sulfate (MeOSO3H)",
            "Propyl sulfate",
            "Butyl sulfate",
            "Phenyl sulfate",
            "Benzenesulfonic acid (BzSO3H)",
            "Toluene-4-sulfonic acid",
            "Naphthalene-1-sulfonic acid",
            "Methanesulfonic acid (MsOH)",
            "Triflic acid (CF3SO3H)",
            "P-toluenesulfonic acid (pTsOH)",
            "Sulfuric acid (H2SO4)",
            "Sulfur trioxide (SO3)",
            "Sulfur dioxide (SO2)",
            "Sulfonic acid (R-SO3H)",
            "Sulfate ester (ROSO3H)",
            "Sulfuric anhydride (SO3)",
            "Sulfuric acid anhydride (SO3)",
            "Sulfuric acid ester (ROSO3H)",
            "Sulfuric acid monohydrate (H2SO4\u00b7H2O)",
            "Sulfuric acid pyridine complex (H2SO4\u00b7C5H5N)",
            "Sulfuric acid pyridine adduct (H2SO4\u00b7C5H5N)",
            "Sulfuric acid tetrahydrate (H2SO4\u00b74H2O)",
            "Sulfuric acid dihydrate (H2SO4\u00b72H2O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl sulfate (MeOSO3H)"
            ],
            "mismatches": [
                "Ethyl sulfate (EtOSO3H)",
                "Propyl sulfate",
                "Butyl sulfate",
                "Phenyl sulfate",
                "Benzenesulfonic acid (BzSO3H)",
                "Toluene-4-sulfonic acid",
                "Naphthalene-1-sulfonic acid",
                "Methanesulfonic acid (MsOH)",
                "Triflic acid (CF3SO3H)",
                "P-toluenesulfonic acid (pTsOH)",
                "Sulfuric acid (H2SO4)",
                "Sulfur trioxide (SO3)",
                "Sulfur dioxide (SO2)",
                "Sulfonic acid (R-SO3H)",
                "Sulfate ester (ROSO3H)",
                "Sulfuric anhydride (SO3)",
                "Sulfuric acid anhydride (SO3)",
                "Sulfuric acid ester (ROSO3H)",
                "Sulfuric acid monohydrate (H2SO4\u00b7H2O)",
                "Sulfuric acid pyridine complex (H2SO4\u00b7C5H5N)",
                "Sulfuric acid pyridine adduct (H2SO4\u00b7C5H5N)",
                "Sulfuric acid tetrahydrate (H2SO4\u00b74H2O)",
                "Sulfuric acid dihydrate (H2SO4\u00b72H2O)"
            ],
            "true_referents": [
                "(3-aminopropoxy)sulfonic acid",
                "(3-ethenylphenyl)oxidanesulfonic acid",
                "(3S,4E)-3-methyldec-4-en-1-yl hydrogen sulfate",
                "(3Z,6Z)-dodeca-3,6-dien-1-yl hydrogen sulfate",
                "(4-ethyl-2-methoxyphenyl)oxidanesulfonic acid",
                "(4Z,7Z)-deca-4,7-dien-1-yl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2-(sulfooxy)pentanoic acid",
                "2-[(sulfooxy)methyl]butanoic acid",
                "2-butyloctyl hydrogen sulfate",
                "2-hydroxy-3-(sulfooxy)benzoic acid",
                "2-naphthyl sulfate",
                "3-(3-sulfooxyphenyl)propanoic acid",
                "3-ethylphenyl sulfate",
                "4-(sulfooxy)butanoic acid",
                "4-ethylphenyl sulfate",
                "4-hydroxy-3-(sulfooxy)benzoic acid",
                "5,7-dimethyl-2-methylamino-4-(3-pyridylmethyl)-1,3-benzothiazol-6-yl hydrogen sulfate",
                "5-(sulfooxy)pentanoic acid",
                "7-methyloctyl hydrogen sulfate",
                "Benzeneacetamide-4-O-sulphate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "[(3-methylbut-2-en-1-yl)oxy]sulfonic acid",
                "[(oxolan-2-yl)methoxy]sulfonic acid",
                "[2-(dimethylamino)ethoxy]sulfonic acid",
                "alkyl sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "methyl sulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "salicylsulfuric acid",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester",
                "tetradecyl sulfonic acid"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl hydrogen sulfate (CH3SO3H)",
            "Ethyl hydrogen sulfate (C2H5SO3H)",
            "Isopropyl hydrogen sulfate ((CH3)2CHSO3H)",
            "t-Butyl hydrogen sulfate ((CH3)3COSO3H)",
            "Diacetyl peroxide (C4H6O4)",
            "Dimethyl sulfate ((CH3)2SO4)",
            "Ethyl sulfate (C2H5OSO3H)",
            "Isopropyl sulfate ((CH3)2CHOSO3H)",
            "t-Butyl sulfate ((CH3)3COSO3H)",
            "Phenyl hydrogen sulfate (C6H5SO3H)",
            "Benzenesulfonic acid (C6H5SO3H)",
            "Methyl triflate (CH3OSO2CF3)",
            "Ethyl triflate (C2H5OSO2CF3)",
            "Isopropyl triflate ((CH3)2CHOSO2CF3)",
            "t-Butyl triflate ((CH3)3COSO2CF3)",
            "Tert-butyl hydrogen sulfate ((CH3)3COSO3H)",
            "Methyl chlorosulfate (CH3OSO2Cl)",
            "Ethyl chlorosulfate (C2H5OSO2Cl)",
            "Isopropyl chlorosulfate ((CH3)2CHOSO2Cl)",
            "Phenyl chlorosulfate (C6H5OSO2Cl)",
            "Methyl tosylate (CH3OSO2C6H4CH3)",
            "Ethyl tosylate (C2H5OSO2C6H4CH3)",
            "Isopropyl tosylate ((CH3)2CHOSO2C6H4CH3)",
            "t-Butyl tosylate ((CH3)3COSO2C6H4CH3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl hydrogen sulfate",
                "Dimethyl sulfate",
                "Phenyl hydrogen sulfate"
            ],
            "mismatches": [
                "Methyl hydrogen sulfate (CH3SO3H)",
                "Isopropyl hydrogen sulfate ((CH3)2CHSO3H)",
                "t-Butyl hydrogen sulfate ((CH3)3COSO3H)",
                "Diacetyl peroxide (C4H6O4)",
                "Ethyl sulfate (C2H5OSO3H)",
                "Isopropyl sulfate ((CH3)2CHOSO3H)",
                "t-Butyl sulfate ((CH3)3COSO3H)",
                "Benzenesulfonic acid (C6H5SO3H)",
                "Methyl triflate (CH3OSO2CF3)",
                "Ethyl triflate (C2H5OSO2CF3)",
                "Isopropyl triflate ((CH3)2CHOSO2CF3)",
                "t-Butyl triflate ((CH3)3COSO2CF3)",
                "Tert-butyl hydrogen sulfate ((CH3)3COSO3H)",
                "Methyl chlorosulfate (CH3OSO2Cl)",
                "Ethyl chlorosulfate (C2H5OSO2Cl)",
                "Isopropyl chlorosulfate ((CH3)2CHOSO2Cl)",
                "Phenyl chlorosulfate (C6H5OSO2Cl)",
                "Methyl tosylate (CH3OSO2C6H4CH3)",
                "Ethyl tosylate (C2H5OSO2C6H4CH3)",
                "Isopropyl tosylate ((CH3)2CHOSO2C6H4CH3)",
                "t-Butyl tosylate ((CH3)3COSO2C6H4CH3)"
            ],
            "true_referents": [
                "(2,4)2,5-dimethylphenol sulfate",
                "(3-ethenylphenyl)oxidanesulfonic acid",
                "(3S,4E)-3-methyldec-4-en-1-yl hydrogen sulfate",
                "(3Z)-9-methyldec-3-en-1-yl hydrogen sulfate",
                "(4-ethyl-2-methoxyphenyl)oxidanesulfonic acid",
                "(5-ethenyl-2-hydroxyphenyl)oxidanesulfonic acid",
                "(5-ethyl-2-hydroxyphenyl)oxidanesulfonic acid",
                "(6S)-6-methyloctyl sulfate",
                "1-phenanthryl hydrogen sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-anhydro-3-O-(2-O-sulfo-alpha-L-idopyranuronosyl)-D-glucitol",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-(methoxymethyl)phenyl hydrogen sulfate",
                "2-[(sulfooxy)methyl]butanoic acid",
                "2-butyloctyl hydrogen sulfate",
                "3,4-Dihydroxyphenylacetate sulfate",
                "3-(3-sulfooxyphenyl)propanoic acid",
                "3-Sulfooxybutanoic acid",
                "3-ethylphenyl sulfate",
                "4-(sulfooxy)butanoic acid",
                "4-hydroxyphenylacetic acid sulfate",
                "4-isopropylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "[3-(3-oxopropyl)phenyl]oxidanesulfonic acid",
                "[4-(3-oxopropyl)phenyl]oxidanesulfonic acid",
                "alpha-L-IdopA-(1->3)-2,5-anhydro-D-Glc-OH4S",
                "diethyl sulfate",
                "dimethyl sulfate",
                "methyl sulfate",
                "phenyl hydrogen sulfate",
                "propyl hydrogen sulfate"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Phosphatidylglycerol (PG)",
            "Lysophosphatidylcholine (LPC)",
            "Lysophosphatidylethanolamine (LPE)",
            "Sphingosine-1-phosphate (S1P)",
            "Cerebroside Sulfate",
            "Cholesterol Sulfate",
            "Glucuronylgalactosylceramide Sulfate",
            "Sulfatide",
            "Sulfatide (Galactosylceramide Sulfate)",
            "Heparan Sulfate",
            "Chondroitin Sulfate",
            "Dermatan Sulfate",
            "Keratan Sulfate",
            "Osteoarthritis Sulfate",
            "Hyaluronic Acid Sulfate",
            "Sulfated Glycosaminoglycan",
            "Sulfated Dextran",
            "Sulfated Chitin",
            "Sulfated Heparin",
            "Sulfated Chondroitin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol Sulfate",
                "Heparan Sulfate",
                "Chondroitin Sulfate",
                "Dermatan Sulfate",
                "Keratan Sulfate",
                "Sulfated Glycosaminoglycan"
            ],
            "mismatches": [
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Phosphatidylglycerol (PG)",
                "Lysophosphatidylcholine (LPC)",
                "Lysophosphatidylethanolamine (LPE)",
                "Sphingosine-1-phosphate (S1P)",
                "Cerebroside Sulfate",
                "Glucuronylgalactosylceramide Sulfate",
                "Sulfatide",
                "Sulfatide (Galactosylceramide Sulfate)",
                "Osteoarthritis Sulfate",
                "Hyaluronic Acid Sulfate",
                "Sulfated Dextran",
                "Sulfated Chitin",
                "Sulfated Heparin",
                "Sulfated Chondroitin"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "1-(3-O-sulfo-beta-D-galactosyl)-N-[(2R)-2-hydroxylignoceroyl]sphingosine",
                "1-(3-O-sulfo-beta-D-galactosyl)sphingosine",
                "1-(3-O-sulfo-beta-D-galactosyl-(1->4)-beta-D-glucosyl)-N-acylsphingosine",
                "3-O-Sulfogalactosylceramide (d18:1/22:0)",
                "C24 Sulfatide",
                "Palmyrolide A",
                "Panosialin A",
                "[4)-beta-D-GlcpA-(1->4)-alpha-D-GlcpNS6OS-(1->]n",
                "cholesterol sulfate",
                "choline hydrogen sulfate",
                "choline sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "dermatan 6'-sulfate",
                "dermatan sulfate",
                "dextran sulfate",
                "digalactosylceramide sulfate",
                "galactosylceramide sulfate",
                "glucosamine sulfate",
                "glycerone sulfate",
                "heparan sulfate",
                "heparan sulfate proteoglycan",
                "heparan sulfates",
                "heparin glucosamine 3-O-sulfate",
                "keratan 6'-sulfate",
                "keratan sulfate",
                "keratan sulfate D-glucuronosyl-D-galactosyl-D-galactosyl-D-xylosyl-L-threonine",
                "polysaccharide sulfate",
                "proteochondroitin sulfate",
                "psychosine sulfate",
                "steroid sulfate",
                "sulfated glycosaminoglycan",
                "sulfoglycosphingolipid",
                "sulfolipid-1(1-)"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Diphenyl sulfate",
            "Methyl phenyl sulfate",
            "Ethyl phenyl sulfate",
            "Benzyl sulfate",
            "p-Nitrophenyl sulfate",
            "Sucrose sulfate",
            "Glucose-6-sulfate",
            "Heparan sulfate",
            "Chondroitin sulfate",
            "Dermatan sulfate",
            "Keratan sulfate",
            "Hyaluronic acid sulfate",
            "Myristyl sulfate",
            "Cetyl sulfate",
            "Stearyl sulfate",
            "Lauryl sulfate",
            "Sodium lauryl sulfate (SLS)",
            "Ammonium lauryl sulfate (ALS)",
            "Potassium lauryl sulfate (KLS)",
            "Sodium laureth sulfate (SLES)",
            "Ammonium laureth sulfate (ALES)",
            "Cholesterol sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate",
                "Diethyl sulfate",
                "Glucose-6-sulfate",
                "Heparan sulfate",
                "Chondroitin sulfate",
                "Dermatan sulfate",
                "Keratan sulfate",
                "Cholesterol sulfate"
            ],
            "mismatches": [
                "Diphenyl sulfate",
                "Methyl phenyl sulfate",
                "Ethyl phenyl sulfate",
                "Benzyl sulfate",
                "p-Nitrophenyl sulfate",
                "Sucrose sulfate",
                "Hyaluronic acid sulfate",
                "Myristyl sulfate",
                "Cetyl sulfate",
                "Stearyl sulfate",
                "Lauryl sulfate",
                "Sodium lauryl sulfate (SLS)",
                "Ammonium lauryl sulfate (ALS)",
                "Potassium lauryl sulfate (KLS)",
                "Sodium laureth sulfate (SLES)",
                "Ammonium laureth sulfate (ALES)"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-hydroxy-5-nitrophenyl hydrogen sulfate",
                "2-methoxy-4-methylphenol sulfate",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "4-ethylphenyl sulfate",
                "4-nitrophenyl hydrogen sulfate",
                "D-glucopyranose 6-sulfate",
                "D-glucose 6-sulfate",
                "Ethyl hydrogen sulfate",
                "Galactose 6-sulfate",
                "Laurolactam",
                "Steryl sulfate",
                "alkyl sulfate",
                "aryl sulfate",
                "carbohydrate sulfate",
                "cholesterol sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "decyl hydrogen sulfate",
                "dermatan 6'-sulfate",
                "dermatan sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glucosamine sulfate",
                "heparan sulfate",
                "heparan sulfate proteoglycan",
                "heparan sulfates",
                "keratan 6'-sulfate",
                "keratan sulfate",
                "keratan sulfate D-glucuronosyl-D-galactosyl-D-galactosyl-D-xylosyl-L-threonine",
                "methyl sulfate",
                "monosaccharide sulfate",
                "p-methylaminophenyl sulfate",
                "phenyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "steroid sulfate",
                "sucrose octasulfate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Ethyl methanesulfonate (EMS)",
            "Methyl methanesulfonate (MMS)",
            "Phenyl methanesulfonate",
            "Tosyl chloride (TsCl)",
            "Methanesulfonyl chloride (MsCl)",
            "Ethyl p-toluenesulfonate",
            "Methyl p-toluenesulfonate",
            "Trifluoromethanesulfonic anhydride (Tf2O)",
            "Trifluoromethanesulfonic acid methyl ester",
            "Trifluoromethanesulfonic acid ethyl ester",
            "Sulfuryl chloride (SO2Cl2)",
            "Sulfuryl fluoride (SO2F2)",
            "Sulfuryl dichloride",
            "Sulfuryl diethylamide",
            "Sulfuryl diamide",
            "Sulfuryl dimethylamide",
            "Sulfuryl diethyl sulfate",
            "Sulfuryl dimethyl sulfate",
            "Sulfuryl diethyl ether",
            "Sulfuryl dimethyl ether",
            "Sulfuryl diethyl carbonate",
            "Sulfuryl dimethyl carbonate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate",
                "Diethyl sulfate"
            ],
            "mismatches": [
                "Ethyl methanesulfonate",
                "Methyl methanesulfonate",
                "Phenyl methanesulfonate",
                "Tosyl chloride",
                "Methanesulfonyl chloride",
                "Ethyl p-toluenesulfonate",
                "Methyl p-toluenesulfonate",
                "Trifluoromethanesulfonic anhydride",
                "Trifluoromethanesulfonic acid methyl ester",
                "Trifluoromethanesulfonic acid ethyl ester",
                "Sulfuryl chloride",
                "Sulfuryl fluoride",
                "Sulfuryl dichloride",
                "Sulfuryl diethylamide",
                "Sulfuryl diamide",
                "Sulfuryl dimethylamide",
                "Sulfuryl diethyl sulfate",
                "Sulfuryl dimethyl sulfate",
                "Sulfuryl diethyl ether",
                "Sulfuryl dimethyl ether",
                "Sulfuryl diethyl carbonate",
                "Sulfuryl dimethyl carbonate"
            ],
            "true_referents": [
                "(6S)-6-methyloctyl sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-(sulfooxy)acetate",
                "2-(sulfooxy)acetic acid",
                "2-(sulfooxy)pentanoic acid",
                "3-ethylphenyl sulfate",
                "4-Methylcatechol 1-O-sulfate",
                "4-Methylcatechol 2-O-sulfate",
                "4-ethylphenyl sulfate",
                "Ethyl hydrogen sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "[(3-methylbut-2-en-1-yl)oxy]sulfonic acid",
                "[2-(dimethylamino)ethoxy]sulfonic acid",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "methyl sulfate",
                "p-methylaminophenyl sulfate",
                "phenanthryl monosulfate",
                "phenyl hydrogen sulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester",
                "syringol sulfate",
                "tetradecyl sulfonic acid"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Methyl sulfate (MeOSO3H)",
            "Ethyl sulfate (EtOSO3H)",
            "Isopropyl sulfate (iPrOSO3H)",
            "Butyl sulfate (BuOSO3H)",
            "Phenyl sulfate (PhOSO3H)",
            "Benzyl sulfate (BnOSO3H)",
            "Tert-butyl sulfate (tBuOSO3H)",
            "Cyclohexyl sulfate (cHexOSO3H)",
            "Allyl sulfate (AllylOSO3H)",
            "Octyl sulfate (OctOSO3H)",
            "Decyl sulfate (DecOSO3H)",
            "Sodium lauryl sulfate (SLS)",
            "Sodium dodecyl sulfate (SDS)",
            "Methyl phenyl sulfate (MPS)",
            "Ethyl phenyl sulfate (EPS)",
            "Naphthyl sulfate (NaphOSO3H)",
            "Cholesterol sulfate (CholOSO3H)",
            "Steroid sulfate (SteroidOSO3H)",
            "Amino acid sulfate (AAS)",
            "Glucosamine sulfate (GlcNSO4)",
            "Heparin sulfate (HS)",
            "Chondroitin sulfate (CS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate (DMS)",
                "Diethyl sulfate (DES)",
                "Methyl sulfate (MeOSO3H)",
                "Phenyl sulfate (PhOSO3H)",
                "Octyl sulfate (OctOSO3H)",
                "Decyl sulfate (DecOSO3H)",
                "Cholesterol sulfate (CholOSO3H)",
                "Steroid sulfate (SteroidOSO3H)",
                "Glucosamine sulfate (GlcNSO4)"
            ],
            "mismatches": [
                "Ethyl sulfate (EtOSO3H)",
                "Isopropyl sulfate (iPrOSO3H)",
                "Butyl sulfate (BuOSO3H)",
                "Benzyl sulfate (BnOSO3H)",
                "Tert-butyl sulfate (tBuOSO3H)",
                "Cyclohexyl sulfate (cHexOSO3H)",
                "Allyl sulfate (AllylOSO3H)",
                "Sodium lauryl sulfate (SLS)",
                "Sodium dodecyl sulfate (SDS)",
                "Methyl phenyl sulfate (MPS)",
                "Ethyl phenyl sulfate (EPS)",
                "Naphthyl sulfate (NaphOSO3H)",
                "Amino acid sulfate (AAS)",
                "Heparin sulfate (HS)",
                "Chondroitin sulfate (CS)"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "(6S)-6-methyloctyl sulfate",
                "1,2,3-benzenetriol monosulfate",
                "1-phenanthryl hydrogen sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-aminophenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-hydroxy-17beta-estradiol 3-sulfate",
                "2-naphthyl sulfate",
                "26-hydroxycholesterol 3-sulfate",
                "3,4-dihydroxy-5-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "3-phenanthryl hydrogen sulfate",
                "3alpha,7alpha,12alpha-trihydroxy-5alpha-cholan-24-yl sulfate",
                "4-allylcatechol sulfate",
                "4-allylpyrocatechol sulfate",
                "4-androsten-3alpha,17alpha-diol 17-sulfate",
                "4-ethylphenyl sulfate",
                "4-isopropylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "L-serine O-sulfate",
                "N-acetyl-D-glucosamine 4-sulfate",
                "Steryl sulfate",
                "beta-D-glucosamine 6-sulfate",
                "cholesterol sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glucosamine sulfate",
                "heparan sulfate",
                "heparan sulfates",
                "heparin sodium",
                "methyl sulfate",
                "methyl-4-hydroxybenzoate O-sulfate",
                "o-cresol hydrogen sulfate",
                "octyl hydrogen sulfate",
                "p-methylaminophenyl sulfate",
                "phenyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "steroid sulfate",
                "sucrose octasulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Dipropyl sulfate",
            "Dibutyl sulfate",
            "Dipentyl sulfate",
            "Dihexyl sulfate",
            "Dioctyl sulfate",
            "Dinonyl sulfate",
            "Didodecyl sulfate",
            "Diphenyl sulfate",
            "Ditolyl sulfate",
            "Diisopropyl sulfate",
            "Ditert-butyl sulfate",
            "Dicyclohexyl sulfate",
            "Dibenzoylethylene sulfate",
            "Di-sec-amyl sulfate",
            "Diisobutyl sulfate",
            "Di-2-ethylhexyl sulfate",
            "Dinaphthyl sulfate",
            "Dipicryl sulfate",
            "Diphenylmethane sulfate",
            "Ditrimethylolpropane sulfate",
            "Dibenzothiophene sulfate",
            "Diphenyl ether sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Diisopropyl sulfate",
                "Dimethyl sulfate",
                "Diethyl sulfate"
            ],
            "mismatches": [
                "Dipropyl sulfate",
                "Dibutyl sulfate",
                "Dipentyl sulfate",
                "Dihexyl sulfate",
                "Dioctyl sulfate",
                "Dinonyl sulfate",
                "Didodecyl sulfate",
                "Diphenyl sulfate",
                "Ditolyl sulfate",
                "Ditert-butyl sulfate",
                "Dicyclohexyl sulfate",
                "Dibenzoylethylene sulfate",
                "Di-sec-amyl sulfate",
                "Diisobutyl sulfate",
                "Di-2-ethylhexyl sulfate",
                "Dinaphthyl sulfate",
                "Dipicryl sulfate",
                "Diphenylmethane sulfate",
                "Ditrimethylolpropane sulfate",
                "Dibenzothiophene sulfate",
                "Diphenyl ether sulfate"
            ],
            "true_referents": [
                "17alpha-ethynylestradiol 3-sulfate",
                "2,4-dihydroxyacetophenone-5-O-sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3,4-Dihydroxyphenylacetate sulfate",
                "3,4-Dihydroxyphenylglycol O-sulfate",
                "3,4-phenanthrenediyl bissulfate",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "4-isopropylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Desmethyltetrahydropiperine sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "alkyl sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "phenyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "tetradecyl sulfonic acid"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl sulfuric ester (CH3SO3CH3)",
            "Ethyl sulfuric ester (C2H5SO3C2H5)",
            "Propyl sulfuric ester (C3H7SO3C3H7)",
            "Butyl sulfuric ester (C4H9SO3C4H9)",
            "Isobutyl sulfuric ester (CH3CH2CH(CH3)SO3C4H9)",
            "Pentyl sulfuric ester (C5H11SO3C5H11)",
            "Hexyl sulfuric ester (C6H13SO3C6H13)",
            "Heptyl sulfuric ester (C7H15SO3C7H15)",
            "Octyl sulfuric ester (C8H17SO3C8H17)",
            "Nonyl sulfuric ester (C9H19SO3C9H19)",
            "Decyl sulfuric ester (C10H21SO3C10H21)",
            "Dodecyl sulfuric ester (C12H25SO3C12H25)",
            "Octadecyl sulfuric ester (C18H37SO3C18H37)",
            "Phenyl sulfuric ester (C6H5SO3C6H5)",
            "Benzyl sulfuric ester (C6H5CH2SO3C6H5)",
            "Tert-butyl sulfuric ester ((CH3)3CSO3(CH3)3)",
            "Isoamyl sulfuric ester (CH3CH2CH(CH3)CH2SO3C5H11)",
            "Cyclohexyl sulfuric ester (C6H11SO3C6H11)",
            "Methoxy sulfuric ester (CH3OSO3CH3)",
            "Ethoxy sulfuric ester (C2H5OSO3C2H5)",
            "Phenoxy sulfuric ester (C6H5OSO3C6H5)",
            "Butoxy sulfuric ester (C4H9OSO3C4H9)",
            "Isopropoxy sulfuric ester (CH3CH(CH3)OSO3CH(CH3)CH3)",
            "Isobutoxy sulfuric ester (CH3CH2CH(CH3)OSO3C(CH3)3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Decyl hydrogen sulfate",
                "Dodecyl hydrogen sulfate",
                "octyl hydrogen sulfate"
            ],
            "mismatches": [
                "Methyl sulfuric ester (CH3SO3CH3)",
                "Ethyl sulfuric ester (C2H5SO3C2H5)",
                "Propyl sulfuric ester (C3H7SO3C3H7)",
                "Butyl sulfuric ester (C4H9SO3C4H9)",
                "Isobutyl sulfuric ester (CH3CH2CH(CH3)SO3C4H9)",
                "Pentyl sulfuric ester (C5H11SO3C5H11)",
                "Hexyl sulfuric ester (C6H13SO3C6H13)",
                "Heptyl sulfuric ester (C7H15SO3C7H15)",
                "Nonyl sulfuric ester (C9H19SO3C9H19)",
                "Octadecyl sulfuric ester (C18H37SO3C18H37)",
                "Phenyl sulfuric ester (C6H5SO3C6H5)",
                "Benzyl sulfuric ester (C6H5CH2SO3C6H5)",
                "Tert-butyl sulfuric ester ((CH3)3CSO3(CH3)3)",
                "Isoamyl sulfuric ester (CH3CH2CH(CH3)CH2SO3C5H11)",
                "Cyclohexyl sulfuric ester (C6H11SO3C6H11)",
                "Methoxy sulfuric ester (CH3OSO3CH3)",
                "Ethoxy sulfuric ester (C2H5OSO3C2H5)",
                "Phenoxy sulfuric ester (C6H5OSO3C6H5)",
                "Butoxy sulfuric ester (C4H9OSO3C4H9)",
                "Isopropoxy sulfuric ester (CH3CH(CH3)OSO3CH(CH3)CH3)",
                "Isobutoxy sulfuric ester (CH3CH2CH(CH3)OSO3C(CH3)3)"
            ],
            "true_referents": [
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "(E)-2-Propenyl [3-(2-propenylthio)-2-propenyl] sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-[3-(sulfooxy)phenyl]acetic acid",
                "2-[4-hydroxy-3-(sulfooxy)phenyl]acetic acid",
                "3,4-dihydroxy-5-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "4-(sulfooxy)butanoic acid",
                "5-(3-methoxyphenyl)-4-(sulfooxy)pentanoic acid",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "[4-(3-hydroxybutyl)-2-methoxyphenyl]oxidanesulfonic acid",
                "decyl hydrogen sulfate",
                "dodecyl hydrogen sulfate",
                "octyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl sulfate (MeSO4)",
            "Ethyl sulfate (EtSO4)",
            "Propyl sulfate",
            "Butyl sulfate",
            "Isopropyl sulfate",
            "Isobutyl sulfate",
            "Benzyl sulfate",
            "Phenyl sulfate",
            "Octyl sulfate",
            "Decyl sulfate",
            "Dodecyl sulfate",
            "Sodium dodecyl sulfate (SDS)",
            "Diethyl sulfate",
            "Triethyl sulfate",
            "Sodium ethyl sulfate",
            "Sodium methyl sulfate",
            "Dimethyl sulfate",
            "Triethylamine sulfate",
            "Tetramethylammonium sulfate",
            "Potassium sulfate ester",
            "Ammonium sulfate ester",
            "Trimethylsilyl sulfate",
            "Lauryl sulfate",
            "Oleyl sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl sulfate (MeSO4)",
                "Diethyl sulfate",
                "Dimethyl sulfate"
            ],
            "mismatches": [
                "Ethyl sulfate (EtSO4)",
                "Propyl sulfate",
                "Butyl sulfate",
                "Isopropyl sulfate",
                "Isobutyl sulfate",
                "Benzyl sulfate",
                "Phenyl sulfate",
                "Octyl sulfate",
                "Decyl sulfate",
                "Dodecyl sulfate",
                "Sodium dodecyl sulfate (SDS)",
                "Triethyl sulfate",
                "Sodium ethyl sulfate",
                "Sodium methyl sulfate",
                "Triethylamine sulfate",
                "Tetramethylammonium sulfate",
                "Potassium sulfate ester",
                "Ammonium sulfate ester",
                "Trimethylsilyl sulfate",
                "Lauryl sulfate",
                "Oleyl sulfate"
            ],
            "true_referents": [
                "(6S)-6-methyloctyl sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "4-ethylphenyl sulfate",
                "4-isopropylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "alkyl sulfate",
                "aryl sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glycerone sulfate",
                "keratan sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "p-methylaminophenyl sulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Cholesteryl sulfate",
            "Heparan sulfate",
            "Chondroitin sulfate",
            "Dermatan sulfate",
            "Keratan sulfate",
            "Estrone sulfate",
            "Dehydroepiandrosterone sulfate (DHEA-S)",
            "Testosterone sulfate",
            "Pregnenolone sulfate",
            "Ethyl sulfate",
            "Methyl sulfate",
            "Propyl sulfate",
            "Butyl sulfate",
            "Pentyl sulfate",
            "Hexyl sulfate",
            "Heptyl sulfate",
            "Octyl sulfate",
            "Nonyl sulfate",
            "Decyl sulfate",
            "Lauryl sulfate",
            "Cetyl sulfate",
            "Stearyl sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate",
                "Diethyl sulfate",
                "Heparan sulfate",
                "Chondroitin sulfate",
                "Dermatan sulfate",
                "Keratan sulfate",
                "Dehydroepiandrosterone sulfate",
                "Testosterone sulfate",
                "Pregnenolone sulfate",
                "Methyl sulfate"
            ],
            "mismatches": [
                "Cholesteryl sulfate",
                "Estrone sulfate",
                "Ethyl sulfate",
                "Propyl sulfate",
                "Butyl sulfate",
                "Pentyl sulfate",
                "Hexyl sulfate",
                "Heptyl sulfate",
                "Octyl sulfate",
                "Nonyl sulfate",
                "Decyl sulfate",
                "Lauryl sulfate",
                "Cetyl sulfate",
                "Stearyl sulfate"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "(2R)-2,6-dimethylheptyl hydrogen sulfate",
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "17alpha-hydroxypregnenolone 3-sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "26-hydroxycholesterol 3-sulfate",
                "3-ethylphenyl sulfate",
                "5alpha-dihydrotestosterone sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "alkyl sulfate",
                "androsterone sulfate",
                "cholesterol sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "decyl hydrogen sulfate",
                "dehydroepiandrosterone sulfate",
                "dermatan 6'-sulfate",
                "dermatan sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "epiandrosterone sulfate",
                "estrone 3-sulfate",
                "estrone sodium sulfate",
                "heparan sulfate",
                "heparan sulfate proteoglycan",
                "heparan sulfates",
                "keratan 6'-sulfate",
                "keratan sulfate",
                "keratan sulfate D-glucuronosyl-D-galactosyl-D-galactosyl-D-xylosyl-L-threonine",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "pentosan sulfate",
                "pregnenolone sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "steroid sulfate",
                "testosterone sulfate"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Adenosine 5'-phosphosulfate (APS)",
            "3'-Phosphoadenosine 5'-phosphosulfate (PAPS)",
            "Choline sulfate",
            "Estrone sulfate",
            "Dehydroepiandrosterone sulfate (DHEA-S)",
            "Heparan sulfate",
            "Chondroitin sulfate",
            "Dermatan sulfate",
            "Keratan sulfate",
            "Guanosine 5'-diphosphate 3'-diphosphate (ppGpp)",
            "Sulfatide",
            "Cerebroside sulfate",
            "Tyrosine-O-sulfate",
            "Cholesterol sulfate",
            "Indoxyl sulfate",
            "p-Cresol sulfate",
            "Phenol sulfate",
            "Pregnenolone sulfate",
            "Testosterone sulfate",
            "Vitamin D3 sulfate",
            "Galactosylceramide sulfate",
            "Lactosylceramide sulfate",
            "Psychosine sulfate",
            "Seminolipid sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Choline sulfate",
                "Dehydroepiandrosterone sulfate",
                "Heparan sulfate",
                "Chondroitin sulfate",
                "Dermatan sulfate",
                "Keratan sulfate",
                "Cholesterol sulfate",
                "Indoxyl sulfate",
                "p-Cresol sulfate",
                "Pregnenolone sulfate",
                "Testosterone sulfate",
                "Galactosylceramide sulfate",
                "Psychosine sulfate"
            ],
            "mismatches": [
                "Adenosine 5'-phosphosulfate (APS)",
                "3'-Phosphoadenosine 5'-phosphosulfate (PAPS)",
                "Estrone sulfate",
                "Guanosine 5'-diphosphate 3'-diphosphate (ppGpp)",
                "Sulfatide",
                "Cerebroside sulfate",
                "Tyrosine-O-sulfate",
                "Phenol sulfate",
                "Vitamin D3 sulfate",
                "Lactosylceramide sulfate",
                "Seminolipid sulfate"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "17alpha-hydroxypregnenolone 3-sulfate",
                "2-methoxy-4-methylphenol sulfate",
                "3-O-Sulfogalactosylceramide (d18:1/22:0)",
                "4-androsten-3alpha,17alpha-diol 17-sulfate",
                "5-(sulfooxy)pentanoic acid",
                "5-bromo-4-chloro-3-indolyl sulfate",
                "5alpha-dihydrotestosterone sulfate",
                "5beta-Androstan-3alpha-ol-17-one sulfate",
                "6-hydroxyindole sulfate",
                "C24 Sulfatide",
                "D-Galp3S-(1->4)-D-Glcp",
                "L-tyrosine methyl ester 4-sulfate",
                "O(4')-sulfo-L-tyrosine",
                "Tyrosol 4-sulfate",
                "androsterone sulfate",
                "beta-D-Galp3S-(1->4)-[alpha-L-Fucp-(1->3)]-D-Glcp",
                "beta-D-Galp3S-(1->4)-[alpha-L-Fucp-(1->3)]-beta-D-Glcp",
                "cholesterol sulfate",
                "choline hydrogen sulfate",
                "choline sulfate",
                "choline sulfates",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "dehydroepiandrosterone sulfate",
                "dermatan 6'-sulfate",
                "dermatan sulfate",
                "digalactosylceramide sulfate",
                "dopamine 3-O-sulfate",
                "epiandrosterone sulfate",
                "epitestosterone sulfate(1-)",
                "estrone 3-sulfate",
                "estrone sodium sulfate",
                "galactosamine sulfate",
                "galactosylceramide sulfate",
                "heparan sulfate",
                "heparan sulfate proteoglycan",
                "heparan sulfates",
                "indoxyl sulfate",
                "keratan 6'-sulfate",
                "keratan sulfate",
                "keratan sulfate D-glucuronosyl-D-galactosyl-D-galactosyl-D-xylosyl-L-threonine",
                "o-cresol hydrogen sulfate",
                "p-cresol sulfate",
                "p-methylaminophenyl sulfate",
                "phenyl hydrogen sulfate",
                "pregnenolone sulfate",
                "psychosine sulfate",
                "steroid sulfate",
                "sulfoglycolipid",
                "sulfoglycosphingolipid",
                "sulfolipid-1(1-)",
                "testosterone sulfate"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Diisopropyl sulfate (DIPS)",
            "Di-n-butyl sulfate (DBS)",
            "Di-tert-butyl sulfate (DTBS)",
            "Diphenyl sulfate (DPhS)",
            "Bis(2-methoxyethyl) sulfate",
            "Bis(2-chloroethyl) sulfate",
            "Bis(2-bromoethyl) sulfate",
            "Bis(2-iodoethyl) sulfate",
            "Bis(trifluoromethyl) sulfate",
            "Methyl trifluoromethanesulfonate",
            "Ethyl trifluoromethanesulfonate",
            "Isopropyl trifluoromethanesulfonate",
            "n-Butyl trifluoromethanesulfonate",
            "tert-Butyl trifluoromethanesulfonate",
            "Phenyl trifluoromethanesulfonate",
            "2-Methoxyethyl trifluoromethanesulfonate",
            "2-Chloroethyl trifluoromethanesulfonate",
            "2-Bromoethyl trifluoromethanesulfonate",
            "2-Iodoethyl trifluoromethanesulfonate",
            "Trifluoromethanesulfonic anhydride",
            "Methanesulfonic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate",
                "Diethyl sulfate",
                "Diisopropyl sulfate"
            ],
            "mismatches": [
                "Di-n-butyl sulfate",
                "Di-tert-butyl sulfate",
                "Diphenyl sulfate",
                "Bis(2-methoxyethyl) sulfate",
                "Bis(2-chloroethyl) sulfate",
                "Bis(2-bromoethyl) sulfate",
                "Bis(2-iodoethyl) sulfate",
                "Bis(trifluoromethyl) sulfate",
                "Methyl trifluoromethanesulfonate",
                "Ethyl trifluoromethanesulfonate",
                "Isopropyl trifluoromethanesulfonate",
                "n-Butyl trifluoromethanesulfonate",
                "tert-Butyl trifluoromethanesulfonate",
                "Phenyl trifluoromethanesulfonate",
                "2-Methoxyethyl trifluoromethanesulfonate",
                "2-Chloroethyl trifluoromethanesulfonate",
                "2-Bromoethyl trifluoromethanesulfonate",
                "2-Iodoethyl trifluoromethanesulfonate",
                "Trifluoromethanesulfonic anhydride",
                "Methanesulfonic anhydride"
            ],
            "true_referents": [
                "(2,4)2,5-dimethylphenol sulfate",
                "(3'-sulfo)Galbeta-Cer(d18:0/2-OH-20:0)",
                "(3-ethenylphenyl)oxidanesulfonic acid",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-(methoxymethyl)phenyl hydrogen sulfate",
                "2-[(sulfooxy)methyl]butanoic acid",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "2-methoxy-4-methylphenol sulfate",
                "3,3',5-triiodo-L-thyronine sulfate",
                "3,3'-diiodo-L-thyronine sulfate",
                "3-(3-sulfooxyphenyl)propanoic acid",
                "3-Sulfooxybutanoic acid",
                "3-methoxy-4-hydroxyphenylethyleneglycol sulfate",
                "4-(sulfooxy)butanoic acid",
                "4-isopropylphenyl sulfate",
                "5-(3-methoxyphenyl)-4-(sulfooxy)pentanoic acid",
                "5-bromo-4-chloro-3-indolyl sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "[(3-methylbut-2-en-1-yl)oxy]sulfonic acid",
                "[2-(dimethylamino)ethoxy]sulfonic acid",
                "bisphenol A sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "halistanol sulfonic acid F",
                "methyl sulfate",
                "phenyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "tetradecyl sulfonic acid"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Dibutyl sulfate (DBS)",
            "Dihexyl sulfate (DHS)",
            "Dioctyl sulfate (DOS)",
            "Diallyl sulfate (DAS)",
            "Benzyl sulfate (BS)",
            "Phenyl sulfate (PS)",
            "Ethyl hydrogen sulfate (EHS)",
            "Propyl hydrogen sulfate (PHS)",
            "Butyl hydrogen sulfate (BHS)",
            "Hexyl hydrogen sulfate (HHS)",
            "Octyl hydrogen sulfate (OHS)",
            "Allyl hydrogen sulfate (AHS)",
            "Cholesteryl sulfate (CS)",
            "Testosterone sulfate (TS)",
            "Estrone sulfate (ES)",
            "Glucose 6-sulfate (G6S)",
            "Galactose 6-sulfate (Gal6S)",
            "N-Acetylglucosamine 6-sulfate (GlcNAc6S)",
            "Chondroitin sulfate (CS)",
            "Keratan sulfate (KS)",
            "Heparan sulfate (HS)",
            "Dermatan sulfate (DS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate",
                "Diethyl sulfate",
                "Ethyl hydrogen sulfate",
                "Propyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Octyl hydrogen sulfate",
                "cholesterol sulfate",
                "testosterone sulfate",
                "Galactose 6-sulfate",
                "chondroitin sulfate",
                "keratan sulfate",
                "heparan sulfate",
                "dermatan sulfate"
            ],
            "mismatches": [
                "Dibutyl sulfate",
                "Dihexyl sulfate",
                "Dioctyl sulfate",
                "Diallyl sulfate",
                "Benzyl sulfate",
                "Phenyl sulfate",
                "Hexyl hydrogen sulfate",
                "Allyl hydrogen sulfate",
                "Cholesteryl sulfate",
                "Estrone sulfate",
                "Glucose 6-sulfate",
                "N-Acetylglucosamine 6-sulfate"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "1,2,3-benzenetriol monosulfate",
                "17beta-estradiol 3-sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "26-hydroxycholesterol 3-sulfate",
                "3,4-Dihydroxyphenylglycol O-sulfate",
                "3-ethylphenyl sulfate",
                "4-acetylphenyl hydrogen sulfate",
                "4-allylcatechol sulfate",
                "Benzeneacetamide-4-O-sulphate",
                "Butyl hydrogen sulfate",
                "D-galactose 6-sulfate",
                "D-glucopyranose 6-sulfate",
                "D-glucose 6-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Galactose 6-sulfate",
                "N-acetyl-D-galactosamine 6-sulfate",
                "N-acetyl-beta-D-galactosamine 6-sulfate",
                "N-acetylglucosamine 4-sulfate",
                "alpha-D-galactose 6-sulfate",
                "androsterone sulfate",
                "aryl sulfate",
                "cholesterol sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "decyl hydrogen sulfate",
                "dermatan 6'-sulfate",
                "dermatan sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "estrone 3-sulfate",
                "estrone sodium sulfate",
                "glycosmisic acid sulfate",
                "heparan sulfate",
                "heparan sulfate proteoglycan",
                "heparan sulfates",
                "keratan 6'-sulfate",
                "keratan sulfate",
                "keratan sulfate D-glucuronosyl-D-galactosyl-D-galactosyl-D-xylosyl-L-threonine",
                "octyl hydrogen sulfate",
                "phenanthryl monosulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "steroid sulfate",
                "testosterone sulfate"
            ],
            "TP": 13,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfide (DMS) (1)",
            "Dimethyl sulfoxide (DMSO) (2)",
            "Sulfuric acid esters of polyethylene glycols (3)",
            "Ethyl sulfite (4)",
            "Methyl sulfite (5)",
            "Ethyl sulfonate (6)",
            "Methyl sulfonate (7)",
            "Sulfuric acid esters of polypropylene glycols (8)",
            "Diethyl sulfite (9)",
            "Diethyl sulfoxide (10)",
            "Ethyl methyl sulfite (11)",
            "Methyl ethyl sulfite (12)",
            "Diisopropyl sulfite (13)",
            "Diisopropyl sulfoxide (14)",
            "Ethyl isopropyl sulfite (15)",
            "Methyl isopropyl sulfite (16)",
            "Di-tert-butyl sulfite (17)",
            "Di-tert-butyl sulfoxide (18)",
            "Ethyl tert-butyl sulfite (19)",
            "Methyl tert-butyl sulfite (20)",
            "Sulfuric acid esters of polyvinyl alcohols (21)",
            "Polyethylene sulfite (22)",
            "Polypropylene sulfite (23)",
            "Sulfuric acid esters of polyvinyl acetate (24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Dimethyl sulfide (DMS) (1)",
                "Dimethyl sulfoxide (DMSO) (2)",
                "Sulfuric acid esters of polyethylene glycols (3)",
                "Ethyl sulfite (4)",
                "Methyl sulfite (5)",
                "Ethyl sulfonate (6)",
                "Methyl sulfonate (7)",
                "Sulfuric acid esters of polypropylene glycols (8)",
                "Diethyl sulfite (9)",
                "Diethyl sulfoxide (10)",
                "Ethyl methyl sulfite (11)",
                "Methyl ethyl sulfite (12)",
                "Diisopropyl sulfite (13)",
                "Diisopropyl sulfoxide (14)",
                "Ethyl isopropyl sulfite (15)",
                "Methyl isopropyl sulfite (16)",
                "Di-tert-butyl sulfite (17)",
                "Di-tert-butyl sulfoxide (18)",
                "Ethyl tert-butyl sulfite (19)",
                "Methyl tert-butyl sulfite (20)",
                "Sulfuric acid esters of polyvinyl alcohols (21)",
                "Polyethylene sulfite (22)",
                "Polypropylene sulfite (23)",
                "Sulfuric acid esters of polyvinyl acetate (24)"
            ],
            "true_referents": [
                "(2,4)2,5-dimethylphenol sulfate",
                "(6S)-6-methyloctyl sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-(sulfooxy)acetate",
                "2-[(sulfooxy)methyl]butanoic acid",
                "4-(sulfooxy)butanoic acid",
                "4-ethylphenyl sulfate",
                "4-isopropylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Dihydro isoferulate 3-O-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "[(3-methylbut-2-en-1-yl)oxy]sulfonic acid",
                "[(oxolan-2-yl)methoxy]sulfonic acid",
                "[2-(dimethylamino)ethoxy]sulfonic acid",
                "bisphenol A sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "methyl sulfate",
                "poly(vinyl sulfate)",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester",
                "vanillyl alcohol monosulfate"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Cholesterol sulfate (CS)",
            "Sulfatide",
            "Cerebroside 3-sulfate",
            "Psychosine sulfate",
            "Lactosyl sulfatide",
            "Sulfated galactosyl ceramide",
            "Seminalplasmin",
            "Tyrosin O-sulfate",
            "Chondroitin sulfate A (CSA)",
            "Chondroitin sulfate C (CSC)",
            "Chondroitin sulfate D (CSD)",
            "Chondroitin sulfate E (CSE)",
            "Keratan sulfate I",
            "Keratan sulfate II",
            "Keratan sulfate III",
            "Keratan sulfate IV",
            "Heparin",
            "Heparan sulfate",
            "Dermatan sulfate",
            "Chondroitin",
            "Glucuronosyl sulfatide",
            "Galactosyl sulfatide",
            "Lactosylceramide 3-sulfate",
            "Seminalplasmin sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cholesterol sulfate",
                "psychosine sulfate",
                "heparin",
                "heparan sulfate",
                "dermatan sulfate",
                "chondroitin sulfate E"
            ],
            "mismatches": [
                "sulfatide",
                "cerebroside 3-sulfate",
                "lactosyl sulfatide",
                "sulfated galactosyl ceramide",
                "seminalplasmin",
                "tyrosin O-sulfate",
                "chondroitin sulfate A (CSA)",
                "chondroitin sulfate C (CSC)",
                "chondroitin sulfate D (CSD)",
                "keratan sulfate I",
                "keratan sulfate II",
                "keratan sulfate III",
                "keratan sulfate IV",
                "chondroitin",
                "glucuronosyl sulfatide",
                "galactosyl sulfatide",
                "lactosylceramide 3-sulfate",
                "seminalplasmin sulfate"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "1-(3,6-di-O-sulfo-beta-D-galactosyl)-N-lauroylsphingosine",
                "1-(3-O-sulfo-beta-D-galactosyl)-N-stearoylsphingosine",
                "1-(3-O-sulfo-beta-D-galactosyl)sphingosine",
                "3-D-glucuronosyl-N(2),6-disulfo-beta-D-glucosamine",
                "3-O-Sulfogalactosylceramide (d18:1/22:0)",
                "3-O-sulfo-beta-D-galactose",
                "5-dehydro-4-deoxy-2-O-sulfo-D-glucuronic acid",
                "C24 Sulfatide",
                "D-glucopyranose 3-sulfate",
                "L-tyrosine methyl ester 4-sulfate",
                "Tyrosol 4-sulfate",
                "cholesterol sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "chondroitin sulfate E",
                "dermatan 6'-sulfate",
                "dermatan sulfate",
                "digalactosylceramide sulfate",
                "galactosamine sulfate",
                "galactosylceramide sulfate",
                "heparan sulfate",
                "heparan sulfate proteoglycan",
                "heparan sulfates",
                "heparin",
                "heparins",
                "heparitin",
                "hydroxytyrosol 3'-sulfate",
                "keratan 6'-sulfate",
                "keratan sulfate",
                "keratan sulfate D-glucuronosyl-D-galactosyl-D-galactosyl-D-xylosyl-L-threonine",
                "p-methylaminophenyl sulfate",
                "proteochondroitin sulfate",
                "psychosine sulfate",
                "resveratrol glucuronide sulfate 1",
                "steroid sulfate",
                "sulfoglycosphingolipid",
                "sulfolipid-1(1-)"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Sulfuric acid diethyl ester",
                "Canonical name": "Diethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid methyl ester",
                "Canonical name": "Methyl sulfate"
            },
            {
                "Referent": "Sulfuric acid ethyl ester",
                "Canonical name": "Ethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid butyl ester",
                "Canonical name": "Butyl sulfate"
            },
            {
                "Referent": "Sulfuric acid isopropyl ester",
                "Canonical name": "Isopropyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butyl ester",
                "Canonical name": "tert-Butyl sulfate"
            },
            {
                "Referent": "Sulfuric acid isobutyl ester",
                "Canonical name": "Isobutyl sulfate"
            },
            {
                "Referent": "Sulfuric acid sec-butyl ester",
                "Canonical name": "sec-Butyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ester",
                "Canonical name": "tert-Butylmethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid isopropylmethyl ester",
                "Canonical name": "Isopropylmethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethylmethyl ester",
                "Canonical name": "tert-Butylmethylmethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethyl ester",
                "Canonical name": "tert-Butylmethyl ethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl isopropyl ester",
                "Canonical name": "tert-Butylmethyl isopropyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl isopropylmethyl ester",
                "Canonical name": "tert-Butylmethyl isopropylmethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ester",
                "Canonical name": "tert-Butylmethyl ethylmethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethylmethyl ester",
                "Canonical name": "tert-Butylmethyl ethylmethylmethyl sulfate"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylester"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylmethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylmethylester"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylmethylmethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylmethylmethylester"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylmethylmethylmethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylester"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylmethylmethylmethylmethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylmethylester"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylmethylmethylmethylmethylmethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylmethylmethylester"
            },
            {
                "Referent": "Sulfuric acid tert-butylmethyl ethylmethyl ethylmethylmethylmethylmethylmethylmethylester",
                "Canonical name": "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylmethylmethylmethylester"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Diethyl sulfate",
                "Methyl sulfate"
            ],
            "mismatches": [
                "Ethyl sulfate",
                "Butyl sulfate",
                "Isopropyl sulfate",
                "tert-Butyl sulfate",
                "Isobutyl sulfate",
                "sec-Butyl sulfate",
                "tert-Butylmethyl sulfate",
                "Isopropylmethyl sulfate",
                "tert-Butylmethylmethyl sulfate",
                "tert-Butylmethyl ethyl sulfate",
                "tert-Butylmethyl isopropyl sulfate",
                "tert-Butylmethyl isopropylmethyl sulfate",
                "tert-Butylmethyl ethylmethyl sulfate",
                "tert-Butylmethyl ethylmethylmethyl sulfate",
                "tert-Butylmethyl ethylmethyl ethylester",
                "tert-Butylmethyl ethylmethyl ethylmethylester",
                "tert-Butylmethyl ethylmethyl ethylmethylmethylester",
                "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylester",
                "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylmethylester",
                "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylmethylmethylester",
                "tert-Butylmethyl ethylmethyl ethylmethylmethylmethylmethylmethylmethylester"
            ],
            "true_referents": [
                "(3Z,6Z)-dodeca-3,6-dien-1-yl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "Butyl hydrogen sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "diethyl sulfate",
                "methyl sulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester"
            ],
            "TP": 2,
            "FP": 21,
            "FN": 0
        }
    }
]