[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "ethyl hydrogen sulfate (EHS)",
            "methyl hydrogen sulfate (MHS)",
            "propyl hydrogen sulfate (PHS)",
            "butyl hydrogen sulfate (BHS)",
            "isopropyl hydrogen sulfate (iP-HS)",
            "sec-butyl hydrogen sulfate (sB-HS)",
            "tert-butyl hydrogen sulfate (tB-HS)",
            "benzyl hydrogen sulfate (BZ-HS)",
            "phenethyl hydrogen sulfate (PE-HS)",
            "ethyl p-toluenesulfonate (Et-PTSO4)",
            "methyl p-toluenesulfonate (Me-PTSO4)",
            "propyl p-toluenesulfonate (Pr-PTSO4)",
            "butyl p-toluenesulfonate (Bu-PTSO4)",
            "isopropyl p-toluenesulfonate (iPr-PTSO4)",
            "sec-butyl p-toluenesulfonate (sBu-PTSO4)",
            "tert-butyl p-toluenesulfonate (tBu-PTSO4)",
            "benzyl p-toluenesulfonate (Bn-PTSO4)",
            "phenethyl p-toluenesulfonate (PhEt-PTSO4)",
            "ethyl trifluoromethanesulfonate (Et-TfO4)",
            "methyl trifluoromethanesulfonate (Me-TfO4)",
            "propyl trifluoromethanesulfonate (Pr-TfO4)",
            "butyl trifluoromethanesulfonate (Bu-TfO4)",
            "isopropyl trifluoromethanesulfonate (iPr-TfO4)",
            "sec-butyl trifluoromethanesulfonate (sBu-TfO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethyl hydrogen sulfate",
                "butyl hydrogen sulfate"
            ],
            "mismatches": [
                "methyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "isopropyl hydrogen sulfate",
                "sec-butyl hydrogen sulfate",
                "tert-butyl hydrogen sulfate",
                "benzyl hydrogen sulfate",
                "phenethyl hydrogen sulfate",
                "ethyl p-toluenesulfonate",
                "methyl p-toluenesulfonate",
                "propyl p-toluenesulfonate",
                "butyl p-toluenesulfonate",
                "isopropyl p-toluenesulfonate",
                "sec-butyl p-toluenesulfonate",
                "tert-butyl p-toluenesulfonate",
                "benzyl p-toluenesulfonate",
                "phenethyl p-toluenesulfonate",
                "ethyl trifluoromethanesulfonate",
                "methyl trifluoromethanesulfonate",
                "propyl trifluoromethanesulfonate",
                "butyl trifluoromethanesulfonate",
                "isopropyl trifluoromethanesulfonate",
                "sec-butyl trifluoromethanesulfonate"
            ],
            "true_referents": [
                "(3-aminopropoxy)sulfonic acid",
                "(4-ethyl-2-methoxyphenyl)oxidanesulfonic acid",
                "(6S)-6-methyloctyl sulfate",
                "(E)-2-Propenyl [3-(2-propenylthio)-2-propenyl] sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "2-methoxy-4-methylphenol sulfate",
                "3-(3-sulfooxyphenyl)propanoic acid",
                "3-Sulfooxybutanoic acid",
                "3-ethylphenyl sulfate",
                "4-(sulfooxy)butanoic acid",
                "4-acetylphenyl hydrogen sulfate",
                "4-ethylphenyl sulfate",
                "4-isopropylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "L-tyrosine methyl ester 4-sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "[4-(3-oxopropyl)phenyl]oxidanesulfonic acid",
                "decyl hydrogen sulfate",
                "dimethyl sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "p-methylaminophenyl sulfate",
                "phenanthryl monosulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium picosulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester",
                "tetradecyl sulfonic acid"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Ethyl hydrogen sulfate (C2H5HSO4)",
            "Methyl hydrogen sulfate (CH3HSO4)",
            "Propyl hydrogen sulfate (C3H7HSO4)",
            "Butyl hydrogen sulfate (C4H9HSO4)",
            "Isopropyl hydrogen sulfate ((CH3)2CHHSO4)",
            "tert-Butyl hydrogen sulfate ((CH3)3CHSO4)",
            "Phenethyl hydrogen sulfate (C8H9HSO4)",
            "Isobutyl hydrogen sulfate ((CH3)2CHCH2HSO4)",
            "Sec-butyl hydrogen sulfate (CH3CH2CHHSO4CH3)",
            "Isopentyl hydrogen sulfate (C5H11HSO4)",
            "Neopentyl hydrogen sulfate (C5H11HSO4)",
            "Cyclohexyl hydrogen sulfate (C6H11HSO4)",
            "Benzyl hydrogen sulfate (C7H7HSO4)",
            "Cyclopentyl hydrogen sulfate (C5H9HSO4)",
            "2-Phenylethyl hydrogen sulfate (C8H9HSO4)",
            "3-Methylbutyl hydrogen sulfate (C5H11HSO4)",
            "1-Butanol hydrogen sulfate (C4H9HSO4)",
            "2-Methyl-1-propanol hydrogen sulfate (C4H9HSO4)",
            "3-Methyl-1-butanol hydrogen sulfate (C5H11HSO4)",
            "2-Methyl-2-propanol hydrogen sulfate ((CH3)3CHSO4)",
            "1-Pentanol hydrogen sulfate (C5H11HSO4)",
            "2-Methyl-1-butanol hydrogen sulfate (C5H11HSO4)",
            "3-Pentanol hydrogen sulfate (C5H11HSO4)",
            "1-Hexanol hydrogen sulfate (C6H13HSO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl hydrogen sulfate (C2H5HSO4)",
                "Butyl hydrogen sulfate (C4H9HSO4)"
            ],
            "mismatches": [
                "Methyl hydrogen sulfate (CH3HSO4)",
                "Propyl hydrogen sulfate (C3H7HSO4)",
                "Isopropyl hydrogen sulfate ((CH3)2CHHSO4)",
                "tert-Butyl hydrogen sulfate ((CH3)3CHSO4)",
                "Phenethyl hydrogen sulfate (C8H9HSO4)",
                "Isobutyl hydrogen sulfate ((CH3)2CHCH2HSO4)",
                "Sec-butyl hydrogen sulfate (CH3CH2CHHSO4CH3)",
                "Isopentyl hydrogen sulfate (C5H11HSO4)",
                "Neopentyl hydrogen sulfate (C5H11HSO4)",
                "Cyclohexyl hydrogen sulfate (C6H11HSO4)",
                "Benzyl hydrogen sulfate (C7H7HSO4)",
                "Cyclopentyl hydrogen sulfate (C5H9HSO4)",
                "2-Phenylethyl hydrogen sulfate (C8H9HSO4)",
                "3-Methylbutyl hydrogen sulfate (C5H11HSO4)",
                "1-Butanol hydrogen sulfate (C4H9HSO4)",
                "2-Methyl-1-propanol hydrogen sulfate (C4H9HSO4)",
                "3-Methyl-1-butanol hydrogen sulfate (C5H11HSO4)",
                "2-Methyl-2-propanol hydrogen sulfate ((CH3)3CHSO4)",
                "1-Pentanol hydrogen sulfate (C5H11HSO4)",
                "2-Methyl-1-butanol hydrogen sulfate (C5H11HSO4)",
                "3-Pentanol hydrogen sulfate (C5H11HSO4)",
                "1-Hexanol hydrogen sulfate (C6H13HSO4)"
            ],
            "true_referents": [
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(3S,4E)-3-methyldec-4-en-1-yl hydrogen sulfate",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "(3Z,6Z)-dodeca-3,6-dien-1-yl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-(methoxymethyl)phenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "3,4-dihydroxy-5-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "4-acetylphenyl hydrogen sulfate",
                "4-isopropylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "decyl hydrogen sulfate",
                "methyl sulfate",
                "propyl hydrogen sulfate"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl sulfate (Methyl hydrogen sulfate)",
            "Ethyl sulfate (Ethyl hydrogen sulfate)",
            "Propyl sulfate (Propyl hydrogen sulfate)",
            "Butyl sulfate (Butyl hydrogen sulfate)",
            "Isopropyl sulfate (Isopropyl hydrogen sulfate)",
            "tert-Butyl sulfate (tert-Butyl hydrogen sulfate)",
            "Phenyl sulfate (Phenyl hydrogen sulfate)",
            "Benzyl sulfate (Benzyl hydrogen sulfate)",
            "Cyclohexyl sulfate (Cyclohexyl hydrogen sulfate)",
            "Methyl sulfate (Methyl hydrogen sulfate)",
            "Ethyl sulfate (Ethyl hydrogen sulfate)",
            "Propyl sulfate (Propyl hydrogen sulfate)",
            "Butyl sulfate (Butyl hydrogen sulfate)",
            "Isopropyl sulfate (Isopropyl hydrogen sulfate)",
            "tert-Butyl sulfate (tert-Butyl hydrogen sulfate)",
            "Phenyl sulfate (Phenyl hydrogen sulfate)",
            "Benzyl sulfate (Benzyl hydrogen sulfate)",
            "Cyclohexyl sulfate (Cyclohexyl hydrogen sulfate)",
            "Octyl sulfate (Octyl hydrogen sulfate)",
            "Decyl sulfate (Decyl hydrogen sulfate)",
            "Dodecyl sulfate (Dodecyl hydrogen sulfate)",
            "Hexadecyl sulfate (Cetyl sulfate)",
            "Octadecyl sulfate (Stearyl sulfate)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl sulfate (Methyl hydrogen sulfate)",
                "Ethyl sulfate (Ethyl hydrogen sulfate)",
                "Propyl sulfate (Propyl hydrogen sulfate)",
                "Butyl sulfate (Butyl hydrogen sulfate)",
                "Phenyl sulfate (Phenyl hydrogen sulfate)",
                "Octyl sulfate (Octyl hydrogen sulfate)",
                "Decyl sulfate (Decyl hydrogen sulfate)",
                "Dodecyl sulfate (Dodecyl hydrogen sulfate)"
            ],
            "mismatches": [
                "Isopropyl sulfate (Isopropyl hydrogen sulfate)",
                "tert-Butyl sulfate (tert-Butyl hydrogen sulfate)",
                "Benzyl sulfate (Benzyl hydrogen sulfate)",
                "Cyclohexyl sulfate (Cyclohexyl hydrogen sulfate)",
                "Hexadecyl sulfate (Cetyl sulfate)",
                "Octadecyl sulfate (Stearyl sulfate)"
            ],
            "true_referents": [
                "(3S,4E)-3-methyldec-4-en-1-yl hydrogen sulfate",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "1-phenanthryl hydrogen sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-(methoxymethyl)phenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "4-isopropylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "alkyl sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dodecyl hydrogen sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate"
            ],
            "TP": 8,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Diphenyl sulfate (DPS)",
            "Methyl ethyl sulfate (MES)",
            "Ethyl methyl sulfate (EMS)",
            "Butyl sulfate",
            "Isobutyl sulfate",
            "Octyl sulfate",
            "Lauryl sulfate",
            "Cetyl sulfate",
            "Stearyl sulfate",
            "2-Ethylhexyl sulfate",
            "Benzyl sulfate",
            "Phenethyl sulfate",
            "Methyl sulfate monoethanolamine salt",
            "Sodium lauryl sulfate (SLS)",
            "Ammonium lauryl sulfate (ALS)",
            "Potassium lauryl sulfate (KLS)",
            "Sodium ethyl sulfate (SES)",
            "Triethanolamine lauryl sulfate",
            "Coco sulfate",
            "Disodium Laureth Sulfosuccinate (though a sulfosuccinate, derived from sulfate esters)",
            "Methyl hydrogen sulfate",
            "Ethyl hydrogen sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate (DMS)",
                "Diethyl sulfate (DES)",
                "2-Ethylhexyl sulfate",
                "Ethyl hydrogen sulfate"
            ],
            "mismatches": [
                "Diphenyl sulfate (DPS)",
                "Methyl ethyl sulfate (MES)",
                "Ethyl methyl sulfate (EMS)",
                "Butyl sulfate",
                "Isobutyl sulfate",
                "Octyl sulfate",
                "Lauryl sulfate",
                "Cetyl sulfate",
                "Stearyl sulfate",
                "Benzyl sulfate",
                "Phenethyl sulfate",
                "Methyl sulfate monoethanolamine salt",
                "Sodium lauryl sulfate (SLS)",
                "Ammonium lauryl sulfate (ALS)",
                "Potassium lauryl sulfate (KLS)",
                "Sodium ethyl sulfate (SES)",
                "Triethanolamine lauryl sulfate",
                "Coco sulfate",
                "Disodium Laureth Sulfosuccinate (though a sulfosuccinate, derived from sulfate esters)",
                "Methyl hydrogen sulfate"
            ],
            "true_referents": [
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Laurolactam",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "alkyl sulfate",
                "aryl sulfate",
                "carbohydrate sulfate",
                "cholesterol sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "ethyl 4-hydroxybenzoate sulfate",
                "eugenol sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "p-methylaminophenyl sulfate",
                "phenyl hydrogen sulfate",
                "sodium myristyl sulfate"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Ethyl sulfate (EtOSO3H)",
            "Methyl sulfate (MeOSO3H)",
            "Dimethyl sulfate ((CH3O)2SO2)",
            "Diethyl sulfate ((C2H5O)2SO2)",
            "Isopropyl sulfate ((CH3)2CHO)SO3H",
            "Butyl sulfate (BuOSO3H)",
            "Hexyl sulfate (HexOSO3H)",
            "Cyclohexyl sulfate (C6H11OSO3H)",
            "Phenyl sulfate (PhOSO3H)",
            "Benzyl sulfate (BnOSO3H)",
            "Octyl sulfate (OctOSO3H)",
            "Lauryl sulfate (C12H25OSO3H)",
            "Cetyl sulfate (C16H33OSO3H)",
            "Stearyl sulfate (C18H37OSO3H)",
            "Glyceryl sulfate (C3H5(OH)2OSO3H)",
            "Propyl sulfate (PrOSO3H)",
            "Pentyl sulfate (PentOSO3H)",
            "Sec-butyl sulfate ((CH3)(C2H5)CHOSO3H)",
            "Tert-butyl sulfate ((CH3)3COSO3H)",
            "Allyl sulfate (CH2=CHCH2OSO3H)",
            "Vinyl sulfate (CH2=CHOSO3H)",
            "Propargyl sulfate (HC\u2261CCH2OSO3H)",
            "2-Butoxyethanol sulfate (C4H9OC2H4OSO3H)",
            "2-Ethylhexyl sulfate (C8H17OSO3H)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Diethyl sulfate",
                "2-ethylhexyl sulfate"
            ],
            "mismatches": [
                "Ethyl sulfate (EtOSO3H)",
                "Methyl sulfate (MeOSO3H)",
                "Dimethyl sulfate ((CH3O)2SO2)",
                "Isopropyl sulfate ((CH3)2CHO)SO3H",
                "Butyl sulfate (BuOSO3H)",
                "Hexyl sulfate (HexOSO3H)",
                "Cyclohexyl sulfate (C6H11OSO3H)",
                "Phenyl sulfate (PhOSO3H)",
                "Benzyl sulfate (BnOSO3H)",
                "Octyl sulfate (OctOSO3H)",
                "Lauryl sulfate (C12H25OSO3H)",
                "Cetyl sulfate (C16H33OSO3H)",
                "Stearyl sulfate (C18H37OSO3H)",
                "Glyceryl sulfate (C3H5(OH)2OSO3H)",
                "Propyl sulfate (PrOSO3H)",
                "Pentyl sulfate (PentOSO3H)",
                "Sec-butyl sulfate ((CH3)(C2H5)CHOSO3H)",
                "Tert-butyl sulfate ((CH3)3COSO3H)",
                "Allyl sulfate (CH2=CHCH2OSO3H)",
                "Vinyl sulfate (CH2=CHOSO3H)",
                "Propargyl sulfate (HC\u2261CCH2OSO3H)",
                "2-Butoxyethanol sulfate (C4H9OC2H4OSO3H)"
            ],
            "true_referents": [
                "(2,4)2,5-dimethylphenol sulfate",
                "(24S)-hydroxycholesterol 3-sulfate",
                "(3S,4E)-3-methyldec-4-en-1-yl hydrogen sulfate",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "(3Z,6Z)-dodeca-3,6-dien-1-yl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "(E)-2-Propenyl [3-(2-propenylthio)-2-propenyl] sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3,4-dihydroxy-5-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "3-phenanthryl hydrogen sulfate",
                "4-allylcatechol sulfate",
                "4-isopropylphenyl sulfate",
                "4-vinylcatechol sulfate",
                "4-vinylphenol sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glycerone sulfate",
                "hexosamine sulfate",
                "methyl sulfate",
                "methyl-4-hydroxybenzoate O-sulfate",
                "octyl hydrogen sulfate",
                "pentosan sulfate",
                "phenyl hydrogen sulfate",
                "poly(vinyl sulfate)",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sucrose octasulfate"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "ethyl sulfate (EtOSO3H)",
            "methyl sulfate (MeOSO3H)",
            "propyl sulfate (PrOSO3H)",
            "butyl sulfate (BuOSO3H)",
            "isobutyl sulfate (iBuOSO3H)",
            "pentyl sulfate (PeOSO3H)",
            "hexyl sulfate (HxOSO3H)",
            "heptyl sulfate (HpOSO3H)",
            "octyl sulfate (OcOSO3H)",
            "nonyl sulfate (NoOSO3H)",
            "decyl sulfate (DcOSO3H)",
            "dodecyl sulfate (DdOSO3H)",
            "lauryl sulfate (LaOSO3H)",
            "myristyl sulfate (MyOSO3H)",
            "cetyl sulfate (CeOSO3H)",
            "stearyl sulfate (StOSO3H)",
            "oleyl sulfate (OlOSO3H)",
            "arachidyl sulfate (ArOSO3H)",
            "behenyl sulfate (BeOSO3H)",
            "tridecyl sulfate (TdOSO3H)",
            "tetradecyl sulfate (TdOSO3H)",
            "pentadecyl sulfate (PdOSO3H)",
            "hexadecyl sulfate (HdOSO3H)",
            "heptadecyl sulfate (HdOSO3H)",
            "octadecyl sulfate (OdOSO3H)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methyl sulfate",
                "decyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "Sulfuric acid, monooctadecyl ester"
            ],
            "mismatches": [
                "ethyl sulfate (EtOSO3H)",
                "propyl sulfate (PrOSO3H)",
                "butyl sulfate (BuOSO3H)",
                "isobutyl sulfate (iBuOSO3H)",
                "pentyl sulfate (PeOSO3H)",
                "hexyl sulfate (HxOSO3H)",
                "heptyl sulfate (HpOSO3H)",
                "octyl sulfate (OcOSO3H)",
                "nonyl sulfate (NoOSO3H)",
                "dodecyl sulfate (DdOSO3H)",
                "lauryl sulfate (LaOSO3H)",
                "cetyl sulfate (CeOSO3H)",
                "stearyl sulfate (StOSO3H)",
                "oleyl sulfate (OlOSO3H)",
                "arachidyl sulfate (ArOSO3H)",
                "behenyl sulfate (BeOSO3H)",
                "tridecyl sulfate (TdOSO3H)",
                "tetradecyl sulfate (TdOSO3H)",
                "pentadecyl sulfate (PdOSO3H)",
                "hexadecyl sulfate (HdOSO3H)",
                "heptadecyl sulfate (HdOSO3H)"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "(2R)-2,6-dimethylheptyl hydrogen sulfate",
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(3-ethenylphenyl)oxidanesulfonic acid",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3-ethylphenyl sulfate",
                "3alpha,7alpha,12alpha-trihydroxy-5alpha-cholan-24-yl sulfate",
                "4-ethylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "D-glucopyranose 3-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "alkyl sulfate",
                "alpha-CEHC sulfate",
                "aryl sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "digalactosylceramide sulfate",
                "dodecyl hydrogen sulfate",
                "methyl sulfate",
                "methyl-4-hydroxybenzoate O-sulfate",
                "octyl hydrogen sulfate",
                "pentosan sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "sucrose octasulfate",
                "tetradecyl sulfonic acid"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Dipropyl sulfate (DPS)",
            "Dibutyl sulfate (DBS)",
            "Dipentyl sulfate (DPS)",
            "Hexyl sulfate (HS)",
            "Heptyl sulfate (HepS)",
            "Octyl sulfate (OS)",
            "Nonanyl sulfate (NS)",
            "Decyl sulfate (DS)",
            "Undecyl sulfate (US)",
            "Dodecyl sulfate (DDS)",
            "Tridecyl sulfate (TS)",
            "Tetradecyl sulfate (TeS)",
            "Pentadecyl sulfate (PS)",
            "Hexadecyl sulfate (HS)",
            "Heptadecyl sulfate (HepS)",
            "Octadecyl sulfate (OS)",
            "Nonadecyl sulfate (NS)",
            "Eicosyl sulfate (ES)",
            "Docosyl sulfate (DoS)",
            "Tetracosyl sulfate (TeS)",
            "Pentacosyl sulfate (PS)",
            "Hexacosyl sulfate (HS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "dimethyl sulfate",
                "diethyl sulfate",
                "dodecyl hydrogen sulfate"
            ],
            "mismatches": [
                "Dipropyl sulfate",
                "Dibutyl sulfate",
                "Dipentyl sulfate",
                "Hexyl sulfate",
                "Heptyl sulfate",
                "Octyl sulfate",
                "Nonanyl sulfate",
                "Decyl sulfate",
                "Undecyl sulfate",
                "Tridecyl sulfate",
                "Tetradecyl sulfate",
                "Pentadecyl sulfate",
                "Hexadecyl sulfate",
                "Heptadecyl sulfate",
                "Octadecyl sulfate",
                "Nonadecyl sulfate",
                "Eicosyl sulfate",
                "Docosyl sulfate",
                "Tetracosyl sulfate",
                "Pentacosyl sulfate",
                "Hexacosyl sulfate"
            ],
            "true_referents": [
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "3,3',5-triiodo-L-thyronine sulfate",
                "3-ethylcatechol sulfate",
                "3-ethylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Desmethyltetrahydropiperine sulfate",
                "Diisopropyl sulfate",
                "Docosanediol-1,14-disulfate",
                "Ethyl hydrogen sulfate",
                "N-acetyl-beta-D-galactosamine 6-sulfate",
                "N-acetyl-beta-D-glucosamine 6-sulfate",
                "N-desulfoheparin",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "digalactosylceramide sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "heparan sulfates",
                "hexosamine sulfate",
                "nucleotide-sugar sulfate",
                "octyl hydrogen sulfate",
                "oligosaccharide sulfate",
                "p-cresol sulfate",
                "pentosan sulfate",
                "phenyl hydrogen sulfate",
                "polysaccharide sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "steroid sulfate",
                "sucrose octasulfate",
                "tetradecyl sulfonic acid",
                "trehalose sulfate"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl sulfate (MeOSO2OCH3)",
            "Ethyl sulfate (EtOSO2OCH2CH3)",
            "Propyl sulfate (PrOSO2OCH2CH2CH3)",
            "Butyl sulfate (BuOSO2OCH2CH2CH2CH3)",
            "Isobutyl sulfate (i-BuOSO2OCH(CH3)CH2CH3)",
            "Pentyl sulfate (PeOSO2OCH2CH2CH2CH2CH3)",
            "Hexyl sulfate (HeOSO2OCH2CH2CH2CH2CH2CH3)",
            "Heptyl sulfate (HpOSO2OCH2CH2CH2CH2CH2CH2CH3)",
            "Octyl sulfate (OctOSO2OCH2CH2CH2CH2CH2CH2CH2CH3)",
            "Nonyl sulfate (NoOSO2OCH2CH2CH2CH2CH2CH2CH2CH2CH3)",
            "Decyl sulfate (DecOSO2OCH2CH2CH2CH2CH2CH2CH2CH2CH2CH3)",
            "Dodecyl sulfate (DodOSO2OCH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH3)",
            "Lauryl sulfate (LaOSO2OCH2(CH2)10CH3)",
            "Myristyl sulfate (MyrOSO2OCH2(CH2)12CH3)",
            "Cetyl sulfate (CeOSO2OCH2(CH2)14CH3)",
            "Stearyl sulfate (SteOSO2OCH2(CH2)16CH3)",
            "Palmitoyl sulfate (PalOSO2OCH2(CH2)14CH3)",
            "Arachidoyl sulfate (AraOSO2OCH2(CH2)18CH3)",
            "Behenyl sulfate (BehOSO2OCH2(CH2)20CH3)",
            "Lignoceryl sulfate (LigOSO2OCH2(CH2)24CH3)",
            "Cholesterol sulfate (CholOSO2OCH2(CH2)3CH3)",
            "Ergosterol sulfate (ErgOSO2OCH2(CH2)3CH3)",
            "Sitosterol sulfate (SitOSO2OCH2(CH2)3CH3)",
            "Stigmasterol sulfate (StigOSO2OCH2(CH2)3CH3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methyl sulfate",
                "cholesterol sulfate"
            ],
            "mismatches": [
                "ethyl sulfate",
                "propyl sulfate",
                "butyl sulfate",
                "isobutyl sulfate",
                "pentyl sulfate",
                "hexyl sulfate",
                "heptyl sulfate",
                "octyl sulfate",
                "nonyl sulfate",
                "decyl sulfate",
                "dodecyl sulfate",
                "lauryl sulfate",
                "myristyl sulfate",
                "cetyl sulfate",
                "stearyl sulfate",
                "palmitoyl sulfate",
                "arachidoyl sulfate",
                "behenyl sulfate",
                "lignoceryl sulfate",
                "ergosterol sulfate",
                "sitosterol sulfate",
                "stigmasterol sulfate"
            ],
            "true_referents": [
                "(2,4)2,5-dimethylphenol sulfate",
                "(24S)-hydroxycholesterol 3-sulfate",
                "(2R)-2,6-dimethylheptyl hydrogen sulfate",
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "(3beta,5alpha,17beta)-3-hydroxyandrostan-17-yl sulfate",
                "(4R)-4,8-dimethylnonyl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "2-palmitoyl-3,6,6'-tristearoyl-2'-sulfo-alpha,alpha-trehalose",
                "2-palmitoyl-3-stearoyl-2'-sulfo-alpha,alpha-trehalose",
                "3,4-Dihydroxyphenylglycol O-sulfate",
                "3-ethylphenyl sulfate",
                "3alpha,7alpha,12alpha-trihydroxy-5alpha-cholan-24-yl sulfate",
                "4-Androsten-3alpha,17alpha-diol 3-sulphate",
                "4-Androsten-3beta,17beta-diol 3-sulfate",
                "4-Methylcatechol 1-O-sulfate",
                "4-Methylcatechol 2-O-sulfate",
                "4-acetylcatechol sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "alkyl sulfate",
                "cholesterol sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glycerone sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl hydrogen sulfate (CAS: 100-99-9)",
            "Ethyl hydrogen sulfate (CAS: 112-24-7)",
            "Isopropyl hydrogen sulfate (CAS: 98-54-8)",
            "n-Butyl hydrogen sulfate (CAS: 98-55-9)",
            "t-Butyl hydrogen sulfate (CAS: 593-34-0)",
            "Vinyl hydrogen sulfate (CAS: 107-22-7)",
            "Benzyl hydrogen sulfate (CAS: 98-57-1)",
            "Phenethyl hydrogen sulfate (CAS: 104-37-5)",
            "Cyclohexyl hydrogen sulfate (CAS: 96-02-3)",
            "n-Pentyl hydrogen sulfate (CAS: 577-13-8)",
            "Hexyl hydrogen sulfate (CAS: 75-30-6)",
            "Heptyl hydrogen sulfate (CAS: 111-79-3)",
            "Octyl hydrogen sulfate (CAS: 101-20-3)",
            "Nonyl hydrogen sulfate (CAS: 629-88-5)",
            "Decyl hydrogen sulfate (CAS: 108-54-4)",
            "Dodecyl hydrogen sulfate (CAS: 110-54-3)",
            "Lauryl hydrogen sulfate (CAS: 68439-25-1)",
            "Cetyl hydrogen sulfate (CAS: 22235-10-3)",
            "Stearyl hydrogen sulfate (CAS: 20568-46-4)",
            "Oleyl hydrogen sulfate (CAS: 1401-75-2)",
            "Lauryl alcohol sulfate (CAS: 25171-37-8)",
            "Myristyl alcohol sulfate (CAS: 98-55-9)",
            "Palmityl alcohol sulfate (CAS: 110-54-3)",
            "Stearyl alcohol sulfate (CAS: 20568-46-4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl hydrogen sulfate",
                "Decyl hydrogen sulfate",
                "Dodecyl hydrogen sulfate",
                "Octyl hydrogen sulfate"
            ],
            "mismatches": [
                "Methyl hydrogen sulfate (CAS: 100-99-9)",
                "Isopropyl hydrogen sulfate (CAS: 98-54-8)",
                "n-Butyl hydrogen sulfate (CAS: 98-55-9)",
                "t-Butyl hydrogen sulfate (CAS: 593-34-0)",
                "Vinyl hydrogen sulfate (CAS: 107-22-7)",
                "Benzyl hydrogen sulfate (CAS: 98-57-1)",
                "Phenethyl hydrogen sulfate (CAS: 104-37-5)",
                "Cyclohexyl hydrogen sulfate (CAS: 96-02-3)",
                "n-Pentyl hydrogen sulfate (CAS: 577-13-8)",
                "Hexyl hydrogen sulfate (CAS: 75-30-6)",
                "Heptyl hydrogen sulfate (CAS: 111-79-3)",
                "Nonyl hydrogen sulfate (CAS: 629-88-5)",
                "Lauryl hydrogen sulfate (CAS: 68439-25-1)",
                "Cetyl hydrogen sulfate (CAS: 22235-10-3)",
                "Stearyl hydrogen sulfate (CAS: 20568-46-4)",
                "Oleyl hydrogen sulfate (CAS: 1401-75-2)",
                "Lauryl alcohol sulfate (CAS: 25171-37-8)",
                "Myristyl alcohol sulfate (CAS: 98-55-9)",
                "Palmityl alcohol sulfate (CAS: 110-54-3)",
                "Stearyl alcohol sulfate (CAS: 20568-46-4)"
            ],
            "true_referents": [
                "(2R)-2,6-dimethylheptyl hydrogen sulfate",
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(3Z)-9-methyldec-3-en-1-yl hydrogen sulfate",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "2-palmitoyl-3,6,6'-tristearoyl-2'-sulfo-alpha,alpha-trehalose",
                "2-palmitoyl-3-stearoyl-2'-sulfo-alpha,alpha-trehalose",
                "4-acetylphenyl hydrogen sulfate",
                "4-isopropylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "alkyl sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "phenyl hydrogen sulfate",
                "poly(vinyl sulfate)",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "vanillyl alcohol 4-sulfate"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfate (DMS)",
            "Diethyl sulfate (DES)",
            "Methyl methanesulfonate (MMS)",
            "Ethyl methanesulfonate (EMS)",
            "Isopropyl methanesulfonate (IMS)",
            "Methyl p-toluenesulfonate (MTS)",
            "Ethyl p-toluenesulfonate (ETS)",
            "Butyl p-toluenesulfonate (BTS)",
            "Methyl trifluoromethanesulfonate (methyl triflate)",
            "Ethyl trifluoromethanesulfonate (ethyl triflate)",
            "Propyl trifluoromethanesulfonate (propyl triflate)",
            "Benzyl methanesulfonate",
            "Phenyl methanesulfonate",
            "Allyl methanesulfonate",
            "Cyclohexyl methanesulfonate",
            "tert-Butyl methanesulfonate",
            "2-Chloroethyl methanesulfonate",
            "2-Bromoethyl methanesulfonate",
            "Glycol sulfate",
            "Ethylene sulfate",
            "Propylene sulfate",
            "Butylene sulfate",
            "Cholesteryl sulfate",
            "Dehydroepiandrosterone sulfate (DHEAS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfate",
                "Diethyl sulfate",
                "dehydroepiandrosterone sulfate"
            ],
            "mismatches": [
                "Methyl methanesulfonate",
                "Ethyl methanesulfonate",
                "Isopropyl methanesulfonate",
                "Methyl p-toluenesulfonate",
                "Ethyl p-toluenesulfonate",
                "Butyl p-toluenesulfonate",
                "Methyl trifluoromethanesulfonate",
                "Ethyl trifluoromethanesulfonate",
                "Propyl trifluoromethanesulfonate",
                "Benzyl methanesulfonate",
                "Phenyl methanesulfonate",
                "Allyl methanesulfonate",
                "Cyclohexyl methanesulfonate",
                "tert-Butyl methanesulfonate",
                "2-Chloroethyl methanesulfonate",
                "2-Bromoethyl methanesulfonate",
                "Glycol sulfate",
                "Ethylene sulfate",
                "Propylene sulfate",
                "Butylene sulfate",
                "Cholesteryl sulfate"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "(3-ethenylphenyl)oxidanesulfonic acid",
                "(6S)-6-methyloctyl sulfate",
                "16alpha-hydroxydehydroepiandrosterone 3-sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-[(sulfooxy)methyl]butanoic acid",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "26-hydroxycholesterol 3-sulfate",
                "3,4-Dihydroxyphenylglycol O-sulfate",
                "3,4-dihydroxy-5-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3-(3-sulfooxyphenyl)propanoic acid",
                "3-[4-(sulfooxy)phenyl]propanoic acid",
                "3-ethylphenyl sulfate",
                "4-(sulfooxy)butanoic acid",
                "4-allylcatechol sulfate",
                "4-allylpyrocatechol sulfate",
                "4-isopropylphenyl sulfate",
                "5-methyl-3-isoxazolyl sulfate",
                "5alpha-dihydrotestosterone sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "[(3-methylbut-2-en-1-yl)oxy]sulfonic acid",
                "[2-(dimethylamino)ethoxy]sulfonic acid",
                "cholesterol sulfate",
                "decyl hydrogen sulfate",
                "dehydroepiandrosterone sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "glycerone sulfate",
                "glycosmisic acid sulfate",
                "methyl sulfate",
                "p-methylaminophenyl sulfate",
                "phenanthryl monosulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "tetradecyl sulfonic acid"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Methyl sulfate (Me2SO4)",
            "Ethyl sulfate (EtOSO3H)",
            "Isopropyl sulfate ((CH3)2CHOSO3H)",
            "n-Propyl sulfate (C3H7OSO3H)",
            "n-Butyl sulfate (C4H9OSO3H)",
            "sec-Butyl sulfate ((CH3)2CHCH2OSO3H)",
            "tert-Butyl sulfate ((CH3)3COSO3H)",
            "n-Pentyl sulfate (C5H11OSO3H)",
            "n-Hexyl sulfate (C6H13OSO3H)",
            "n-Heptyl sulfate (C7H15OSO3H)",
            "n-Octyl sulfate (C8H17OSO3H)",
            "n-Nonyl sulfate (C9H19OSO3H)",
            "n-Decyl sulfate (C10H21OSO3H)",
            "Lauryl sulfate (C12H25OSO3H)",
            "Myristyl sulfate (C14H29OSO3H)",
            "Cetyl sulfate (C16H33OSO3H)",
            "Stearyl sulfate (C18H37OSO3H)",
            "Oleyl sulfate (C18H35OSO3H)",
            "Benzyl sulfate (C6H5CH2OSO3H)",
            "2-Phenylethyl sulfate (C6H5CH2CH2OSO3H)",
            "Geranyl sulfate ((CH3)2C=CHCH2CH2C(CH3)=CHCH2OSO3H)",
            "Cinnamyl sulfate (C6H5CH=CHCH2OSO3H)",
            "Cholesteryl sulfate (C27H45OSO3H)",
            "Vitamin D3 sulfate (C27H43OSO3H)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methyl sulfate",
                "ethyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "octyl hydrogen sulfate",
                "decyl hydrogen sulfate",
                "steryl sulfate"
            ],
            "mismatches": [
                "isopropyl sulfate",
                "n-butyl sulfate",
                "sec-butyl sulfate",
                "tert-butyl sulfate",
                "n-pentyl sulfate",
                "n-hexyl sulfate",
                "n-heptyl sulfate",
                "n-nonyl sulfate",
                "lauryl sulfate",
                "myristyl sulfate",
                "cetyl sulfate",
                "stearyl sulfate",
                "oleyl sulfate",
                "benzyl sulfate",
                "2-phenylethyl sulfate",
                "geranyl sulfate",
                "cinnamyl sulfate",
                "cholesteryl sulfate",
                "vitamin d3 sulfate"
            ],
            "true_referents": [
                "(2,4)2,5-dimethylphenol sulfate",
                "(24S)-hydroxycholesterol 3-sulfate",
                "(2R)-2,6-dimethylheptyl hydrogen sulfate",
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(3S,4E)-3-methyldec-4-en-1-yl hydrogen sulfate",
                "(3Z)-dodec-3-en-1-yl hydrogen sulfate",
                "(3alpha,5alpha,17beta)-3-hydroxyandrostan-17-yl sulfate",
                "(3beta,5alpha,17beta)-3-hydroxyandrostan-17-yl sulfate",
                "(4R)-4,8-dimethylnonyl hydrogen sulfate",
                "(4Z,7Z)-deca-4,7-dien-1-yl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "(E)-2-Propenyl [3-(2-propenylthio)-2-propenyl] sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "26-hydroxycholesterol 3-sulfate",
                "3-ethylphenyl sulfate",
                "4-(sulfooxy)-cinnamic acid",
                "4-Methylcatechol 2-O-sulfate",
                "4-androsten-3alpha,17alpha-diol 17-sulfate",
                "4-isopropylphenyl sulfate",
                "7-methyloctyl hydrogen sulfate",
                "Butyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "N-acetyl-beta-D-galactosamine 4-sulfate",
                "N-acetyl-beta-D-galactosamine 6-sulfate",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "alkyl sulfate",
                "cholesterol sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "pentosan sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "ethyl sulfate (EtOSO3)",
            "methyl sulfate (MeOSO3)",
            "propyl sulfate (PrOSO3)",
            "butyl sulfate (BuOSO3)",
            "pentyl sulfate (PentOSO3)",
            "hexyl sulfate (HexOSO3)",
            "heptyl sulfate (HeptOSO3)",
            "octyl sulfate (OctOSO3)",
            "nonyl sulfate (NonOSO3)",
            "decyl sulfate (DecOSO3)",
            "lauryl sulfate (LAS)",
            "cetyl sulfate",
            "stearyl sulfate",
            "cholesteryl sulfate",
            "menthyl sulfate",
            "cyclohexyl sulfate",
            "benzyl sulfate",
            "phenyl sulfate",
            "naphthyl sulfate",
            "\u03b1-terpinyl sulfate",
            "glyceryl sulfate",
            "glucose sulfate",
            "cellulose sulfate",
            "chondroitin sulfate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "chondroitin sulfate"
            ],
            "mismatches": [
                "ethyl sulfate (EtOSO3)",
                "methyl sulfate (MeOSO3)",
                "propyl sulfate (PrOSO3)",
                "butyl sulfate (BuOSO3)",
                "pentyl sulfate (PentOSO3)",
                "hexyl sulfate (HexOSO3)",
                "heptyl sulfate (HeptOSO3)",
                "octyl sulfate (OctOSO3)",
                "nonyl sulfate (NonOSO3)",
                "decyl sulfate (DecOSO3)",
                "lauryl sulfate (LAS)",
                "cetyl sulfate",
                "stearyl sulfate",
                "cholesteryl sulfate",
                "menthyl sulfate",
                "cyclohexyl sulfate",
                "benzyl sulfate",
                "phenyl sulfate",
                "naphthyl sulfate",
                "\u03b1-terpinyl sulfate",
                "glyceryl sulfate",
                "glucose sulfate",
                "cellulose sulfate"
            ],
            "true_referents": [
                "(24S)-hydroxycholesterol 3-sulfate",
                "(2R)-2,6-dimethylheptyl hydrogen sulfate",
                "(2S)-2,6-dimethylheptyl hydrogen sulfate",
                "(6S)-6-methyloctyl sulfate",
                "1-phenanthryl sulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "2-naphthyl sulfate",
                "26-hydroxycholesterol 3-sulfate",
                "3,4-dihydroxy-5-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxy-4-(sulfooxy)cyclohex-1-ene-1-carboxylic acid",
                "3,5-dihydroxybenzoic acid sulfate",
                "3-ethylphenyl sulfate",
                "3-methylcatechol sulfate",
                "4-ethylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "D-glucopyranose 3-sulfate",
                "D-glucose 6-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Laurolactam",
                "N-acetyl-beta-D-galactosamine 4-sulfate",
                "N-acetyl-beta-D-galactosamine 6-sulfate",
                "Steryl sulfate",
                "alkyl sulfate",
                "alpha,alpha-trehalose-2-sulfate",
                "aryl sulfate",
                "carbohydrate sulfate",
                "cholesterol sulfate",
                "chondroitin 4'-sulfate",
                "chondroitin 6'-sulfate",
                "chondroitin sulfate",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "digalactosylceramide sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glycerone sulfate",
                "hexosamine sulfate",
                "methyl sulfate",
                "monosaccharide sulfate",
                "octyl hydrogen sulfate",
                "oligosaccharide sulfate",
                "p-cresol sulfate",
                "pentosan sulfate",
                "phenyl hydrogen sulfate",
                "polysaccharide sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "propyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "sucrose octasulfate"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Sulfuric acid ethyl ester (SAEE)",
            "Diethyl sulfate (DES)",
            "Ethyl hydrogen sulfate (EHS)",
            "Sulfuric acid propyl ester (SAPE)",
            "Sulfuric acid butyl ester (SABE)",
            "Sulfuric acid pentyl ester (SAPE)",
            "Sulfuric acid hexyl ester (SAHE)",
            "Sulfuric acid heptyl ester (SAHE)",
            "Sulfuric acid octyl ester (SAOE)",
            "Sulfuric acid nonyl ester (SANE)",
            "Sulfuric acid decyl ester (SADE)",
            "Sulfuric acid undecyl ester (SAUE)",
            "Sulfuric acid dodecyl ester (SADE)",
            "Sulfuric acid tridecyl ester (SATE)",
            "Sulfuric acid tetradecyl ester (SATE)",
            "Sulfuric acid pentadecyl ester (SAPE)",
            "Sulfuric acid hexadecyl ester (SAHE)",
            "Sulfuric acid heptadecyl ester (SAHE)",
            "Sulfuric acid octadecyl ester (SAOE)",
            "Sulfuric acid nonadecyl ester (SANE)",
            "Sulfuric acid eicosyl ester (SAEE)",
            "Sulfuric acid heneicosyl ester (SAHE)",
            "Sulfuric acid docosyl ester (SADE)",
            "Sulfuric acid tricosyl ester (SATE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Diethyl sulfate (DES)",
                "Ethyl hydrogen sulfate (EHS)"
            ],
            "mismatches": [
                "Sulfuric acid ethyl ester (SAEE)",
                "Sulfuric acid propyl ester (SAPE)",
                "Sulfuric acid butyl ester (SABE)",
                "Sulfuric acid pentyl ester (SAPE)",
                "Sulfuric acid hexyl ester (SAHE)",
                "Sulfuric acid heptyl ester (SAHE)",
                "Sulfuric acid octyl ester (SAOE)",
                "Sulfuric acid nonyl ester (SANE)",
                "Sulfuric acid decyl ester (SADE)",
                "Sulfuric acid undecyl ester (SAUE)",
                "Sulfuric acid dodecyl ester (SADE)",
                "Sulfuric acid tridecyl ester (SATE)",
                "Sulfuric acid tetradecyl ester (SATE)",
                "Sulfuric acid pentadecyl ester (SAPE)",
                "Sulfuric acid hexadecyl ester (SAHE)",
                "Sulfuric acid heptadecyl ester (SAHE)",
                "Sulfuric acid octadecyl ester (SAOE)",
                "Sulfuric acid nonadecyl ester (SANE)",
                "Sulfuric acid eicosyl ester (SAEE)",
                "Sulfuric acid heneicosyl ester (SAHE)",
                "Sulfuric acid docosyl ester (SADE)",
                "Sulfuric acid tricosyl ester (SATE)"
            ],
            "true_referents": [
                "(6S)-6-methyloctyl sulfate",
                "1,2,3-benzenetriol monosulfate",
                "2,6-dimethylheptyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "Butyl hydrogen sulfate",
                "Docosanediol-1,14-disulfate",
                "Ethyl hydrogen sulfate",
                "L-tyrosine methyl ester 4-sulfate",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "decyl hydrogen sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "octyl hydrogen sulfate",
                "propyl hydrogen sulfate",
                "sucrose octasulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester",
                "tetradecyl sulfonic acid"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Sulfuric acid ester of ethyl alcohol (Ethyl sulfate)",
            "Sulfuric acid ester of methyl alcohol (Methyl sulfate)",
            "Sulfuric acid ester of isopropyl alcohol (Isopropyl sulfate)",
            "Sulfuric acid ester of n-butyl alcohol (n-Butyl sulfate)",
            "Sulfuric acid ester of sec-butyl alcohol (sec-Butyl sulfate)",
            "Sulfuric acid ester of tert-butyl alcohol (t-Butyl sulfate)",
            "Sulfuric acid ester of phenol (Phenyl sulfate)",
            "Sulfuric acid ester of o-cresol (o-Cresyl sulfate)",
            "Sulfuric acid ester of m-cresol (m-Cresyl sulfate)",
            "Sulfuric acid ester of p-cresol (p-Cresyl sulfate)",
            "Sulfuric acid ester of xylenol (Xylenyl sulfate)",
            "Sulfuric acid ester of salicylic acid (Salicyl sulfate)",
            "Sulfuric acid ester of acetylsalicylic acid (Acetylsalicyl sulfate)",
            "Sulfuric acid ester of cinnamic acid (Cinnamyl sulfate)",
            "Sulfuric acid ester of benzoic acid (Benzoate sulfate)",
            "Sulfuric acid ester of p-hydroxybenzoic acid (p-Hydroxybenzoate sulfate)",
            "Sulfuric acid ester of hippuric acid (Hippurate sulfate)",
            "Sulfuric acid ester of mandelic acid (Mandelate sulfate)",
            "Sulfuric acid ester of tartaric acid (Tartarate sulfate)",
            "Sulfuric acid ester of citric acid (Citrate sulfate)",
            "Sulfuric acid ester of malic acid (Malate sulfate)",
            "Sulfuric acid ester of fumaric acid (Fumarate sulfate)",
            "Sulfuric acid ester of succinic acid (Succinate sulfate)",
            "Sulfuric acid ester of glutamic acid (Glutamate sulfate)",
            "Sulfuric acid ester of aspartic acid (Aspartate sulfate)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfuric acid ester of ethyl alcohol (Ethyl sulfate)",
                "Sulfuric acid ester of methyl alcohol (Methyl sulfate)",
                "Sulfuric acid ester of phenol (Phenyl sulfate)",
                "Sulfuric acid ester of o-cresol (o-Cresyl sulfate)",
                "Sulfuric acid ester of p-cresol (p-Cresyl sulfate)",
                "Sulfuric acid ester of salicylic acid (Salicyl sulfate)",
                "Sulfuric acid ester of cinnamic acid (Cinnamyl sulfate)",
                "Sulfuric acid ester of p-hydroxybenzoic acid (p-Hydroxybenzoate sulfate)"
            ],
            "mismatches": [
                "Sulfuric acid ester of isopropyl alcohol (Isopropyl sulfate)",
                "Sulfuric acid ester of n-butyl alcohol (n-Butyl sulfate)",
                "Sulfuric acid ester of sec-butyl alcohol (sec-Butyl sulfate)",
                "Sulfuric acid ester of tert-butyl alcohol (t-Butyl sulfate)",
                "Sulfuric acid ester of m-cresol (m-Cresyl sulfate)",
                "Sulfuric acid ester of xylenol (Xylenyl sulfate)",
                "Sulfuric acid ester of acetylsalicylic acid (Acetylsalicyl sulfate)",
                "Sulfuric acid ester of benzoic acid (Benzoate sulfate)",
                "Sulfuric acid ester of hippuric acid (Hippurate sulfate)",
                "Sulfuric acid ester of mandelic acid (Mandelate sulfate)",
                "Sulfuric acid ester of tartaric acid (Tartarate sulfate)",
                "Sulfuric acid ester of citric acid (Citrate sulfate)",
                "Sulfuric acid ester of malic acid (Malate sulfate)",
                "Sulfuric acid ester of fumaric acid (Fumarate sulfate)",
                "Sulfuric acid ester of succinic acid (Succinate sulfate)",
                "Sulfuric acid ester of glutamic acid (Glutamate sulfate)",
                "Sulfuric acid ester of aspartic acid (Aspartate sulfate)"
            ],
            "true_referents": [
                "(6S)-6-methyloctyl sulfate",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-butyloctyl hydrogen sulfate",
                "2-hydroxy-3-(sulfooxy)benzoic acid",
                "3,5-dihydroxybenzoic acid sulfate",
                "4-(sulfooxy)-cinnamic acid",
                "4-acetylphenyl hydrogen sulfate",
                "4-isopropylphenyl sulfate",
                "Butyl hydrogen sulfate",
                "Butyrolactone I 4''-sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "L-tyrosine methyl ester 4-sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "alkyl sulfate",
                "diethyl sulfate",
                "ethyl 4-hydroxybenzoate sulfate",
                "methyl sulfate",
                "o-cresol hydrogen sulfate",
                "p-cresol sulfate",
                "phenyl hydrogen sulfate",
                "propyl 4-hydroxybenzoate sulfate",
                "salicylsulfuric acid",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester"
            ],
            "TP": 8,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            "Alkyl sulfate (AS)",
            "Sodium lauryl sulfate (SLS)",
            "Sodium laureth sulfate (SLES)",
            "Diethyl sulfate",
            "Dimethyl sulfate",
            "Sulfuric acid monododecyl ester",
            "Sulfuric acid monomyristyl ester",
            "Sulfuric acid monostearyl ester",
            "Sulfuric acid dioleyl ester",
            "Sulfuric acid dimyristyl ester",
            "Sulfuric acid distearyl ester",
            "Cetyl sulfate",
            "Stearyl sulfate",
            "Myristyl sulfate",
            "Oleyl sulfate",
            "Lauryl sulfate",
            "Cetearyl sulfate",
            "Cetostearyl sulfate",
            "Sodium cetyl sulfate",
            "Sodium stearyl sulfate",
            "Sodium myristyl sulfate",
            "Sodium oleyl sulfate",
            "Dioctyl sodium sulfosuccinate",
            "Dinonyl sodium sulfosuccinate",
            "Dicetyl sodium sulfosuccinate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Diethyl sulfate",
                "Dimethyl sulfate",
                "Sodium myristyl sulfate",
                "Stearyl sulfate"
            ],
            "mismatches": [
                "Alkyl sulfate (AS)",
                "Sodium lauryl sulfate (SLS)",
                "Sodium laureth sulfate (SLES)",
                "Sulfuric acid monododecyl ester",
                "Sulfuric acid monomyristyl ester",
                "Sulfuric acid monostearyl ester",
                "Sulfuric acid dioleyl ester",
                "Sulfuric acid dimyristyl ester",
                "Sulfuric acid distearyl ester",
                "Cetyl sulfate",
                "Myristyl sulfate",
                "Oleyl sulfate",
                "Lauryl sulfate",
                "Cetearyl sulfate",
                "Cetostearyl sulfate",
                "Sodium cetyl sulfate",
                "Sodium stearyl sulfate",
                "Sodium oleyl sulfate",
                "Dioctyl sodium sulfosuccinate",
                "Dinonyl sodium sulfosuccinate",
                "Dicetyl sodium sulfosuccinate"
            ],
            "true_referents": [
                "(6S)-6-methyloctyl sulfate",
                "2,4-dimethylphenyl hydrogen sulfate",
                "2,5-anhydro-3-O-(2-O-sulfo-alpha-L-idopyranuronosyl)-D-glucitol",
                "2,5-dimethylphenyl hydrogen sulfate",
                "2-(sulfooxy)acetate",
                "2-(sulfooxy)acetic acid",
                "2-O-sulfo-alpha-L-idopyranuronic acid",
                "2-butyloctyl hydrogen sulfate",
                "Diisopropyl sulfate",
                "Ethyl hydrogen sulfate",
                "Steryl sulfate",
                "Sulfuric acid, monooctadecyl ester",
                "alkyl sulfate",
                "cholesterol sulfate",
                "diethyl sulfate",
                "dimethyl sulfate",
                "dodecyl hydrogen sulfate",
                "glycerone sulfate",
                "methyl sulfate",
                "octyl hydrogen sulfate",
                "sodium myristyl sulfate",
                "sulfuric acid [4-(2-aminoethyl)phenyl] ester",
                "tetradecyl sulfonic acid"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "sulfuric ester",
        "domain": "chemistry",
        "response": [
            [
                "Referent",
                "ethanol"
            ],
            [
                "Referent",
                "methanol"
            ],
            [
                "Referent",
                "propanol"
            ],
            [
                "Referent",
                "butanol"
            ],
            [
                "Referent",
                "pentanol"
            ],
            [
                "Referent",
                "hexanol"
            ],
            [
                "Referent",
                "heptanol"
            ],
            [
                "Referent",
                "octanol"
            ],
            [
                "Referent",
                "nonanol"
            ],
            [
                "Referent",
                "decanol"
            ],
            [
                "Referent",
                "undecanol"
            ],
            [
                "Referent",
                "dodecanol"
            ],
            [
                "Referent",
                "tridecanol"
            ],
            [
                "Referent",
                "tetradecanol"
            ],
            [
                "Referent",
                "pentadecanol"
            ],
            [
                "Referent",
                "hexadecanol"
            ],
            [
                "Referent",
                "heptadecanol"
            ],
            [
                "Referent",
                "octadecanol"
            ],
            [
                "Referent",
                "nonadecanol"
            ],
            [
                "Referent",
                "eicosanol"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "ethanol",
                "methanol",
                "propanol",
                "butanol",
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "undecanol",
                "dodecanol",
                "tridecanol",
                "tetradecanol",
                "pentadecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "eicosanol"
            ],
            "true_referents": [
                "(3'-SulfO)galbeta-cer(D18:1/20:0)",
                "(3'-sulfo)Galbeta-Cer(d18:1/18:0(2OH))",
                "1,11,22-Trihydroxy-1,6,11,16,22,27-hexazacyclodotriacontane-2,5,12,15,23,26-hexone",
                "2-palmitoyl-3-stearoyl-2'-sulfo-alpha,alpha-trehalose",
                "Butyl hydrogen sulfate",
                "Cadabicine methyl ether",
                "HS_dp08_0004",
                "HepMer_dp09_0001",
                "Incednam",
                "Maytansinol-9-methyl ether-3-3'-methylbutyrate",
                "Maytansinol-9-methyl ether-3-propionate",
                "Mycotrienin I",
                "Palmyrolide A",
                "Penicipyrroether A",
                "PubChem CID 91849816",
                "SNF-4794-12",
                "Sulfuric acid, monooctadecyl ester",
                "UCF-116-A",
                "alpha-D-GlcNS(6S)-(1->4)-alpha-L-IdoUA(2S)-(1->4)-D-GlcNS(6S)",
                "dimethyl sulfate",
                "octyl hydrogen sulfate",
                "propyl hydrogen sulfate"
            ],
            "TP": 0,
            "FP": 20,
            "FN": 0
        }
    }
]