[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Methyl benzoate (MeBzO)",
            "Butyl formate",
            "Propyl lactate",
            "Isopropyl acetate",
            "Methyl salicylate",
            "Butyl benzoate",
            "Ethyl butyrate",
            "Isopropyl butyrate",
            "Methyl propionate",
            "Ethyl acetate (repeated for clarity, but only one instance should be used)",
            "Isobutyl acetate",
            "Methyl butyrate",
            "Ethyl valerate",
            "Propyl acetate",
            "Isopropyl acetate (repeated for clarity, but only one instance should be used)",
            "Methyl hexanoate",
            "Ethyl pivalate",
            "Isopropyl propionate",
            "Methyl octanoate",
            "Ethyl lactate",
            "Isopropyl butyrate (repeated for clarity, but only one instance should be used)",
            "Methyl decanoate",
            "Ethyl isovalerate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate",
                "Methyl benzoate",
                "Butyl formate",
                "Isopropyl acetate",
                "Methyl salicylate",
                "Butyl benzoate",
                "Ethyl butyrate",
                "Isopropyl butyrate",
                "Methyl propionate",
                "Isobutyl acetate",
                "Methyl butyrate",
                "Propyl acetate",
                "Methyl hexanoate",
                "Isopropyl propionate",
                "Methyl octanoate",
                "Methyl decanoate",
                "Ethyl isovalerate"
            ],
            "mismatches": [
                "Propyl lactate",
                "Ethyl valerate",
                "Ethyl pivalate",
                "Ethyl lactate"
            ],
            "true_referents": [
                "(S)-Isopropyl lactate",
                "2-phenylethyl pivalate",
                "3-Methylbutyl benzoate",
                "Allyl valerate",
                "Benzyl salicylate",
                "Butyl lactate",
                "Isobutyl octanoate",
                "Isobutyl pentanoate",
                "Isopropyl butyrate",
                "Isopropyl octanoate",
                "Isopropyl propionate",
                "Methyl butyrate",
                "Methyl propionate",
                "Propyl pentanoate",
                "acetate ester",
                "benzyl benzoate",
                "butyl benzoate",
                "butyl formate",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl 2-hydroxyisovalerate",
                "ethyl acetate",
                "ethyl butyrate",
                "ethyl ester",
                "ethyl formate",
                "ethyl isovalerate",
                "ethyl propionate",
                "etilefrine pivalate",
                "isobutyl acetate",
                "isobutyl butyrate",
                "isopropyl acetate",
                "isopropyl ester",
                "methyl benzoate",
                "methyl decanoate",
                "methyl hexanoate",
                "methyl octanoate",
                "methyl salicylate",
                "pivalate ester",
                "propyl acetate",
                "propyl butyrate",
                "propyl propionate",
                "valerate ester"
            ],
            "TP": 17,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (C4H8O2)",
            "Methyl salicylate (C8H8O3)",
            "Isopropyl acetate (C5H10O2)",
            "Butyl acetate (C6H12O2)",
            "Propyl formate (C4H8O2)",
            "Ethyl formate (C3H6O2)",
            "Benzyl acetate (C9H10O2)",
            "Methyl butyrate (C5H10O2)",
            "Isopentyl acetate (C7H14O2)",
            "Octyl acetate (C10H20O2)",
            "Propyl benzoate (C10H12O2)",
            "Methyl benzoate (C8H8O2)",
            "Ethyl benzoate (C9H10O2)",
            "Phenyl acetate (C8H8O2)",
            "Tert-butyl acetate (C6H12O2)",
            "Isobutyl acetate (C6H12O2)",
            "Isoamyl acetate (C7H14O2)",
            "Ethyl cinnamate (C11H12O2)",
            "Methyl cinnamate (C10H10O2)",
            "Propyl cinnamate (C12H14O2)",
            "Hexyl acetate (C8H16O2)",
            "Octyl formate (C9H18O2)",
            "Methyl salicylate (C8H8O3)",
            "Ethyl salicylate (C9H10O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate (C4H8O2)",
                "Methyl salicylate (C8H8O3)",
                "Isopropyl acetate (C5H10O2)",
                "Butyl acetate (C6H12O2)",
                "Propyl formate (C4H8O2)",
                "Ethyl formate (C3H6O2)",
                "Benzyl acetate (C9H10O2)",
                "Methyl butyrate (C5H10O2)",
                "Octyl acetate (C10H20O2)",
                "Propyl benzoate (C10H12O2)",
                "Methyl benzoate (C8H8O2)",
                "Ethyl benzoate (C9H10O2)",
                "Phenyl acetate (C8H8O2)",
                "Isobutyl acetate (C6H12O2)",
                "Isoamyl acetate (C7H14O2)",
                "Ethyl cinnamate (C11H12O2)",
                "Methyl cinnamate (C10H10O2)",
                "Propyl cinnamate (C12H14O2)",
                "Hexyl acetate (C8H16O2)",
                "Octyl formate (C9H18O2)"
            ],
            "mismatches": [
                "Isopentyl acetate (C7H14O2)",
                "Tert-butyl acetate (C6H12O2)",
                "Ethyl salicylate (C9H10O3)"
            ],
            "true_referents": [
                "(E)-2-Methyl-2-butenyl butyrate",
                "(E)-hex-2-enyl acetate",
                "1-Methyl-2-oxopropyl butyrate",
                "1-Phenylethyl acetate",
                "1-Phenylpropyl acetate",
                "2-Butoxyethyl acetate",
                "2-Methylpropyl formate",
                "2-Octenyl acetate",
                "2-ethylhexyl acetate",
                "3,7-Dimethyl-6-octenyl formate",
                "3-Methyl-3-butenyl acetate",
                "3-Octyl acetate",
                "3-Octyl formate",
                "3-Phenylpropyl cinnamate",
                "Benzyl acetoacetate",
                "Benzyl salicylate",
                "Ethyl cinnamate",
                "Ethylhexyl salicylate",
                "Isooctyl acetate",
                "Isopentenyl acetate",
                "Isopropyl 2,4-dimethyl-2E,4E-heptadienoate",
                "Isopropyl 2-methylbutanoate",
                "Isopropyl formate",
                "Isopropyl octanoate",
                "Methyl butyrate",
                "Propyl cinnamate",
                "Propyl formate",
                "acetate ester",
                "benzyl acetate",
                "benzyl benzoate",
                "benzyl cinnamate",
                "butyl acetate",
                "ethyl acetate",
                "ethyl benzoate",
                "ethyl formate",
                "hexyl acetate",
                "isoamyl acetate",
                "isoamyl formate",
                "isoamyl propanoate",
                "isobutyl acetate",
                "isopropyl acetate",
                "isopropyl ester",
                "methyl benzoate",
                "methyl cinnamate",
                "methyl formate",
                "methyl salicylate",
                "methyl-3,4,5-trimethoxy cinnamate",
                "octyl acetate",
                "octyl formate",
                "phenyl acetate",
                "phenyl salicylate",
                "propyl benzoate",
                "tert-butyl benzoate",
                "tert-butyl ester"
            ],
            "TP": 20,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Methyl acetate (CAS: 79-20-9)",
            "Ethyl acetate (CAS: 141-78-6)",
            "Propyl acetate (CAS: 109-60-4)",
            "Butyl acetate (CAS: 123-86-4)",
            "Isopropyl acetate (CAS: 108-21-4)",
            "Ethyl formate (CAS: 109-94-4)",
            "Methyl propionate (CAS: 557-07-5)",
            "Ethyl butyrate (CAS: 105-54-4)",
            "Methyl benzoate (CAS: 93-58-3)",
            "Ethyl benzoate (CAS: 93-89-0)",
            "Methyl salicylate (CAS: 119-36-8)",
            "Ethyl salicylate (CAS: 118-61-6)",
            "Methyl methylthioacetate (CAS: 14694-32-7)",
            "Methyl phenylacetate (CAS: 101-27-9)",
            "Ethyl phenylacetate (CAS: 101-97-3)",
            "Methyl laurate (CAS: 111-82-0)",
            "Ethyl laurate (CAS: 106-33-2)",
            "Methyl stearate (CAS: 112-61-8)",
            "Ethyl stearate (CAS: 111-61-5)",
            "Methyl oleate (CAS: 112-62-9)",
            "Ethyl oleate (CAS: 111-62-6)",
            "Methyl linoleate (CAS: 112-63-0)",
            "Ethyl linoleate (CAS: 111-63-7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl acetate (CAS: 79-20-9)",
                "Ethyl acetate (CAS: 141-78-6)",
                "Propyl acetate (CAS: 109-60-4)",
                "Butyl acetate (CAS: 123-86-4)",
                "Isopropyl acetate (CAS: 108-21-4)",
                "Ethyl formate (CAS: 109-94-4)",
                "Methyl propionate (CAS: 557-07-5)",
                "Ethyl butyrate (CAS: 105-54-4)",
                "Methyl benzoate (CAS: 93-58-3)",
                "Ethyl benzoate (CAS: 93-89-0)",
                "Methyl salicylate (CAS: 119-36-8)",
                "Methyl laurate (CAS: 111-82-0)",
                "Ethyl laurate (CAS: 106-33-2)",
                "Methyl stearate (CAS: 112-61-8)",
                "Methyl oleate (CAS: 112-62-9)",
                "Ethyl oleate (CAS: 111-62-6)",
                "Methyl linoleate (CAS: 112-63-0)"
            ],
            "mismatches": [
                "Ethyl salicylate (CAS: 118-61-6)",
                "Methyl methylthioacetate (CAS: 14694-32-7)",
                "Methyl phenylacetate (CAS: 101-27-9)",
                "Ethyl phenylacetate (CAS: 101-97-3)",
                "Ethyl stearate (CAS: 111-61-5)",
                "Ethyl linoleate (CAS: 111-63-7)"
            ],
            "true_referents": [
                "(3-Methylphenyl)methyl acetate",
                "1-Phenylethyl acetate",
                "3-Methyl-2-butenyl propionate",
                "3-Methyl-3-butenyl acetate",
                "3-Methylbutyl benzoate",
                "3-methylthiopropyl acetate",
                "Benzyl salicylate",
                "Ethyl 2-(methylthio)acetate",
                "Ethylhexyl salicylate",
                "Isopropyl octanoate",
                "Methyl 2-(methylthio)acetate",
                "Methyl propionate",
                "Methyl stearate",
                "Oleyl laurate",
                "Phenylmethyl benzeneacetate",
                "acetate ester",
                "benzyl benzoate",
                "butyl acetate",
                "butyrate ester",
                "ethyl acetate",
                "ethyl benzoate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl laurate",
                "ethyl linoleate",
                "ethyl linolenate",
                "ethyl oleate",
                "ethyl propionate",
                "fatty acid ethyl ester",
                "fatty acid methyl ester",
                "isopropyl acetate",
                "isopropyl ester",
                "methyl acetate",
                "methyl benzoate",
                "methyl formate",
                "methyl laurate",
                "methyl linoleate",
                "methyl linolenate",
                "methyl oleate",
                "methyl salicylate",
                "phenyl acetate",
                "propanoate ester",
                "propyl acetate"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Methyl formate (HCOOCH3)",
            "Ethyl acetate (CH3COOCH2CH3)",
            "Butyl propanoate (CH3CH2COOCH2CH2CH2CH3)",
            "Isopropyl myristate (CH3(CH2)12COOCH(CH3)2)",
            "Benzyl benzoate (C6H5COOCH2C6H5)",
            "Ethyl butyrate (CH3CH2CH2COOCH2CH3)",
            "Methyl salicylate (C7H6O3)",
            "Amyl acetate (CH3COOCH2CH2CH2CH2CH3)",
            "Octyl palmitate (CH3(CH2)14COOCH2(CH2)7CH3)",
            "Methyl benzoate (C8H8O2)",
            "Ethyl benzoate (C9H10O2)",
            "Linoleic acid methyl ester (C19H36O2)",
            "Cetyl palmitate (CH3(CH2)14COOCH2(CH2)15CH3)",
            "Phenethyl acetate (C10H12O2)",
            "Methyl cinnamate (C10H10O2)",
            "Ethyl vanillin (C11H14O3)",
            "Glyceryl triacetate (C9H14O6)",
            "Polyethylene terephthalate (PET) repeat unit (-(C10H8O4)-)",
            "Nitrocellulose acetate (mixed ester)",
            "Cholesterol linoleate (C31H50O2)",
            "Tocopheryl acetate (Vitamin E acetate, C31H50O2)",
            "Retinyl acetate (Vitamin A acetate, C20H30O2)",
            "Propylparaben (C10H12O3)",
            "Methylparaben (C8H8O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl formate (HCOOCH3)",
                "Ethyl acetate (CH3COOCH2CH3)",
                "Benzyl benzoate (C6H5COOCH2C6H5)",
                "Ethyl butyrate (CH3CH2CH2COOCH2CH3)",
                "Methyl salicylate (C7H6O3)",
                "Octyl palmitate (CH3(CH2)14COOCH2(CH2)7CH3)",
                "Methyl benzoate (C8H8O2)",
                "Ethyl benzoate (C9H10O2)",
                "Phenethyl acetate (C10H12O2)",
                "Methyl cinnamate (C10H10O2)",
                "Propylparaben (C10H12O3)",
                "Methylparaben (C8H8O3)",
                "Retinyl acetate (Vitamin A acetate, C20H30O2)"
            ],
            "mismatches": [
                "Butyl propanoate (CH3CH2COOCH2CH2CH2CH3)",
                "Isopropyl myristate (CH3(CH2)12COOCH(CH3)2)",
                "Amyl acetate (CH3COOCH2CH2CH2CH2CH3)",
                "Linoleic acid methyl ester (C19H36O2)",
                "Cetyl palmitate (CH3(CH2)14COOCH2(CH2)15CH3)",
                "Ethyl vanillin (C11H14O3)",
                "Glyceryl triacetate (C9H14O6)",
                "Polyethylene terephthalate (PET) repeat unit (-(C10H8O4)-)",
                "Nitrocellulose acetate (mixed ester)",
                "Cholesterol linoleate (C31H50O2)",
                "Tocopheryl acetate (Vitamin E acetate, C31H50O2)"
            ],
            "true_referents": [
                "(3-Methylphenyl)methyl acetate",
                "(E)-2-Butenyl butyrate",
                "1-O-alkyl-2-acetyl-3-acylglycerol",
                "1-O-vanilloyl-beta-D-glucose",
                "1-Phenylethyl acetate",
                "2-Octadecoxyethyl octadecanoate",
                "2-Propenyl 2-ethylbutanoate",
                "4-nitrophenyl acetate",
                "9-cis-retinyl hexadecanoate",
                "Benzyl salicylate",
                "Glycerol 1,2-dihexadecanoate 3-(9Z-octadecenoate)",
                "Glycerol 1,3-dihexadecanoate 2-(9Z-octadecenoate)",
                "Isopropyl 2,4-dimethyl-2E,4E-heptadienoate",
                "Isopropyl 2-methylpropanoate",
                "Mono-(2-ethylhexyl) terephthalate",
                "Mono-2-ethyl-5-carboxypentyl terephthalate",
                "acetate ester",
                "alpha-tocopheronolactone",
                "benzyl benzoate",
                "bis(2-hydroxyethyl) terephthalate",
                "butyl butanoate",
                "cellulose acetate",
                "cholesteryl linoleate",
                "cholesteryl linolenate",
                "decyl palmitate",
                "ethyl acetate",
                "ethyl benzoate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl myristate",
                "ethyl vanillin isobutyrate",
                "ethylparaben",
                "fatty acid methyl ester",
                "isoamyl acetate",
                "methyl benzoate",
                "methyl cinnamate",
                "methyl formate",
                "methyl linoleate",
                "methyl salicylate",
                "methyl-3,4,5-trimethoxy cinnamate",
                "methylparaben",
                "octyl palmitate",
                "phenethyl acetate",
                "propylparaben",
                "retinyl acetate",
                "retinyl ester",
                "tocopherol succinate",
                "vanillin acetate"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Methyl benzoate",
            "Propyl acetate",
            "Butyl butyrate",
            "Isoamyl acetate",
            "Methyl salicylate",
            "Ethyl butyrate",
            "Ethyl formate",
            "Methyl acetate",
            "Pentyl acetate",
            "Octyl acetate",
            "Ethyl lactate",
            "Methyl propionate",
            "Ethyl propionate",
            "Isopropyl acetate",
            "Benzyl acetate",
            "Methyl butyrate",
            "Ethyl valerate",
            "Methyl methacrylate (MMA)",
            "Vinyl acetate",
            "Methyl palmitate",
            "Ethyl hexanoate",
            "Methyl laurate",
            "Ethyl oleate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate (EtOAc)",
                "Methyl benzoate",
                "Propyl acetate",
                "Butyl butyrate",
                "Isoamyl acetate",
                "Methyl salicylate",
                "Ethyl butyrate",
                "Ethyl formate",
                "Methyl acetate",
                "Pentyl acetate",
                "Octyl acetate",
                "Methyl propionate",
                "Ethyl propionate",
                "Isopropyl acetate",
                "Benzyl acetate",
                "Methyl butyrate",
                "Methyl methacrylate (MMA)",
                "Vinyl acetate",
                "Methyl palmitate",
                "Ethyl hexanoate",
                "Methyl laurate",
                "Ethyl oleate"
            ],
            "mismatches": [
                "Ethyl lactate",
                "Ethyl valerate"
            ],
            "true_referents": [
                "3-Octyl acetate",
                "Allyl valerate",
                "Benzyl acetoacetate",
                "Benzyl salicylate",
                "Isopropyl octanoate",
                "Methyl butyrate",
                "Methyl palmitate",
                "Methyl propionate",
                "Octadecyl acetate",
                "Propyl pentanoate",
                "acetate ester",
                "benzyl acetate",
                "benzyl benzoate",
                "bisphenol A dimethacrylate",
                "butyl butanoate",
                "cellulose acetate",
                "decyl propionate",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl acetate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl hexanoate",
                "ethyl isovalerate",
                "ethyl oleate",
                "ethyl propionate",
                "isoamyl acetate",
                "isoamyl isobutyrate",
                "isoamyl propanoate",
                "isopropyl acetate",
                "isopropyl ester",
                "methyl acetate",
                "methyl benzoate",
                "methyl formate",
                "methyl laurate",
                "methyl methacrylate",
                "methyl salicylate",
                "myristyl palmitate",
                "octyl acetate",
                "oleyl oleate",
                "pentyl acetate",
                "pentyl octanoate",
                "pentyl propanoate",
                "propyl acetate",
                "propyl butyrate",
                "propyl propionate",
                "valerate ester",
                "vinyl acetate"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (C4H8O2)",
            "Methyl acetate (C3H6O2)",
            "Butyl acetate (C6H12O2)",
            "Propyl acetate (C5H10O2)",
            "Acetylsalicylic acid (Aspirin) (C9H8O4)",
            "Benzyl acetate (C9H10O2)",
            "Octyl acetate (C10H20O2)",
            "Isobutyl acetate (C5H10O2)",
            "Vinyl acetate (C4H6O2)",
            "Ethyl butanoate (C6H12O2)",
            "Methyl propanoate (C4H8O2)",
            "Ethyl hexanoate (C8H16O2)",
            "Butyl butanoate (C8H16O2)",
            "Methyl benzoate (C8H8O2)",
            "Ethyl lactate (C5H10O3)",
            "Benzyl benzoate (C14H12O2)",
            "Diethyl phthalate (C12H14O4)",
            "Dimethyl phthalate (C10H10O4)",
            "Ethyl 4-aminobenzoate (Benzocaine) (C9H11NO2)",
            "Methyl salicylate (Wintergreen oil) (C8H8O3)",
            "Ethyl 2-methylbutanoate (C7H14O2)",
            "Methyl 2-phenylacetate (C10H12O2)",
            "Ethyl 3-hydroxybutanoate (C6H12O3)",
            "Benzyl salicylate (C13H12O3)",
            "Ethyl 3-phenylpropanoate (C12H14O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate",
                "Methyl acetate",
                "Butyl acetate",
                "Propyl acetate",
                "Acetylsalicylic acid",
                "Benzyl acetate",
                "Octyl acetate",
                "Isobutyl acetate",
                "Vinyl acetate",
                "Ethyl hexanoate",
                "Butyl butanoate",
                "Methyl benzoate",
                "Benzyl benzoate",
                "Diethyl phthalate",
                "Dimethyl phthalate",
                "Methyl salicylate",
                "Ethyl 3-hydroxybutanoate",
                "Benzyl salicylate"
            ],
            "mismatches": [
                "Ethyl butanoate",
                "Methyl propanoate",
                "Ethyl lactate",
                "Ethyl 4-aminobenzoate",
                "Ethyl 2-methylbutanoate",
                "Methyl 2-phenylacetate",
                "Ethyl 3-phenylpropanoate"
            ],
            "true_referents": [
                "(3-Methylphenyl)methyl acetate",
                "(3S)-3,7-dimethyloct-7-en-1-yl phenylacetate",
                "(E)-hex-2-enyl acetate",
                "1-Ethenylhexyl butanoate",
                "1-Phenylethyl acetate",
                "1-Phenylpropyl acetate",
                "2-Butoxyethyl acetate",
                "2-Methylbutyl 2-methylbutanoate",
                "2-Methylpropyl propanoate",
                "2-Octenyl acetate",
                "2-Propenyl 2-aminobenzoate",
                "2-Propenyl 2-ethylbutanoate",
                "2-Propenyl octanoate",
                "3-Hexenyl salicylic acid",
                "3-Methyl-3-butenyl acetate",
                "3-Octyl acetate",
                "Benzyl acetoacetate",
                "Benzyl salicylate",
                "Di(2,6-dimethyl-4-heptyl) phthalate",
                "Dimethyl phthalate",
                "Ethyl 2-aminobenzoate",
                "Ethyl 2-ethylbutanoate",
                "Ethyl 2-ethylhexanoate",
                "Glycerol 1-propanoate diacetate",
                "Isobutyl 10-undecenoate",
                "Isobutyl pentanoate",
                "Methyl 3-amino-4-methylbenzoate",
                "Phenylmethyl benzeneacetate",
                "Propyl 2-methylpropanoate",
                "acetate ester",
                "acetylsalicylic acid",
                "benzoate ester",
                "benzyl acetate",
                "benzyl benzoate",
                "butyl acetate",
                "butyl butanoate",
                "butyl octanoate",
                "diethyl phthalate",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl (R)-3-hydroxybutanoate",
                "ethyl 3-hydroxybutyrate",
                "ethyl acetate",
                "ethyl hexanoate",
                "isobutyl acetate",
                "methyl 8-[2-(2-formyl-vinyl)-3-hydroxy-5-oxo-cyclopentyl]-octanoate",
                "methyl acetate",
                "methyl benzoate",
                "methyl salicylate",
                "octyl acetate",
                "phenyl salicylate",
                "propyl acetate",
                "vinyl acetate"
            ],
            "TP": 18,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Acetic acid ethyl ester (EtOAc)",
            "Methyl acetate (MeOAc)",
            "Ethyl butyrate (EtBu)",
            "Methyl butyrate (MeBu)",
            "Propyl acetate (PrOAc)",
            "Butyl acetate (BuOAc)",
            "Isobutyl acetate (i-BuOAc)",
            "Pentyl acetate (PeOAc)",
            "Hexyl acetate (HexOAc)",
            "Heptyl acetate (HeptOAc)",
            "Octyl acetate (OctOAc)",
            "Nonyl acetate (NonOAc)",
            "Decyl acetate (DecOAc)",
            "Undecyl acetate (UndOAc)",
            "Dodecyl acetate (DodOAc)",
            "Tridecyl acetate (TridOAc)",
            "Tetradecyl acetate (TetraOAc)",
            "Pentadecyl acetate (PentaOAc)",
            "Hexadecyl acetate (HexaOAc)",
            "Heptadecyl acetate (HeptaOAc)",
            "Octadecyl acetate (OctaOAc)",
            "Nonadecyl acetate (NonaOAc)",
            "Eicosyl acetate (EicosOAc)",
            "Heneicosyl acetate (HeneicOAc)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethyl acetate",
                "methyl acetate",
                "ethyl butyrate",
                "methyl butyrate",
                "propyl acetate",
                "butyl acetate",
                "isobutyl acetate",
                "pentyl acetate",
                "hexyl acetate",
                "heptyl acetate",
                "octyl acetate",
                "nonyl acetate",
                "decyl acetate",
                "undecyl acetate",
                "dodecyl acetate",
                "tridecyl acetate",
                "tetradecyl acetate",
                "pentadecyl acetate",
                "heptadecyl acetate",
                "octadecyl acetate",
                "eicosyl acetate"
            ],
            "mismatches": [
                "Nonadecyl acetate (NonaOAc)",
                "Heneicosyl acetate (HeneicOAc)"
            ],
            "true_referents": [
                "1,4-Nonanediol diacetate",
                "1-octadecyl-heptadecanoate",
                "10-Undecenyl acetate",
                "2-(pentyloxy)ethyl acetate",
                "2-Nonenyl acetate",
                "2-Undecenyl acetate",
                "2-ethylhexyl acetate",
                "3-Heptyl acetate",
                "3-Nonanon-1-yl acetate",
                "3-Octyl acetate",
                "3E-Hexenyl acetate",
                "9-Octadecenyl acetate",
                "Butyl 3-methylbutanoate",
                "Decyl acetate",
                "Dodecyl acetate",
                "Eicosyl acetate",
                "Ethyl 2-ethylbutanoate",
                "Ethyl pentadecanoate",
                "Heptadecyl acetate",
                "Heptyl acetate",
                "Heptyl heptanoate",
                "Isobutyl octanoate",
                "Isobutyl pentanoate",
                "Methyl 3-methylbutanoate",
                "Methyl butyrate",
                "Methyl methoxyacetate",
                "Octadecyl acetate",
                "Octyl octanoate",
                "Pentadecyl acetate",
                "Propyl 2-methylpropanoate",
                "Tetradecyl acetate",
                "Tridecyl acetate",
                "Undecyl acetate",
                "acetate ester",
                "butyl acetate",
                "butyl butanoate",
                "decyl decanoate",
                "decyl oleate",
                "dodecyl dodecanoate",
                "dodecyl octanoate",
                "ethyl acetate",
                "ethyl arachidonate",
                "ethyl butyrate",
                "hexadecyl hexanoate",
                "hexyl acetate",
                "hexyl hexanoate",
                "isobutyl acetate",
                "methyl acetate",
                "methyl henicosanoate",
                "nonyl acetate",
                "octyl acetate",
                "pentadecyl butyrate",
                "pentyl acetate",
                "propanoate ester",
                "propyl acetate",
                "tetradecyl octanoate"
            ],
            "TP": 21,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Methyl acetate (CH3COOCH3)",
            "Ethyl butanoate (CH3CH2COOCH2CH3)",
            "Propyl propionate (CH3CH2CH2COOCH2CH3)",
            "Butyl formate (CH3CH2CH2COOCH3)",
            "Pentyl isobutyrate (CH3CH2CH2CH2COOCH(CH3)2)",
            "Hexyl valerate (CH3(CH2)4COOCH2CH3)",
            "Heptyl caproate (CH3(CH2)5COOCH2CH3)",
            "Octyl palmitate (CH3(CH2)6COOCH2(CH2)14CH3)",
            "Nonyl oleate (CH3(CH2)7COOCH2CH=CH(CH2)7CH3)",
            "Decyl stearate (CH3(CH2)8COOCH2(CH2)16CH3)",
            "Undecyl benzoate (CH3(CH2)9COOCH2C6H5)",
            "Dodecyl phthalate (CH3(CH2)10COOCH2C6H4COO(CH2)10CH3)",
            "Tridecyl citrate (CH3(CH2)11COOCH2CH2COOC(CH2)2COO(CH2)10CH3)",
            "Tetradecyl acetate (CH3(CH2)12COOCH2CH3)",
            "Pentadecyl propionate (CH3(CH2)13COOCH2CH2CH3)",
            "Hexadecyl butyrate (CH3(CH2)14COOCH2CH2CH2CH3)",
            "Heptadecyl isovalerate (CH3(CH2)15COOCH2CH(CH3)CH2CH3)",
            "Octadecyl caproate (CH3(CH2)16COOCH2(CH2)4CH3)",
            "Nonadecyl valerate (CH3(CH2)17COOCH2CH2CH2CH2CH3)",
            "Eicosyl laurate (CH3(CH2)18COOCH2(CH2)10CH3)",
            "Heneicosyl myristate (CH3(CH2)19COOCH2(CH2)12CH3)",
            "Docosyl palmitoleate (CH3(CH2)20COOCH2(CH=CH(CH2)14CH3)",
            "Tricosyl oleate (CH3(CH2)21COOCH2CH=CH(CH2)7CH3)",
            "Tetracosyl linoleate (CH3(CH2)22COOCH2CH=CH(CH2)4CH=CH(CH2)7CH3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl acetate (CH3COOCH3)",
                "Pentyl isobutyrate (CH3CH2CH2CH2COOCH(CH3)2)",
                "Octyl palmitate (CH3(CH2)6COOCH2(CH2)14CH3)",
                "Hexadecyl butyrate (CH3(CH2)14COOCH2CH2CH2CH3)",
                "Tetradecyl acetate (CH3(CH2)12COOCH2CH3)",
                "Propyl propionate (CH3CH2CH2COOCH2CH3)",
                "Butyl formate (CH3CH2CH2COOCH3)"
            ],
            "mismatches": [
                "Ethyl butanoate (CH3CH2COOCH2CH3)",
                "Hexyl valerate (CH3(CH2)4COOCH2CH3)",
                "Heptyl caproate (CH3(CH2)5COOCH2CH3)",
                "Nonyl oleate (CH3(CH2)7COOCH2CH=CH(CH2)7CH3)",
                "Decyl stearate (CH3(CH2)8COOCH2(CH2)16CH3)",
                "Undecyl benzoate (CH3(CH2)9COOCH2C6H5)",
                "Dodecyl phthalate (CH3(CH2)10COOCH2C6H4COO(CH2)10CH3)",
                "Pentadecyl propionate (CH3(CH2)13COOCH2CH2CH3)",
                "Heptadecyl isovalerate (CH3(CH2)15COOCH2CH(CH3)CH2CH3)",
                "Octadecyl caproate (CH3(CH2)16COOCH2(CH2)4CH3)",
                "Nonadecyl valerate (CH3(CH2)17COOCH2CH2CH2CH2CH3)",
                "Eicosyl laurate (CH3(CH2)18COOCH2(CH2)10CH3)",
                "Heneicosyl myristate (CH3(CH2)19COOCH2(CH2)12CH3)",
                "Docosyl palmitoleate (CH3(CH2)20COOCH2(CH=CH(CH2)14CH3)",
                "Tricosyl oleate (CH3(CH2)21COOCH2CH=CH(CH2)7CH3)",
                "Tetracosyl linoleate (CH3(CH2)22COOCH2CH=CH(CH2)4CH=CH(CH2)7CH3)"
            ],
            "true_referents": [
                "(+/-)-Ethyl 2-hydroxy-3-methylvalerate",
                "(2E)-2-hexenyl isovalerate",
                "(2R)-3-(Octadecyloxy)-2-(pentadecanoyloxy)propyl octadecanoate",
                "(3-Methylphenyl)methyl acetate",
                "(E)-16-octadecenoic acid methyl ester",
                "(E)-2-Hexenyl butyrate",
                "1-Ethenylhexyl butanoate",
                "1-O-16-methylheptadecyl oleate",
                "1-O-20-methylhenicosyl oleate",
                "1-O-24-methylpentacosyl oleate",
                "1-O-hexacosyl oleate",
                "1-O-tetracosyl oleate",
                "1-octadecyl-11E-hexadecenoate",
                "12-Methyltetradecyl acetate",
                "12E-Tetradecenyl acetate",
                "2-Hexenyl valerate",
                "2-Pentyl 3-methylbutanoate",
                "3-Heptyl acetate",
                "7E,9E,11-Dodecatrienyl acetate",
                "8E-octadecenyl heptadecanoate",
                "Allyl valerate",
                "Bis(3,5,5-trimethylhexyl) phthalate",
                "Di(2,6-dimethyl-4-heptyl) phthalate",
                "Ethyl 2-ethylbutanoate",
                "Ethyl 2-methyl-3,4-pentadienoate",
                "Ethyl pentadecanoate",
                "Heptyl acetate",
                "Heptyl heptanoate",
                "Isopropyl 2,4-dimethyl-2E,4E-heptadienoate",
                "Linoleyl linoleate",
                "Linoleyl oleate",
                "Methyl propionate",
                "Nonyl isovalerate",
                "Nonyl octanoate",
                "Oleyl laurate",
                "Pentadecyl palmitoleate",
                "Pentyl 3-methylbutanoate",
                "Tetradecyl acetate",
                "Tridecyl acetate",
                "benzyl benzoate",
                "butyl formate",
                "decyl butyrate",
                "decyl palmitate",
                "ethyl benzoate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl laurate",
                "ethyl myristate",
                "ethyl propionate",
                "hexadecyl butyrate",
                "l-Norvaline, N-(2-methoxyethoxycarbonyl)-, undecyl ester",
                "methyl acetate",
                "methyl palmitoleate",
                "n-butyl oleate",
                "octyl palmitate",
                "oleyl oleate",
                "pentyl isobutyrate",
                "phthalate ester",
                "propyl propionate",
                "valeryl hexanoate"
            ],
            "TP": 7,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Methyl acetate (CH\u2083COOCH\u2083)",
            "Ethyl acetate (CH\u2083COOCH\u2082CH\u2083)",
            "Propyl acetate (CH\u2083COOCH\u2082CH\u2082CH\u2083)",
            "Butyl acetate (CH\u2083COOCH\u2082CH\u2082CH\u2082CH\u2083)",
            "Benzyl acetate (C\u2086H\u2085CH\u2082OOCCH\u2083)",
            "Ethyl butyrate (CH\u2083CH\u2082CH\u2082COOCH\u2082CH\u2083)",
            "Methyl formate (HCOOCH\u2083)",
            "Dimethyl phthalate (C\u2086H\u2084(CO\u2082CH\u2083)\u2082)",
            "Diethyl sebacate (C\u2081\u2080H\u2081\u2088O\u2084)",
            "Ethyl lactate (CH\u2083CH(OH)COOCH\u2082CH\u2083)",
            "Methyl salicylate (C\u2087H\u2086O\u2083)",
            "Isopropyl myristate (C\u2081\u2085H\u2083\u2080O\u2082)",
            "Octyl acetate (CH\u2083COO(CH\u2082)\u2086CH\u2083)",
            "Butyl methacrylate (CH\u2082=C(CH\u2083)COOCH\u2082CH\u2082CH\u2082CH\u2083)",
            "Isobutyl acetate (CH\u2083COOCH(CH\u2083)CH\u2082CH\u2083)",
            "Butyl butyrate (CH\u2083CH\u2082CH\u2082COOCH\u2082CH\u2082CH\u2082CH\u2083)",
            "Triethyl citrate (C\u2086H\u2081\u2084O\u2087)",
            "Benzyl butyrate (C\u2081\u2084H\u2082\u2082O\u2082)",
            "Ethyl propionate (CH\u2083CH\u2082COOCH\u2082CH\u2083)",
            "Methyl benzoate (C\u2087H\u2086O\u2082)",
            "Propyl formate (HCOOCH\u2082CH\u2082CH\u2083)",
            "Ethyl hexanoate (CH\u2083(CH\u2082)\u2084COOCH\u2082CH\u2083)",
            "Methyl anthranilate (C\u2089H\u2089NO\u2082)",
            "Ethyl laurate (CH\u2083(CH\u2082)\u2087COOCH\u2082CH\u2083)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl acetate (CH\u2083COOCH\u2083)",
                "Ethyl acetate (CH\u2083COOCH\u2082CH\u2083)",
                "Propyl acetate (CH\u2083COOCH\u2082CH\u2082CH\u2083)",
                "Butyl acetate (CH\u2083COOCH\u2082CH\u2082CH\u2082CH\u2083)",
                "Benzyl acetate (C\u2086H\u2085CH\u2082OOCCH\u2083)",
                "Ethyl butyrate (CH\u2083CH\u2082CH\u2082COOCH\u2082CH\u2083)",
                "Methyl formate (HCOOCH\u2083)",
                "Methyl salicylate (C\u2087H\u2086O\u2083)",
                "Octyl acetate (CH\u2083COO(CH\u2082)\u2086CH\u2083)",
                "Butyl methacrylate (CH\u2082=C(CH\u2083)COOCH\u2082CH\u2082CH\u2082CH\u2083)",
                "Isobutyl acetate (CH\u2083COOCH(CH\u2083)CH\u2082CH\u2083)",
                "Ethyl propionate (CH\u2083CH\u2082COOCH\u2082CH\u2083)",
                "Methyl benzoate (C\u2087H\u2086O\u2082)",
                "Propyl formate (HCOOCH\u2082CH\u2082CH\u2083)",
                "Ethyl hexanoate (CH\u2083(CH\u2082)\u2084COOCH\u2082CH\u2083)",
                "Methyl anthranilate (C\u2089H\u2089NO\u2082)",
                "Ethyl laurate (CH\u2083(CH\u2082)\u2087COOCH\u2082CH\u2083)"
            ],
            "mismatches": [
                "Dimethyl phthalate (C\u2086H\u2084(CO\u2082CH\u2083)\u2082)",
                "Diethyl sebacate (C\u2081\u2080H\u2081\u2088O\u2084)",
                "Ethyl lactate (CH\u2083CH(OH)COOCH\u2082CH\u2083)",
                "Isopropyl myristate (C\u2081\u2085H\u2083\u2080O\u2082)",
                "Butyl butyrate (CH\u2083CH\u2082CH\u2082COOCH\u2082CH\u2082CH\u2082CH\u2083)",
                "Triethyl citrate (C\u2086H\u2081\u2084O\u2087)",
                "Benzyl butyrate (C\u2081\u2084H\u2082\u2082O\u2082)"
            ],
            "true_referents": [
                "(3-Methylphenyl)methyl acetate",
                "(E)-2-Butenyl butyrate",
                "(E)-2-Methyl-2-butenyl butyrate",
                "(E)-2-Octenyl butyrate",
                "2-Butoxyethyl acetate",
                "2-Methylpropyl formate",
                "2E,7-Octadienyl acetate",
                "3-Methyl-3-butenyl acetate",
                "3-Octyl acetate",
                "7E,9E,11-Dodecatrienyl acetate",
                "Benzyl salicylate",
                "Butylmethacrylate",
                "Di(2,6-dimethyl-4-heptyl) phthalate",
                "Ethyl (2E,6Z)-dodecadienoate",
                "Ethyl (E)-7,9-decadienoate",
                "Ethyl 2-ethyl-3-phenylpropanoate",
                "Ethyl 2-ethylhexanoate",
                "Ethyl 5-methylhexanoate",
                "Isopropyl 2-methyl-2E-pentenoate",
                "Isopropyl 2-methylbutanoate",
                "Isopropyl 2-methylpropanoate",
                "Isopropyl 3-methylbutanoate",
                "Methyl propionate",
                "Propyl formate",
                "acetate ester",
                "benzyl acetate",
                "benzyl benzoate",
                "butyl acetate",
                "butyl acrylate",
                "butyrate ester",
                "decyl propionate",
                "dimethyl sebacate",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl acetate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl hexanoate",
                "ethyl laurate",
                "ethyl propionate",
                "isobutyl acetate",
                "methyl N-methylanthranilate",
                "methyl acetate",
                "methyl anthranilate",
                "methyl benzoate",
                "methyl formate",
                "methyl laurate",
                "methyl methacrylate",
                "methyl salicylate",
                "mono[2-(carboxymethyl)hexyl] phthalate",
                "octyl acetate",
                "propyl acetate"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Methyl salicylate",
            "Glyceryl trioleate",
            "Butyl butyrate",
            "Isopropyl myristate",
            "Cellulose acetate",
            "Polyethylene terephthalate (PET)",
            "Aspirin (acetylsalicylic acid)",
            "Vitamin A palmitate",
            "Ethyl formate",
            "Propyl propionate",
            "Methyl benzoate",
            "Triacetin",
            "Isoamyl acetate",
            "Ethyl butyrate",
            "Benzyl acetate",
            "Methyl methacrylate",
            "Cocaine",
            "Heroin",
            "Ethyl cinnamate",
            "Octyl acetate",
            "Methyl anthranilate",
            "Ethyl vanillin",
            "Gamma-butyrolactone (GBL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate",
                "Methyl salicylate",
                "Cellulose acetate",
                "acetylsalicylic acid",
                "Ethyl formate",
                "Propyl propionate",
                "Methyl benzoate",
                "Triacetin",
                "Isoamyl acetate",
                "Ethyl butyrate",
                "Benzyl acetate",
                "Methyl methacrylate",
                "Cocaine",
                "Ethyl cinnamate",
                "Octyl acetate",
                "Methyl anthranilate",
                "gamma-butyrolactone"
            ],
            "mismatches": [
                "Glyceryl trioleate",
                "Butyl butyrate",
                "Isopropyl myristate",
                "Polyethylene terephthalate (PET)",
                "Vitamin A palmitate",
                "Heroin",
                "Ethyl vanillin"
            ],
            "true_referents": [
                "3-Octyl acetate",
                "4-butyl-gamma-butyrolactone",
                "Benzyl acetoacetate",
                "Benzyl salicylate",
                "Cocaethylene",
                "Ethyl cinnamate",
                "Glycerol triundecanoate",
                "Glyceryl lactooleate",
                "Isopropyl 2-methylpropanoate",
                "Methyl acrylate",
                "Mono-(2-ethylhexyl) terephthalate",
                "Octadecyl acetate",
                "Oleyl palmitate",
                "Tanacetin",
                "Trinactin",
                "Vanillin isobutyrate",
                "acetate ester",
                "acetylsalicylic acid",
                "all-trans-retinyl palmitate",
                "benzyl acetate",
                "benzyl benzoate",
                "bis(2-hydroxyethyl) terephthalate",
                "butyl butanoate",
                "butyl propionate",
                "cellulose acetate",
                "cocaine",
                "dimethyl terephthalate",
                "ethyl acetate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl propionate",
                "ethyl vanillin isobutyrate",
                "gamma-butyrolactone",
                "glycolate ester",
                "isoamyl acetate",
                "isoamyl isobutyrate",
                "isoamyl propanoate",
                "isopropyl palmitate",
                "lofentanyl",
                "methyl N-methylanthranilate",
                "methyl anthranilate",
                "methyl benzoate",
                "methyl cinnamate",
                "methyl formate",
                "methyl methacrylate",
                "methyl salicylate",
                "octyl acetate",
                "propyl butyrate",
                "propyl propionate",
                "retinyl palmitate",
                "triacetin",
                "vanillin acetate",
                "vinyl acetate"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Methyl acetate",
            "Ethyl acetate",
            "Propyl acetate",
            "Isopropyl acetate",
            "Butyl acetate",
            "Isobutyl acetate",
            "Amyl acetate",
            "Methyl propionate",
            "Ethyl propionate",
            "Methyl butyrate",
            "Ethyl butyrate",
            "Methyl valerate",
            "Ethyl valerate",
            "Methyl caproate",
            "Ethyl caproate",
            "Methyl benzoate",
            "Ethyl benzoate",
            "Propyl benzoate",
            "Butyl benzoate",
            "Benzyl acetate",
            "Phenethyl acetate",
            "Methyl salicylate",
            "Ethyl salicylate",
            "Aspirin (Acetylsalicylic acid)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl acetate",
                "Ethyl acetate",
                "Propyl acetate",
                "Isopropyl acetate",
                "Butyl acetate",
                "Isobutyl acetate",
                "Methyl propionate",
                "Ethyl propionate",
                "Methyl butyrate",
                "Ethyl butyrate",
                "Methyl benzoate",
                "Ethyl benzoate",
                "Propyl benzoate",
                "Butyl benzoate",
                "Benzyl acetate",
                "Phenethyl acetate",
                "Methyl salicylate",
                "acetylsalicylic acid"
            ],
            "mismatches": [
                "Amyl acetate",
                "Methyl valerate",
                "Ethyl valerate",
                "Methyl caproate",
                "Ethyl caproate",
                "Ethyl salicylate"
            ],
            "true_referents": [
                "1-Phenylethyl acetate",
                "2-Hexenyl valerate",
                "Allyl valerate",
                "Benzyl acetoacetate",
                "Benzyl salicylate",
                "Ethyl 3-cyclohexylpropionate",
                "Ethyl undecanoate",
                "Ethylhexyl salicylate",
                "Isobutyl octanoate",
                "Isobutyl pentanoate",
                "Isopropyl octanoate",
                "Methyl butyrate",
                "Methyl propionate",
                "Phenylmethyl benzeneacetate",
                "Propyl pentanoate",
                "acetylsalicylic acid",
                "benzyl acetate",
                "benzyl benzoate",
                "butyl acetate",
                "butyl benzoate",
                "butyl butanoate",
                "decyl propionate",
                "ethyl acetate",
                "ethyl acetoacetate",
                "ethyl benzoate",
                "ethyl butyrate",
                "ethyl isovalerate",
                "ethyl octanoate",
                "ethyl propionate",
                "isoamyl acetate",
                "isobutyl acetate",
                "isopropyl acetate",
                "isopropyl ester",
                "methyl acetate",
                "methyl benzoate",
                "methyl oleate",
                "methyl salicylate",
                "methyl undecanoate",
                "phenethyl acetate",
                "propyl acetate",
                "propyl benzoate",
                "propyl butyrate",
                "propyl propionate",
                "valerate ester"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Methyl methacrylate (MMA)",
            "Isopropyl myristate",
            "Polyvinyl acetate (PVAc)",
            "Cellulose acetate",
            "Aspirin (acetylsalicylic acid)",
            "Vitamin C palmitate (ascorbyl palmitate)",
            "Benzocaine",
            "Triacetin",
            "Polyethylene terephthalate (PET)",
            "Polylactic acid (PLA)",
            "Isoamyl acetate",
            "Ethyl butyrate",
            "Dimethyl phthalate",
            "Diethyl malonate",
            "Methyl salicylate",
            "Ethyl lactate",
            "Glyceryl tristearate",
            "Polyhydroxybutyrate (PHB)",
            "Polyhydroxyalkanoates (PHA)",
            "Mestranol",
            "Testosterone undecanoate",
            "Ricinoleic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate",
                "Methyl methacrylate",
                "Cellulose acetate",
                "acetylsalicylic acid",
                "ascorbyl palmitate",
                "Benzocaine",
                "Triacetin",
                "Isoamyl acetate",
                "Ethyl butyrate",
                "Dimethyl phthalate",
                "Methyl salicylate"
            ],
            "mismatches": [
                "Isopropyl myristate",
                "Polyvinyl acetate",
                "Polyethylene terephthalate",
                "Polylactic acid",
                "Ethyl lactate",
                "Glyceryl tristearate",
                "Polyhydroxybutyrate",
                "Polyhydroxyalkanoates",
                "Mestranol",
                "Testosterone undecanoate",
                "Ricinoleic acid"
            ],
            "true_referents": [
                "(R)-mevalonolactone",
                "Arachidyl linoleate",
                "Benzyl salicylate",
                "Diethyl 2-(3-butenyl)malonate",
                "Diethyl aminomalonate",
                "Dimethyl phthalate",
                "Ethylene glycol distearate",
                "Glycidyl stearate",
                "Hexyl 3-methylbutanoate",
                "Isopropyl 2-methylpropanoate",
                "L-ascorbate",
                "L-ascorbic acid",
                "Linoleyl oleate",
                "Mono-(2-ethylhexyl) terephthalate",
                "Monobutylphthalate",
                "Oleyl linoleate",
                "Palmitic acid, 4-hydroxybutyl ester",
                "Polyoxyethylene dioleate",
                "Tanacetin",
                "Trinactin",
                "Tropacocaine",
                "acetate ester",
                "acetylsalicylic acid",
                "ascorbyl palmitate",
                "benzocaine",
                "bis(2-hydroxyethyl) terephthalate",
                "bisphenol A dimethacrylate",
                "cellulose acetate",
                "diethyl malate",
                "diethyl phthalate",
                "dimethyl terephthalate",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl 3-hydroxybutyrate",
                "ethyl acetate",
                "ethyl butyrate",
                "isoamyl acetate",
                "isoamyl isobutyrate",
                "isoamyl propanoate",
                "isopropyl palmitate",
                "medroxyprogesterone acetate",
                "methyl methacrylate",
                "methyl salicylate",
                "methyl undecanoate",
                "procaine",
                "propyl butyrate",
                "spironolactone",
                "testosterone acetate",
                "testosterone cypionate",
                "triacetin",
                "tristearoylglycerol",
                "vinyl acetate"
            ],
            "TP": 11,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Methyl benzoate (MeBz)",
            "Isopropyl myristate (IPM)",
            "Methyl salicylate (MeSal)",
            "Glyceryl trinitrate (GTN)",
            "Ethyl butyrate (EtBu)",
            "Methyl palmitate (MePa)",
            "Butyl acetate (BuOAc)",
            "Ethyl formate (EtFor)",
            "Propyl propionate (PrPr)",
            "Isopentyl acetate (IpAc)",
            "Benzyl benzoate (BzBz)",
            "Methyl stearate (MeSt)",
            "Ethyl laurate (EtLa)",
            "Propyl acetate (PrOAc)",
            "Isobutyl isobutyrate (iBuiBu)",
            "Phenethyl acetate (PhEtOAc)",
            "Methyl oleate (MeOl)",
            "Ethyl linoleate (EtLi)",
            "Butyl butyrate (BuBu)",
            "Methyl arachidonate (MeAr)",
            "Ethyl linolenate (EtLn)",
            "Propyl palmitate (PrPa)",
            "Isoamyl acetate (IpAc)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate",
                "Methyl benzoate",
                "Methyl salicylate",
                "Ethyl butyrate",
                "Methyl palmitate",
                "Butyl acetate",
                "Ethyl formate",
                "Propyl propionate",
                "Benzyl benzoate",
                "Methyl stearate",
                "Ethyl laurate",
                "Propyl acetate",
                "Phenethyl acetate",
                "Methyl oleate",
                "Ethyl linoleate",
                "Butyl butyrate",
                "Methyl arachidonate",
                "Ethyl linolenate",
                "Isoamyl acetate"
            ],
            "mismatches": [
                "Isopropyl myristate",
                "Glyceryl trinitrate",
                "Isopentyl acetate",
                "Isobutyl isobutyrate",
                "Propyl palmitate"
            ],
            "true_referents": [
                "1,2-ditetradecanoyl-sn-glycerol",
                "1-Phenylethyl acetate",
                "3-Methylbutyl benzoate",
                "Benzyl salicylate",
                "Ethyl 2-ethylbutanoate",
                "Isobutyl pentanoate",
                "Isooctyl acetate",
                "Isopentenyl acetate",
                "Isopropyl 2-methylbutanoate",
                "Isopropyl 2-methylpropanoate",
                "Isopropyl 3-methylbutanoate",
                "Methyl palmitate",
                "Methyl stearate",
                "Myristoleyl arachidonate",
                "Myristoleyl oleate",
                "Oleyl laurate",
                "Phenylmethyl benzeneacetate",
                "Propyl 2-methylpropanoate",
                "acetate ester",
                "benzoate ester",
                "benzyl benzoate",
                "butyl acetate",
                "butyl butanoate",
                "butyrate ester",
                "decyl palmitate",
                "decyl propionate",
                "ethyl acetate",
                "ethyl butyrate",
                "ethyl formate",
                "ethyl laurate",
                "ethyl linoleate",
                "ethyl linolenate",
                "ethyl propionate",
                "isoamyl acetate",
                "isoamyl isobutyrate",
                "isoamyl propanoate",
                "isobutyl acetate",
                "isobutyl benzoate",
                "methyl arachidonate",
                "methyl benzoate",
                "methyl formate",
                "methyl oleate",
                "methyl salicylate",
                "myristyl palmitate",
                "octyl palmitate",
                "phenethyl acetate",
                "propanoate ester",
                "propyl acetate",
                "propyl propionate",
                "triacyl-sn-glycerol"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Isopropyl acetate",
            "Ethyl butyrate",
            "Isobutyl acetate",
            "Ethyl hexanoate",
            "Geraniol acetate",
            "Ethyl benzoate",
            "Isopropyl salicylate",
            "Ethyl cinnamate",
            "Ethyl 4-hydroxybenzoate",
            "Methyl salicylate",
            "Ethyl vanillate",
            "Ethyl 4-hydroxybenzoate",
            "Isobutyl salicylate",
            "Ethyl 3-hydroxybenzoate",
            "Ethyl 2-hydroxybenzoate",
            "Ethyl 4-methoxybenzoate",
            "Ethyl 3-methoxybenzoate",
            "Ethyl 2-methoxybenzoate",
            "Ethyl 4-ethoxybenzoate",
            "Ethyl 3-ethoxybenzoate",
            "Ethyl 2-ethoxybenzoate",
            "Ethyl 4-propoxybenzoate",
            "Ethyl 3-propoxybenzoate",
            "Ethyl 2-propoxybenzoate",
            "Ethyl 4-butoxybenzoate",
            "Ethyl 3-butoxybenzoate",
            "Ethyl 2-butoxybenzoate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl acetate",
                "Isopropyl acetate",
                "Ethyl butyrate",
                "Isobutyl acetate",
                "Ethyl hexanoate",
                "Ethyl benzoate",
                "Isopropyl salicylate",
                "Ethyl cinnamate",
                "Methyl salicylate",
                "Isobutyl salicylate"
            ],
            "mismatches": [
                "Geraniol acetate",
                "Ethyl vanillate",
                "Ethyl 3-hydroxybenzoate",
                "Ethyl 2-hydroxybenzoate",
                "Ethyl 4-methoxybenzoate",
                "Ethyl 3-methoxybenzoate",
                "Ethyl 2-methoxybenzoate",
                "Ethyl 4-ethoxybenzoate",
                "Ethyl 3-ethoxybenzoate",
                "Ethyl 2-ethoxybenzoate",
                "Ethyl 4-propoxybenzoate",
                "Ethyl 3-propoxybenzoate",
                "Ethyl 2-propoxybenzoate",
                "Ethyl 4-butoxybenzoate",
                "Ethyl 3-butoxybenzoate",
                "Ethyl 2-butoxybenzoate"
            ],
            "true_referents": [
                "2-Ethylhexyl-4-hydroxybenzoate",
                "4-Ethoxy ethylbenzoate",
                "Amyl salicylate",
                "Benzyl salicylate",
                "Ethyl cinnamate",
                "Ethyl undecanoate",
                "Isobutyl octanoate",
                "Isobutyl pentanoate",
                "Isobutyl salicylate",
                "Isopropyl octanoate",
                "acetate ester",
                "benzyl benzoate",
                "citronellol acetate",
                "ethyl 3,4-dihydroxybenzoate",
                "ethyl 4-hydroxybenzoate sulfate",
                "ethyl acetate",
                "ethyl benzoate",
                "ethyl butyrate",
                "ethyl hexanoate",
                "ethyl vanillin isobutyrate",
                "isobutyl acetate",
                "isopropyl acetate",
                "isopropyl ester",
                "isopropyl salicylate",
                "methyl 3-hydroxybenzoate",
                "methyl 4-acetoxy-3-methoxybenzoate",
                "methyl cinnamate",
                "methyl salicylate",
                "methyl vanillate",
                "methyl-4-acetoxybenzoate",
                "propyl butyrate"
            ],
            "TP": 10,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            "Methyl acetate (MeAc)",
            "Methyl formate (MeF)",
            "Ethyl acetate (EtAc)",
            "Ethyl formate (EtF)",
            "Isopropyl acetate (i-PrAc)",
            "Butyl acetate (BuAc)",
            "Isobutyl acetate (i-BuAc)",
            "Methyl salicylate (MeSal)",
            "Methyl benzoate (MeBz)",
            "Ethyl benzoate (EtBz)",
            "Methyl 4-hydroxybenzoate (MePHB)",
            "Methyl 3,4-dihydroxybenzoate (Me34DHB)",
            "Aspirin (Acetylsalicylic acid)",
            "Methyl phenylacetate (MePAA)",
            "Ethyl phenylacetate (EtPAA)",
            "Methyl 3-phenylpropionate (Me3PPP)",
            "Methyl 2-phenylbutyrate (Me2PBB)",
            "Methyl 4-phenylbutyrate (Me4PBB)",
            "Methyl cinnamate (MeCin)",
            "Ethyl cinnamate (EtCin)",
            "Methyl nicotinate (MeNic)",
            "Ethyl nicotinate (EtNic)",
            "Methyl gallate (MeGal)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl acetate (MeAc)",
                "Methyl formate (MeF)",
                "Ethyl acetate (EtAc)",
                "Ethyl formate (EtF)",
                "Isopropyl acetate (i-PrAc)",
                "Butyl acetate (BuAc)",
                "Isobutyl acetate (i-BuAc)",
                "Methyl salicylate (MeSal)",
                "Methyl benzoate (MeBz)",
                "Ethyl benzoate (EtBz)",
                "Methyl 3,4-dihydroxybenzoate (Me34DHB)",
                "Aspirin (Acetylsalicylic acid)",
                "Methyl cinnamate (MeCin)",
                "Ethyl cinnamate (EtCin)"
            ],
            "mismatches": [
                "Methyl 4-hydroxybenzoate (MePHB)",
                "Methyl phenylacetate (MePAA)",
                "Ethyl phenylacetate (EtPAA)",
                "Methyl 3-phenylpropionate (Me3PPP)",
                "Methyl 2-phenylbutyrate (Me2PBB)",
                "Methyl 4-phenylbutyrate (Me4PBB)",
                "Methyl nicotinate (MeNic)",
                "Ethyl nicotinate (EtNic)",
                "Methyl gallate (MeGal)"
            ],
            "true_referents": [
                "(R)-4,8-dimethylnonanoylcarnitine",
                "1-Phenylethyl acetate",
                "2-Methylpropyl 2-methylpropionate",
                "2-methylbutyl pentanoate",
                "3-Methylbutyl benzoate",
                "3-phenylpropionate ester",
                "4-Methyloctyl acetate",
                "Benzyl salicylate",
                "Dodecyl gallate",
                "Ethyl 4-phenylbutanoate",
                "Ethyl cinnamate",
                "Isobutyl octanoate",
                "Isopropyl octanoate",
                "Methyl 2,5-dihydroxybenzoate",
                "Methyl 2,6-dihydroxybenzoate",
                "Methyl 4-phenylbutanoate",
                "Octyl phenylacetate",
                "Phenylmethyl benzeneacetate",
                "acetylsalicylic acid",
                "benzoate ester",
                "benzyl cinnamate",
                "benzyl nicotinate",
                "butyl acetate",
                "butyl butanoate",
                "cyclitol nicotinate",
                "ethyl acetate",
                "ethyl benzoate",
                "ethyl ester",
                "ethyl formate",
                "ethyl gallate",
                "ethyl nonanoate",
                "inositol nicotinate",
                "isobutyl acetate",
                "isobutyl butyrate",
                "isopropyl acetate",
                "isopropyl ester",
                "methyl 3,4-dihydroxybenzoate",
                "methyl 3-hydroxybenzoate",
                "methyl 3-phenylpropanoate",
                "methyl acetate",
                "methyl benzoate",
                "methyl cinnamate",
                "methyl cis-cinnamate",
                "methyl formate",
                "methyl salicylate",
                "methyl-4-acetoxybenzoate",
                "octyl gallate",
                "phenethyl acetate",
                "phenyl acetate"
            ],
            "TP": 14,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "carboxylic ester",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "carboxylic acid",
                "Identifier": "CA"
            },
            {
                "Referent": "carboxylic acid derivative",
                "Identifier": "CAD"
            },
            {
                "Referent": "carboxylic acid anhydride",
                "Identifier": "CAA"
            },
            {
                "Referent": "carboxylic acid chloride",
                "Identifier": "CAC"
            },
            {
                "Referent": "carboxylic acid halide",
                "Identifier": "CAB"
            },
            {
                "Referent": "carboxylic acid ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid methyl ester",
                "Identifier": "CEM"
            },
            {
                "Referent": "carboxylic acid ethyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid propyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid butyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid pentyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid hexyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid heptyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid octyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid nonyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid decyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid undecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid dodecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid tridecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid tetradecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid pentadecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid hexadecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid heptadecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid octadecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid nonadecyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid eicosyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid docosyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid tetracosyl ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid pentacosanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid hexacosanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid heptacosanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid octacosanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid nonacosanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid triacontanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid tetratriacontanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid pentatriacontanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid hexatriacontanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid heptatriacontanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid octatriacontanol ester",
                "Identifier": "CEC"
            },
            {
                "Referent": "carboxylic acid nonatriacontanol ester",
                "Identifier": "CEC"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "carboxylic acid",
                "carboxylic acid derivative",
                "carboxylic acid anhydride",
                "carboxylic acid chloride",
                "carboxylic acid halide",
                "carboxylic acid ester",
                "carboxylic acid methyl ester",
                "carboxylic acid ethyl ester",
                "carboxylic acid propyl ester",
                "carboxylic acid butyl ester",
                "carboxylic acid pentyl ester",
                "carboxylic acid hexyl ester",
                "carboxylic acid heptyl ester",
                "carboxylic acid octyl ester",
                "carboxylic acid nonyl ester",
                "carboxylic acid decyl ester",
                "carboxylic acid undecyl ester",
                "carboxylic acid dodecyl ester",
                "carboxylic acid tridecyl ester",
                "carboxylic acid tetradecyl ester",
                "carboxylic acid pentadecyl ester",
                "carboxylic acid hexadecyl ester",
                "carboxylic acid heptadecyl ester",
                "carboxylic acid octadecyl ester",
                "carboxylic acid nonadecyl ester",
                "carboxylic acid eicosyl ester",
                "carboxylic acid docosyl ester",
                "carboxylic acid tetracosyl ester",
                "carboxylic acid pentacosanol ester",
                "carboxylic acid hexacosanol ester",
                "carboxylic acid heptacosanol ester",
                "carboxylic acid octacosanol ester",
                "carboxylic acid nonacosanol ester",
                "carboxylic acid triacontanol ester",
                "carboxylic acid tetratriacontanol ester",
                "carboxylic acid pentatriacontanol ester",
                "carboxylic acid hexatriacontanol ester",
                "carboxylic acid heptatriacontanol ester",
                "carboxylic acid octatriacontanol ester",
                "carboxylic acid nonatriacontanol ester"
            ],
            "true_referents": [
                "(-)-camphanic acid",
                "(E)-lowdenic acid",
                "1,10-dimethyl ester-2-decenedioic acid",
                "2-Methylbutyl 2-methylbutanoate",
                "2-Methylbutyl 3-methylbutanoate",
                "3-Methylbutyl 2-methylbutanoate",
                "7-Hexadecenoic acid, methyl ester",
                "9-Octadecenoic acid, ethyl ester",
                "Dodecyl acetate",
                "Ethyl 2-methyl-3,4-pentadienoate",
                "Octadecadienoic acid, methyl ester",
                "Propanoic acid, 2-methyl-, 2-ethyl-3-hydroxyhexyl ester",
                "dodecyl hexanoate"
            ],
            "TP": 0,
            "FP": 40,
            "FN": 0
        }
    }
]