[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone ((CH3)2CO)",
            "Acetoacetate (AcAc-)",
            "Beta-hydroxybutyrate (BHB)",
            "Acetophenone (C8H8O)",
            "Butanone (MEK, Methyl Ethyl Ketone)",
            "Pentan-2-one (Methyl Butanone)",
            "Hexan-2-one (Methyl Pentanone)",
            "Hexan-3-one (Methyl Methylbutanone)",
            "Heptan-2-one (Ethyl Butanone)",
            "Heptan-4-one (Methyl Methylpentanone)",
            "Octan-2-one (Ethyl Pentanone)",
            "Octan-3-one (Methyl Methylpentanone)",
            "Octan-4-one (Methyl Ethylbutanone)",
            "Octan-5-one (Methyl Butylmethanone)",
            "Nonan-2-one (Ethyl Hexanone)",
            "Nonan-3-one (Methyl Methylhexanone)",
            "Nonan-4-one (Methyl Ethylpentanone)",
            "Nonan-5-one (Methyl Butylpentanone)",
            "Nonan-6-one (Ethyl Butylmethanone)",
            "Decan-2-one (Ethyl Heptanone)",
            "Decan-3-one (Methyl Methylheptanone)",
            "Decan-4-one (Methyl Ethylhexanone)",
            "Decan-5-one (Methyl Butylpentanone)",
            "Decan-6-one (Ethyl Butylpentanone)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "acetophenone",
                "butanone",
                "heptan-2-one",
                "pentanone"
            ],
            "mismatches": [
                "Acetoacetate (AcAc-)",
                "Beta-hydroxybutyrate (BHB)",
                "Pentan-2-one (Methyl Butanone)",
                "Hexan-2-one (Methyl Pentanone)",
                "Hexan-3-one (Methyl Methylbutanone)",
                "Heptan-4-one (Methyl Methylpentanone)",
                "Octan-2-one (Ethyl Pentanone)",
                "Octan-3-one (Methyl Methylpentanone)",
                "Octan-4-one (Methyl Ethylbutanone)",
                "Octan-5-one (Methyl Butylmethanone)",
                "Nonan-2-one (Ethyl Hexanone)",
                "Nonan-3-one (Methyl Methylhexanone)",
                "Nonan-4-one (Methyl Ethylpentanone)",
                "Nonan-5-one (Methyl Butylpentanone)",
                "Nonan-6-one (Ethyl Butylmethanone)",
                "Decan-2-one (Ethyl Heptanone)",
                "Decan-3-one (Methyl Methylheptanone)",
                "Decan-4-one (Methyl Ethylhexanone)",
                "Decan-5-one (Methyl Butylpentanone)",
                "Decan-6-one (Ethyl Butylpentanone)"
            ],
            "true_referents": [
                "(S)-2-acetyl-2-hydroxybutanoic acid",
                "2,4-dimethyl-3-pentanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-3-nonacosanone",
                "2-Methyl-4-heptanone",
                "2-Methyloctan-4-one",
                "2-octanone",
                "3,3,4,4-tetramethyl-2-pentanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methyl-2,4-nonanedione",
                "3-Methylbutan-2-one",
                "3-Methylene-2-octanone",
                "3-Methylheptan-2-one",
                "3-Methylheptan-4-one",
                "3-Methylhexan-2-one",
                "3-Methylpentan-2-one",
                "3-decanone",
                "3-octanone",
                "4-Hydroxy-3-methyl-2-butanone",
                "4-Methylhexan-2-one",
                "4-Methylhexan-3-one",
                "4-hydroxybutan-2-one",
                "4-methylheptan-3-one",
                "4-propoxy-2-butanone",
                "4S-Methylhexan-3-one",
                "6-oxo-nonan-1-ol",
                "Acetoin acetate",
                "Acetoxyacetone",
                "Heptan-2,5-dione",
                "Nonan-2,5-dione",
                "acetone",
                "acetophenone",
                "acetophenones",
                "beta-hydroxy ketone",
                "butanone",
                "decan-2-one",
                "dehydroacetic acid",
                "heptan-2-one",
                "hexanone",
                "methyl ketone",
                "nonane-4,6-dione",
                "pentanone"
            ],
            "TP": 5,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (CH3COCH3)",
            "Beta-hydroxybutyrate",
            "Acetoacetate",
            "3-Hydroxybutanone",
            "Acetylacetone (2,4-Pentanedione)",
            "Butanone (MEK)",
            "Cyclohexanone",
            "Methyl ethyl ketone (MEK)",
            "2-Heptanone",
            "2-Butanone (MEK)",
            "2-Pentanone",
            "2-Hexanone",
            "2-Octanone",
            "3-Pentanone",
            "4-Methyl-2-pentanone",
            "2-Nonanone",
            "3-Hexanone",
            "3-Heptanone",
            "2-Undecanone",
            "Diacetyl (2,3-Butanedione)",
            "Acetoin (3-Hydroxy-2-butanone)",
            "Methyl isobutyl ketone (MIBK)",
            "Methyl isopropyl ketone (MIK)",
            "Mesityl oxide (2,4-Pentanone)",
            "Cyclopentanone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "acetylacetone",
                "butanone",
                "cyclohexanone",
                "2-octanone",
                "3-hexanone",
                "methyl isobutyl ketone"
            ],
            "mismatches": [
                "Beta-hydroxybutyrate",
                "Acetoacetate",
                "3-Hydroxybutanone",
                "Methyl ethyl ketone (MEK)",
                "2-Heptanone",
                "2-Pentanone",
                "2-Hexanone",
                "3-Pentanone",
                "4-Methyl-2-pentanone",
                "2-Nonanone",
                "3-Heptanone",
                "2-Undecanone",
                "Diacetyl (2,3-Butanedione)",
                "Acetoin (3-Hydroxy-2-butanone)",
                "Methyl isopropyl ketone (MIK)",
                "Mesityl oxide (2,4-Pentanone)",
                "Cyclopentanone"
            ],
            "true_referents": [
                "(R)-acetoin",
                "(S)-2-acetyl-2-hydroxybutanoic acid",
                "1,3-Diacetylpropane",
                "1-Hydroxy-2-pentanone",
                "1-hydroxybutan-2-one",
                "1-phenyl-2-hexanone",
                "2,3-Decanedione",
                "2,3-Undecanedione",
                "2,4-dimethyl-3-pentanone",
                "2-Dodecanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-3-hexanone",
                "2-Methyl-4-heptanone",
                "2-Nonadecanone",
                "2-octanone",
                "3,3,4,4-tetramethyl-2-pentanone",
                "3-Hydroxy-2-pentanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methylene-2-octanone",
                "3-hexanone",
                "3-octanone",
                "4,4-Dimethoxy-2-butanone",
                "4-Hydroxy-3-methyl-2-butanone",
                "4-Methyl-2,3-pentanedione",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "6-Undecanone",
                "Acetoin acetate",
                "Acetoxyacetone",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "Nonan-2,5-dione",
                "acetoin",
                "acetone",
                "acetone d6",
                "acetylacetonate",
                "acetylacetone",
                "beta-hydroxy ketone",
                "butane-2,3-dione",
                "butanone",
                "cyclohexanone",
                "cyclohexanones",
                "hexanone",
                "hydroxycyclohexanone",
                "mesityl(piperidin-4-yl)methanone",
                "methyl ketone",
                "methyl propenyl ketone",
                "methyl pyruvate",
                "nonanone",
                "pentanone"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (2-Propanone)",
            "Methyl Ethyl Ketone (MEK, 2-Butanone)",
            "Methyl Isobutyl Ketone (MIBK, 4-Methyl-2-Pentanone)",
            "Methyl Propyl Ketone (2-Pentanone)",
            "Diethyl Ketone (3-Pentanone)",
            "Methyl tert-Butyl Ketone (MTBK, 2,2-Dimethyl-3-Butanone)",
            "Acetophenone (1-Phenylethanone)",
            "Benzophenone (Diphenylmethanone)",
            "Cyclohexanone",
            "Methyl Vinyl Ketone (3-Buten-2-one)",
            "Ethyl Acetoacetate (Ethyl 3-Oxo-Butanoate)",
            "Acetoacetone (2,4-Pentanedione)",
            "Propionyl Chloride (Propionyl Chloride)",
            "Butyryl Chloride (Butyryl Chloride)",
            "Valeryl Chloride (Valeryl Chloride)",
            "Hexanoyl Chloride (Hexanoyl Chloride)",
            "Isovaleryl Chloride (Isovaleryl Chloride)",
            "Acetylacetone (2,4-Pentanedione)",
            "Fructose-1,6-bisphosphate",
            "Acetoacetate",
            "\u03b2-Hydroxy-\u03b2-methylbutyryl-CoA",
            "Acetyl-CoA",
            "Acetoacetyl-CoA",
            "3-Hydroxy-3-methylglutaryl-CoA (HMG-CoA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "acetophenone",
                "benzophenone",
                "cyclohexanone",
                "acetylacetone"
            ],
            "mismatches": [
                "Methyl Ethyl Ketone (MEK, 2-Butanone)",
                "Methyl Isobutyl Ketone (MIBK, 4-Methyl-2-Pentanone)",
                "Methyl Propyl Ketone (2-Pentanone)",
                "Diethyl Ketone (3-Pentanone)",
                "Methyl tert-Butyl Ketone (MTBK, 2,2-Dimethyl-3-Butanone)",
                "Methyl Vinyl Ketone (3-Buten-2-one)",
                "Ethyl Acetoacetate (Ethyl 3-Oxo-Butanoate)",
                "Acetoacetone (2,4-Pentanedione)",
                "Propionyl Chloride (Propionyl Chloride)",
                "Butyryl Chloride (Butyryl Chloride)",
                "Valeryl Chloride (Valeryl Chloride)",
                "Hexanoyl Chloride (Hexanoyl Chloride)",
                "Isovaleryl Chloride (Isovaleryl Chloride)",
                "Fructose-1,6-bisphosphate",
                "Acetoacetate",
                "\u03b2-Hydroxy-\u03b2-methylbutyryl-CoA",
                "Acetyl-CoA",
                "Acetoacetyl-CoA",
                "3-Hydroxy-3-methylglutaryl-CoA (HMG-CoA)"
            ],
            "true_referents": [
                "(2,3,3-trimethyl-5-oxocyclopent-3-enyl)acetyl-CoA",
                "(5R)-5-hydroxyhexan-2-one",
                "1,5-anhydro-D-fructose",
                "11-oxo-ETE-CoA",
                "12alpha-hydroxy-3-oxochola-4,6-dien-24-oyl-CoA",
                "2,4-dimethyl-3-pentanone",
                "2-chloro-1-(4-isopropylphenyl)-3-methyl-1-butanone",
                "2-hydroxy-1-phenyl-1-propanone",
                "3-(4-hydroxy-3-methoxyphenyl)-3-oxopropanoyl-CoA",
                "3-Methylbutan-2-one",
                "3-chloro-1-phenyl-1-propanone",
                "3-deoxy-keto-D-fructose",
                "3-oxocholoyl-CoA",
                "4-Methyl-2,3-pentanedione",
                "5-methoxyvalerophenone O-(2-aminoethyl)oxime",
                "Acetoin acetate",
                "Acetoxyacetone",
                "Butylone",
                "Butyro-betaine",
                "Ethyl 3,5-dimethoxy-2-propionylphenylacetate",
                "Ethyl 3-oxo-3-phenylpropanoate",
                "Ethyl isobutyl ketone",
                "Hexachloroacetone",
                "Hexacosane-7,9-dione",
                "Methyl isobutyl ketone",
                "N-(2-benzoyl-1-methylvinyl)acetamide",
                "acetone",
                "acetophenone",
                "acetylacetonate",
                "acetylacetone",
                "benzophenone",
                "benzophenones",
                "cyclohexanone",
                "cyclohexanones",
                "fluticasone propionate",
                "hydroxyacetone",
                "hydroxycyclohexanone",
                "methyl ketone",
                "methyl propenyl ketone",
                "methyl pyruvate",
                "p-Ethylacetophenone",
                "valerophenone"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (propan-2-one)",
            "Butanone (2-butanone)",
            "Pentanone (2-pentanone)",
            "Hexanone (2-hexanone)",
            "Cyclopentanone",
            "Cyclohexanone",
            "Acetophenone (methyl phenyl ketone)",
            "Benzophenone (diphenyl ketone)",
            "Propiophenone (ethyl phenyl ketone)",
            "Diacetyl (2,3-butanedione)",
            "Acetylacetone (pentane-2,4-dione)",
            "Furanone (2(5H)-furanone)",
            "Ribulose-5-phosphate",
            "Fructose (D-Fructose)",
            "Psuedoionone",
            "Methyl ethyl ketone (2-butanone)",
            "Isophorone (3,5,5-trimethylcyclohex-2-en-1-one)",
            "Mesityl oxide (4-methylpent-3-en-2-one)",
            "Camphor (2,3-dimethyl-3-campholenone)",
            "Cortisone (17\u03b1-hydroxyprogesterone)",
            "Testosterone (17\u03b2-hydroxyandrost-4-en-3-one)",
            "Cholesterol (cholesta-5,16-dien-3\u03b2-ol)",
            "Rubredoxin",
            "Phloroglucinol acetone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (propan-2-one)",
                "Butanone (2-butanone)",
                "Cyclopentanone",
                "Cyclohexanone",
                "Acetophenone (methyl phenyl ketone)",
                "Benzophenone (diphenyl ketone)",
                "Propiophenone (ethyl phenyl ketone)",
                "Pseudoionone",
                "Isophorone (3,5,5-trimethylcyclohex-2-en-1-one)",
                "Testosterone (17\u03b2-hydroxyandrost-4-en-3-one)"
            ],
            "mismatches": [
                "Pentanone (2-pentanone)",
                "Hexanone (2-hexanone)",
                "Diacetyl (2,3-butanedione)",
                "Acetylacetone (pentane-2,4-dione)",
                "Furanone (2(5H)-furanone)",
                "Ribulose-5-phosphate",
                "Fructose (D-Fructose)",
                "Psuedoionone",
                "Mesityl oxide (4-methylpent-3-en-2-one)",
                "Camphor (2,3-dimethyl-3-campholenone)",
                "Cortisone (17\u03b1-hydroxyprogesterone)",
                "Cholesterol (cholesta-5,16-dien-3\u03b2-ol)",
                "Rubredoxin",
                "Phloroglucinol acetone"
            ],
            "true_referents": [
                "(R)-camphor",
                "(S)-5-(benzoyl)dihydro-2(3H)-furanone",
                "1,3-Diacetylpropane",
                "1,5-anhydro-D-fructose",
                "1-(2-furanyl)-1-Octanone",
                "1-Hydroxy-2-pentanone",
                "1-hydroxy-4-methylpentan-2-one",
                "1-phenyl-2-hexanone",
                "17alpha-hydroxyprogesterone",
                "2'-methyl-Propiophenone",
                "2'-methylacetophenone",
                "2,3-Decanedione",
                "2-acyl-4,6-diprenylphloroglucinol",
                "2-acylphloroglucinol",
                "3,5,5-Trimethyl-3-cyclohexen-1-one",
                "3-Hydroxy-2-pentanone",
                "3-cyano-2-butanone",
                "3-deoxy-keto-D-fructose",
                "3-hexanone",
                "3-methylcyclopentanone",
                "3beta-hydroxy-5alpha-cholestan-15-one",
                "3beta-hydroxycholest-5-en-26-al",
                "4,5alpha-Dihydro-2-(hydroxymethylene)testosterone",
                "4-hydroxy-5-methyl-3-furanone",
                "4-propoxy-2-butanone",
                "5alpha-cholesta-24-en-3beta,20beta-diol-23-one",
                "CDP-D-ribulose",
                "Ethyl isobutyl ketone",
                "L-erythrulose 1-phosphate",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetylacetone",
                "alpha-ionone",
                "benzophenone",
                "benzophenones",
                "butane-2,3-dione",
                "butanone",
                "cyclohexanone",
                "cyclohexanones",
                "cyclopentanone",
                "cyclopentanones",
                "hexanone",
                "hydroxycyclohexanone",
                "isophorone",
                "mesityl(piperidin-4-yl)methanone",
                "methyl ketone",
                "methyl propenyl ketone",
                "methyl pyruvate",
                "pentane-2,3-dione",
                "pentanone",
                "propiophenone",
                "pseudoionone",
                "rubiadin",
                "rubrorotiorin",
                "testosterone"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (C3H6O)",
            "Butanone (C4H8O)",
            "Cyclohexanone (C6H10O)",
            "Acetophenone (C8H8O)",
            "Benzophenone (C13H10O)",
            "2-Pentanone (C5H10O)",
            "3-Pentanone (C5H10O)",
            "4-Heptanone (C7H14O)",
            "2-Heptanone (C7H14O)",
            "Methyl Ethyl Ketone (MEK, C4H8O)",
            "Diisopropyl Ketone (C7H14O)",
            "2-Octanone (C8H16O)",
            "3-Octanone (C8H16O)",
            "3,3-Dimethyl-2-butanone (C6H12O)",
            "Camphor (C10H16O)",
            "Mesityl Oxide (C6H10O)",
            "Dibenzyl Ketone (C15H14O)",
            "Pinacolone (C6H12O)",
            "2-Nonanone (C9H18O)",
            "Methyl Isobutyl Ketone (MIBK, C6H12O)",
            "3-Hexanone (C6H12O)",
            "1-Phenyl-2-propanone (P2P, C9H10O)",
            "2-Undecanone (C11H22O)",
            "2-Decanone (C10H20O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (C3H6O)",
                "Butanone (C4H8O)",
                "Cyclohexanone (C6H10O)",
                "Acetophenone (C8H8O)",
                "Benzophenone (C13H10O)",
                "4-Heptanone (C7H14O)",
                "2-Octanone (C8H16O)",
                "3-Octanone (C8H16O)",
                "Camphor (C10H16O)",
                "Methyl Isobutyl Ketone (MIBK, C6H12O)",
                "3-Hexanone (C6H12O)"
            ],
            "mismatches": [
                "2-Pentanone (C5H10O)",
                "3-Pentanone (C5H10O)",
                "2-Heptanone (C7H14O)",
                "Methyl Ethyl Ketone (MEK, C4H8O)",
                "Diisopropyl Ketone (C7H14O)",
                "3,3-Dimethyl-2-butanone (C6H12O)",
                "Mesityl Oxide (C6H10O)",
                "Dibenzyl Ketone (C15H14O)",
                "Pinacolone (C6H12O)",
                "2-Nonanone (C9H18O)",
                "1-Phenyl-2-propanone (P2P, C9H10O)",
                "2-Undecanone (C11H22O)",
                "2-Decanone (C10H20O)"
            ],
            "true_referents": [
                "1-Hydroxy-2-pentanone",
                "1-isopropoxyacetone",
                "2,3',4,6-tetrahydroxybenzophenone",
                "2,3-Undecanedione",
                "2,4-dimethyl-3-pentanone",
                "2-Dodecanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-3-hexanone",
                "2-Methyl-4-heptanone",
                "2-Nonadecanone",
                "2-Tetradecanone",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-octanone",
                "3-Hydroxy-2-pentanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methylene-2-octanone",
                "3-decanone",
                "3-hexanone",
                "3-octanone",
                "4,4-Dimethoxy-2-butanone",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "6-C-(3-Hydroxyisopentyl)eriodictyol",
                "6-Undecanone",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "Nonan-2,5-dione",
                "Penicanone",
                "Pinophilone A",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetophenones",
                "benzophenone",
                "benzophenones",
                "butanone",
                "camphor",
                "cyclohexanone",
                "cyclohexanone, 4-(1,1-dimethylethyl)-",
                "dialkyl ketone",
                "dibenzoylmethane",
                "diketone",
                "hexanone",
                "hydroxycyclohexanone",
                "mesityl(piperidin-4-yl)methanone",
                "mesityl(piperidin-4-yl)methanone hydrochloride",
                "methyl ketone",
                "methyl propenyl ketone",
                "nonanone",
                "pentanone"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (C3H6O)",
            "2-Butanone (C4H8O)",
            "Cyclohexanone (C6H10O)",
            "3-Pentanone (C5H10O)",
            "4-Pentanone (C5H10O)",
            "2-Pentanone (C5H10O)",
            "2-Hexanone (C6H12O)",
            "3-Hexanone (C6H12O)",
            "2-Heptanone (C7H14O)",
            "3-Heptanone (C7H14O)",
            "2-Octanone (C8H16O)",
            "3-Octanone (C8H16O)",
            "2-Nonanone (C9H18O)",
            "3-Nonanone (C9H18O)",
            "2-Undecanone (C11H22O)",
            "3-Undecanone (C11H22O)",
            "2-Nonyl-3-oxobutanoate (C13H24O3)",
            "Acetoacetate (C4H6O3)",
            "Benzyl methyl ketone (C10H12O)",
            "Dihydroxyacetone (C3H6O3)",
            "5-Oxohexanoic acid (C6H10O3)",
            "2-Pyrone (C5H6O2)",
            "2-Propyl-3-pentanone (C8H16O)",
            "2-Methyl-3-hexanone (C7H14O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "butanone",
                "cyclohexanone",
                "3-hexanone",
                "2-octanone",
                "3-octanone",
                "2-undecanone",
                "dihydroxyacetone",
                "2-methyl-3-hexanone"
            ],
            "mismatches": [
                "3-pentanone",
                "4-pentanone",
                "2-pentanone",
                "2-hexanone",
                "3-heptanone",
                "2-nonanone",
                "3-nonanone",
                "3-undecanone",
                "2-nonyl-3-oxobutanoate",
                "acetoacetate",
                "benzyl methyl ketone",
                "5-oxohexanoic acid",
                "2-pyrone",
                "2-propyl-3-pentanone"
            ],
            "true_referents": [
                "(S)-3,4-dihydroxy-2-oxobutanoic acid",
                "1-Hydroxy-2-pentanone",
                "1-phenyl-2-hexanone",
                "2,3-Undecanedione",
                "2,4-dimethyl-3-pentanone",
                "2-Dodecanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-3-hexanone",
                "2-Methyl-4-heptanone",
                "2-Nonadecanone",
                "2-octanone",
                "2D-2,3,5/4,6-pentahydroxycyclohexanone",
                "3,3,4,4-tetramethyl-2-pentanone",
                "3,3-dimethyl-2-Hexanone",
                "3-Hydroxy-2-pentanone",
                "3-Methylene-2-octanone",
                "3-hexanone",
                "3-hydroxy-2-methyl-4-pyrone",
                "3-hydroxycyclohexanone",
                "3-octanone",
                "3-pyrones",
                "4,4-Dimethoxy-2-butanone",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "5-methyl-2-hexanone",
                "6-(2,4-dihydroxyl-5-methylphenyl)-6-oxohexanoic acid",
                "6-Undecanone",
                "Acetoin acetate",
                "Acetoxyacetone",
                "Ethyl isopropyl ketone",
                "Nonan-2,5-dione",
                "acetone",
                "acetone d6",
                "benzyl 2-methyl-3-oxobutanoate",
                "butanone",
                "cyclohexanone",
                "cyclohexanone, 4-(1,1-dimethylethyl)-",
                "dehydroacetic acid",
                "dihydroxyacetone",
                "hexanone",
                "hydroxyacetone",
                "hydroxycyclohexanone",
                "methyl ketone",
                "methyl propenyl ketone",
                "naphtho-gamma-pyrone",
                "nonane-4,6-dione",
                "nonanone",
                "pentanone"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (Propanone)",
            "Butanone (MEK)",
            "Cyclohexanone",
            "Benzophenone",
            "Acetophenone",
            "Methyl Ethyl Ketone (MEK)",
            "Methyl Isobutyl Ketone (MIBK)",
            "Diethyl Ketone",
            "Diacetone Alcohol",
            "Methyl Vinyl Ketone",
            "Isophorone",
            "Mesityl Oxide",
            "Cyclopentanone",
            "Dibenzyl Ketone",
            "Methyl Propyl Ketone",
            "Ethyl Butyl Ketone",
            "Dipropyl Ketone",
            "Diisopropyl Ketone",
            "Diisobutyl Ketone",
            "Cycloheptanone",
            "Cyclooctanone",
            "Cyclononanone",
            "Cyclodecanone",
            "Cycloundecanone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (Propanone)",
                "Butanone (MEK)",
                "Cyclohexanone",
                "Benzophenone",
                "Acetophenone",
                "Methyl Isobutyl Ketone (MIBK)",
                "Diacetone Alcohol",
                "Isophorone",
                "Cyclopentanone"
            ],
            "mismatches": [
                "Methyl Ethyl Ketone (MEK)",
                "Diethyl Ketone",
                "Methyl Vinyl Ketone",
                "Mesityl Oxide",
                "Dibenzyl Ketone",
                "Methyl Propyl Ketone",
                "Ethyl Butyl Ketone",
                "Dipropyl Ketone",
                "Diisopropyl Ketone",
                "Diisobutyl Ketone",
                "Cycloheptanone",
                "Cyclooctanone",
                "Cyclononanone",
                "Cyclodecanone",
                "Cycloundecanone"
            ],
            "true_referents": [
                "2-Acetylcycloheptanone",
                "2-Methylcyclododecanone",
                "2-Tetradecanone",
                "2-Tetradecylcyclobutanone",
                "2-acetyl-4,6-dimethoxybenzoic acid",
                "3-Methyl-1-phenyl-1-butanone",
                "3-methylcyclopentanone",
                "4-propoxy-2-butanone",
                "Cyclododecanone",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetophenones",
                "benzophenone",
                "benzophenones",
                "benzylideneacetone",
                "butanone",
                "cyclobutenone",
                "cycloeucalenone",
                "cyclohexanone",
                "cyclohexanones",
                "cyclohexenone",
                "cyclopentanone",
                "cyclopentanones",
                "diacetone alcohol",
                "dialkenyl ketone",
                "dialkyl ketone",
                "dihydroxyacetone",
                "diketone",
                "hydroxycyclohexanone",
                "isophorone",
                "isophorone diisocyanate",
                "mesityl(piperidin-4-yl)methanone",
                "mesityl(piperidin-4-yl)methanone hydrochloride",
                "methyl ketone",
                "methyl propenyl ketone"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (CH3COCH3)",
            "Butanone (CH3COCH2CH3)",
            "Cyclohexanone (C6H10O)",
            "Hexan-2-one (CH3COCH2CH2CH2CH3)",
            "2-Pentanone (CH3COCH2CH2CH3)",
            "3-Pentanone (CH3COCH2CH2CH3)",
            "Cyclopentanone (C5H8O)",
            "Methyl ethyl ketone (CH3COCH2CH3)",
            "Isophorone (C9H14O)",
            "Cycloheptanone (C7H12O)",
            "4-Heptanone (CH3COCH2CH2CH2CH2CH3)",
            "Cyclooctanone (C8H14O)",
            "2-Hexanone (CH3COCH2CH2CH2CH3)",
            "3-Hexanone (CH3COCH2CH2CH2CH3)",
            "2-Heptanone (CH3COCH2CH2CH2CH2CH3)",
            "3-Heptanone (CH3COCH2CH2CH2CH2CH3)",
            "4-Hexanone (CH3COCH2CH2CH2CH3)",
            "2-Octanone (CH3COCH2CH2CH2CH2CH2CH3)",
            "3-Octanone (CH3COCH2CH2CH2CH2CH2CH3)",
            "4-Octanone (CH3COCH2CH2CH2CH2CH2CH3)",
            "2-Nonanone (CH3COCH2CH2CH2CH2CH2CH2CH3)",
            "3-Nonanone (CH3COCH2CH2CH2CH2CH2CH2CH3)",
            "4-Nonanone (CH3COCH2CH2CH2CH2CH2CH2CH3)",
            "2-Decanone (CH3COCH2CH2CH2CH2CH2CH2CH2CH3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (CH3COCH3)",
                "Butanone (CH3COCH2CH3)",
                "Cyclohexanone (C6H10O)",
                "Isophorone (C9H14O)",
                "4-Heptanone (CH3COCH2CH2CH2CH2CH3)",
                "3-Hexanone (CH3COCH2CH2CH2CH3)",
                "2-Octanone (CH3COCH2CH2CH2CH2CH2CH3)",
                "3-Octanone (CH3COCH2CH2CH2CH2CH2CH3)"
            ],
            "mismatches": [
                "Hexan-2-one (CH3COCH2CH2CH2CH3)",
                "2-Pentanone (CH3COCH2CH2CH3)",
                "3-Pentanone (CH3COCH2CH2CH3)",
                "Cyclopentanone (C5H8O)",
                "Methyl ethyl ketone (CH3COCH2CH3)",
                "Cycloheptanone (C7H12O)",
                "Cyclooctanone (C8H14O)",
                "2-Hexanone (CH3COCH2CH2CH2CH3)",
                "2-Heptanone (CH3COCH2CH2CH2CH2CH3)",
                "3-Heptanone (CH3COCH2CH2CH2CH2CH3)",
                "4-Hexanone (CH3COCH2CH2CH2CH3)",
                "4-Octanone (CH3COCH2CH2CH2CH2CH2CH3)",
                "2-Nonanone (CH3COCH2CH2CH2CH2CH2CH2CH3)",
                "3-Nonanone (CH3COCH2CH2CH2CH2CH2CH2CH3)",
                "4-Nonanone (CH3COCH2CH2CH2CH2CH2CH2CH3)",
                "2-Decanone (CH3COCH2CH2CH2CH2CH2CH2CH2CH3)"
            ],
            "true_referents": [
                "2,3-Decanedione",
                "2,4-dimethyl-3-pentanone",
                "2-(5,8-Tetradecadienyl)cyclobutanone",
                "2-(trans-2-Pentenyl)cyclopentanone",
                "2-Acetylcycloheptanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-3-hexanone",
                "2-Methyl-4-heptanone",
                "2-Tetradecylcyclobutanone",
                "2-octanone",
                "3,3,4,4-tetramethyl-2-pentanone",
                "3,3-dimethyl-2-Hexanone",
                "3-Cyclohepten-1-one",
                "3-Hexanone-2,2,4,4-d4",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methyl-2,4-nonanedione",
                "3-Methylene-2-octanone",
                "3-Methylhexan-2-one",
                "3-decanone",
                "3-hexanone",
                "3-octanone",
                "4-Methylhexan-2-one",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "4S-Methylhexan-3-one",
                "Cyclododecanone",
                "Cyclopentanone, 3-methyl-2-(2-pentenyl)-",
                "Ethyl isopropyl ketone",
                "Nonan-2,5-dione",
                "acetone",
                "acetone d6",
                "butanone",
                "cyclohexanone",
                "cyclohexanone, 4-(1,1-dimethylethyl)-",
                "cyclopentanone",
                "hexanone",
                "hydroxycyclohexanone",
                "isophorone",
                "isophorone diisocyanate",
                "methyl ketone",
                "methyl propenyl ketone",
                "nonane-4,6-dione"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (Propanone)",
            "Butanone (Methyl Ethyl Ketone, MEK)",
            "Cyclohexanone",
            "Benzophenone",
            "Acetoacetone (2,4-Pentanedione)",
            "Diethyl Ketone",
            "Methyl Isobutyl Ketone (MIBK)",
            "Camphor",
            "Testosterone",
            "Progesterone",
            "Acetophenone",
            "2-Pentanone",
            "Acetoin (3-Hydroxy-2-Butanone)",
            "Ethyl Methyl Ketone",
            "Methyl Ethyl Ketone Peroxide",
            "Meldrum's Acid",
            "Camphorquinone",
            "Acetylacetone",
            "Cyclopentanone",
            "2-Butanone",
            "2-Heptanone",
            "3-Heptanone",
            "2-Octanone",
            "3-Octanone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (Propanone)",
                "Butanone (Methyl Ethyl Ketone, MEK)",
                "Cyclohexanone",
                "Benzophenone",
                "Methyl Isobutyl Ketone (MIBK)",
                "Camphor",
                "Testosterone",
                "Progesterone",
                "Acetophenone",
                "Acetoin (3-Hydroxy-2-Butanone)",
                "Acetylacetone",
                "Cyclopentanone",
                "2-Octanone",
                "3-Octanone"
            ],
            "mismatches": [
                "Acetoacetone (2,4-Pentanedione)",
                "Diethyl Ketone",
                "2-Pentanone",
                "Ethyl Methyl Ketone",
                "Methyl Ethyl Ketone Peroxide",
                "Meldrum's Acid",
                "Camphorquinone",
                "2-Butanone",
                "2-Heptanone",
                "3-Heptanone"
            ],
            "true_referents": [
                "(R)-acetoin",
                "1-Hydroxy-2-pentanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-4-heptanone",
                "2-octanone",
                "3-Hydroxy-2-pentanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methylene-2-octanone",
                "3-hexanone",
                "3-methylcyclopentanone",
                "3-octanone",
                "4-Methyl-2,3-pentanedione",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "Acetoxyacetone",
                "Dioctylketone",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "acetoin",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetophenones",
                "acetylacetonate",
                "acetylacetone",
                "anthraquinone",
                "benzophenone",
                "benzophenones",
                "benzoquinone",
                "butanone",
                "camphor",
                "cyclohexanone",
                "cyclohexanones",
                "cyclopentanone",
                "cyclopentanones",
                "dialkyl ketone",
                "hydroxyacetone",
                "hydroxycyclohexanone",
                "kermesic acid",
                "methyl ketone",
                "methyl propenyl ketone",
                "morellic acid",
                "naphthoquinone",
                "pentanone",
                "progesterone",
                "testosterone"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (CH3COCH3)",
            "Butanone (MEK)",
            "Acetophenone",
            "Cyclohexanone",
            "Benzophenone",
            "Acetylacetone",
            "Camphor",
            "2-Pentanone",
            "3-Pentanone",
            "4-Heptanone",
            "Acetoacetic acid",
            "Beta-hydroxybutyric acid",
            "Acetoacetyl-CoA",
            "Isopropyl methyl ketone",
            "Methyl isobutyl ketone (MIBK)",
            "Diacetyl",
            "Acetoin",
            "Cyclopentanone",
            "2-Octanone",
            "Menthone",
            "Carvone",
            "Jasmone",
            "Muscone",
            "Raspberry ketone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (CH3COCH3)",
                "Butanone (MEK)",
                "Acetophenone",
                "Cyclohexanone",
                "Benzophenone",
                "Acetylacetone",
                "Camphor",
                "4-Heptanone",
                "Methyl isobutyl ketone (MIBK)",
                "Acetoin",
                "Cyclopentanone",
                "2-Octanone",
                "Jasmone",
                "Muscone",
                "Raspberry ketone"
            ],
            "mismatches": [
                "2-Pentanone",
                "3-Pentanone",
                "Acetoacetic acid",
                "Beta-hydroxybutyric acid",
                "Acetoacetyl-CoA",
                "Isopropyl methyl ketone",
                "Diacetyl",
                "Menthone",
                "Carvone"
            ],
            "true_referents": [
                "(-)-methyl jasmonate",
                "(S)-2-acetyl-2-hydroxybutanoic acid",
                "1,3-Diacetylpropane",
                "1-Hydroxy-2-pentanone",
                "11-oxo-ETE-CoA",
                "2,4-dimethyl-3-pentanone",
                "2-Methyl-3-heptanone",
                "2-Methyl-4-heptanone",
                "2-octanone",
                "3-Hydroxy-2-pentanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methylene-2-octanone",
                "3-methylcyclopentanone",
                "3-octanone",
                "4-Hydroxy-3-methyl-2-butanone",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "Acetoin acetate",
                "Acetoxyacetone",
                "Dioctylketone",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Jasmone",
                "Methyl isobutyl ketone",
                "Muscomosin",
                "Muscone",
                "acetoin",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetophenones",
                "acetylacetonate",
                "acetylacetone",
                "alpha-hydroxy ketone",
                "benzophenone",
                "benzophenones",
                "beta-hydroxy ketone",
                "butanone",
                "camphor",
                "cyclohexanone",
                "cyclohexanones",
                "cyclopentanone",
                "cyclopentanones",
                "dehydroacetic acid",
                "hydroxycyclohexanone",
                "methyl ketone",
                "monoterpene ketone",
                "muqubilone",
                "p-menthadien-3-one",
                "pentanone",
                "piperitone",
                "raspberry ketone",
                "terpene ketone",
                "trans-Jasmone",
                "triacetic acid"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (CH3COCH3)",
            "Acetophenone (C6H5COCH3)",
            "Benzophenone ((C6H5)2CO)",
            "Butanone (MEK, CH3COC2H5)",
            "Camphor (C10H16O)",
            "Cyclohexanone (C6H10O)",
            "Cyclopentanone (C5H8O)",
            "Diacetyl (CH3COCOCH3)",
            "Ethyl levulinate (C7H12O3)",
            "Fructose (C6H12O6)",
            "Hydroxymethylglyoxal (C3H4O3)",
            "Isophorone (C9H14O)",
            "Menthone (C10H18O)",
            "Methyl acetoacetate (C5H8O3)",
            "Methyl isobutyl ketone (MIBK, (CH3)2CHCH2COCH3)",
            "Methyl vinyl ketone (MVK, CH2CHCOCH3)",
            "Pentanedione (CH3COCOCH2CH3)",
            "Perillyl alcohol ((S)-(-)-Perillyl alcohol, C10H16O)",
            "Propiophenone (C6H5COCH2CH3)",
            "Pyruvic acid (CH3COCOOH)",
            "Raspberry ketone (4-(4-Hydroxyphenyl)butan-2-one, C10H12O2)",
            "Sulcatone (6-Methyl-5-hepten-2-one, C8H14O)",
            "Triacetone alcohol ((CH3)2C(OH)CH2COCH3)",
            "\u03b2-Hydroxybutyric acid (BHB, C4H8O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "acetophenone",
                "benzophenone",
                "butanone",
                "camphor",
                "cyclohexanone",
                "cyclopentanone",
                "isophorone",
                "methyl isobutyl ketone",
                "propiophenone",
                "raspberry ketone",
                "sulcatone"
            ],
            "mismatches": [
                "Acetone (CH3COCH3)",
                "Acetophenone (C6H5COCH3)",
                "Benzophenone ((C6H5)2CO)",
                "Butanone (MEK, CH3COC2H5)",
                "Camphor (C10H16O)",
                "Cyclohexanone (C6H10O)",
                "Cyclopentanone (C5H8O)",
                "Diacetyl (CH3COCOCH3)",
                "Ethyl levulinate (C7H12O3)",
                "Fructose (C6H12O6)",
                "Hydroxymethylglyoxal (C3H4O3)",
                "Isophorone (C9H14O)",
                "Menthone (C10H18O)",
                "Methyl acetoacetate (C5H8O3)",
                "Methyl vinyl ketone (MVK, CH2CHCOCH3)",
                "Pentanedione (CH3COCOCH2CH3)",
                "Perillyl alcohol ((S)-(-)-Perillyl alcohol, C10H16O)",
                "Propiophenone (C6H5COCH2CH3)",
                "Pyruvic acid (CH3COCOOH)",
                "Raspberry ketone (4-(4-Hydroxyphenyl)butan-2-one, C10H12O2)",
                "Sulcatone (6-Methyl-5-hepten-2-one, C8H14O)",
                "Triacetone alcohol ((CH3)2C(OH)CH2COCH3)",
                "\u03b2-Hydroxybutyric acid (BHB, C4H8O3)"
            ],
            "true_referents": [
                "(+)-(12E,2S,3S,4R,5R,6R,9S,11S,15R)-3-benzoyloxy-5,6-epoxylathyr-12-en-15-ol-14-one",
                "(-)-(12E,2S,3S,4R,5R,6R,9S,11S,15R)-3-acetoxy-5,6-epoxylathyr-12-en-15-ol-14-one",
                "(S)-2-acetyl-2-hydroxybutanoic acid",
                "1,3-Diacetylpropane",
                "1,5-anhydro-D-fructose",
                "1-(2-Furanyl)-1-pentanone",
                "1-(2-furanyl)-1-Octanone",
                "2',4'-Dimethoxypropiophenone",
                "2'-Hydroxyfurano[2'',3'':4',3']chalcone",
                "2'-methyl-Propiophenone",
                "2,3',4,6-tetrahydroxybenzophenone",
                "2,4-dimethyl-3-pentanone",
                "2-(2-methyl-4-oxo-3-pyranyl)acetaldehyde",
                "2-(trans-2-Pentenyl)cyclopentanone",
                "2-ethyl-4-hydroxy-5-methyl-3(2H)-furanone",
                "3-Mercapto-2-pentanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-deoxy-keto-D-fructose",
                "3-hydroxy-3-methyl-2-oxobutanoic acid",
                "4'-Methoxybenzophenone-2-carboxylic acid",
                "4-Hydroxy-3-methyl-2-butanone",
                "4-Methyl-2,3-pentanedione",
                "4-propoxy-2-butanone",
                "Acetoin acetate",
                "Acetoxyacetone",
                "Cyclopentanone, 3-methyl-2-(2-pentenyl)-",
                "Ethyl isobutyl ketone",
                "Methyl isobutyl ketone",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetylacetone",
                "acetylpyruvic acid",
                "benzophenone",
                "butanone",
                "camphor",
                "cyclohexanone",
                "cyclohexanone, 4-(1,1-dimethylethyl)-",
                "cyclopentanone",
                "hydroxycyclohexanone",
                "isophorone",
                "isophorone diisocyanate",
                "methyl 4-hydroxy-3-(3-methylbutanoyl)benzoate",
                "methyl ketone",
                "methyl phenylglyoxalate",
                "methyl propenyl ketone",
                "methyl pyruvate",
                "methylglyoxal",
                "p-Ethylacetophenone",
                "p-menthadien-3-one",
                "pentane-2,3-dione",
                "propiophenone",
                "raspberry ketone",
                "sulcatone",
                "triacetic acid"
            ],
            "TP": 12,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (CH3COCH3)",
            "Acetylacetone (CH3COCH2COCH3)",
            "Benzophenone (C6H5COC6H5)",
            "Camphor (C10H16O)",
            "Cyclohexanone (C6H10O)",
            "Diacetyl (CH3COCOCH3)",
            "Diethyl ketone (CH3COC2H5)",
            "Ethyl methyl ketone (CH3COC2H5)",
            "Fenchone (C10H16O)",
            "Isophorone (C9H14O)",
            "Menthone (C10H18O)",
            "Methyl isopropyl ketone (CH3COCH(CH3)2)",
            "Methyl vinyl ketone (CH3COCH=CH2)",
            "Pulegone (C10H16O)",
            "Raspberry ketone (C10H12O2)",
            "Stearone (CH3(CH2)15COCH3)",
            "Thujone (C10H16O)",
            "Acetoacetic acid (CH3COCH2COOH)",
            "Acetoacetyl-CoA (CH3COCH2CO-CoA)",
            "Acetoacetylcholine (CH3COCH2CH2N(CH3)3+)",
            "Acetylacetone enolate (CH3COCH=C(O-)CH3)",
            "\u03b2-Hydroxybutyrate (CH3CH(OH)CH2COOH)",
            "Mevalonic acid (HO-C(CH2)2COCH2COOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (CH3COCH3)",
                "Acetylacetone (CH3COCH2COCH3)",
                "Benzophenone (C6H5COC6H5)",
                "Camphor (C10H16O)",
                "Cyclohexanone (C6H10O)",
                "Fenchone (C10H16O)",
                "Isophorone (C9H14O)",
                "Raspberry ketone (C10H12O2)",
                "Thujone (C10H16O)"
            ],
            "mismatches": [
                "Diacetyl (CH3COCOCH3)",
                "Diethyl ketone (CH3COC2H5)",
                "Ethyl methyl ketone (CH3COC2H5)",
                "Menthone (C10H18O)",
                "Methyl isopropyl ketone (CH3COCH(CH3)2)",
                "Methyl vinyl ketone (CH3COCH=CH2)",
                "Pulegone (C10H16O)",
                "Stearone (CH3(CH2)15COCH3)",
                "Acetoacetic acid (CH3COCH2COOH)",
                "Acetoacetyl-CoA (CH3COCH2CO-CoA)",
                "Acetoacetylcholine (CH3COCH2CH2N(CH3)3+)",
                "Acetylacetone enolate (CH3COCH=C(O-)CH3)",
                "\u03b2-Hydroxybutyrate (CH3CH(OH)CH2COOH)",
                "Mevalonic acid (HO-C(CH2)2COCH2COOH)"
            ],
            "true_referents": [
                "(+)-beta-thujone",
                "(+)-pulegone",
                "(1S,4R)-fenchone",
                "(2,3,3-trimethyl-5-oxocyclopent-3-enyl)acetyl-CoA",
                "(25S)-3-oxocholest-4-en-26-oyl-CoA",
                "(S)-2-acetyl-2-hydroxybutanoic acid",
                "1,3-Diacetylpropane",
                "2',6'-dimethoxy-4'-hydroxyacetophenone",
                "2,4-dimethyl-3-pentanone",
                "24-ethylcholesta-4,22-dien-3-one",
                "3-oxocholoyl-CoA",
                "3beta-hydroxy-5alpha-cholestan-15-one",
                "4-Hydroxy-3-methyl-2-butanone",
                "4-acetylchrysophanol",
                "6-Acetylpicropolin",
                "Acetoin acetate",
                "Acetyl-methylcholine",
                "Dioctylketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "N-(2-benzoyl-1-methylvinyl)acetamide",
                "Pulegenone",
                "acetone",
                "acetone d6",
                "acetylacetonate",
                "acetylacetone",
                "benzophenone",
                "benzophenones",
                "beta-diketone",
                "camphor",
                "cyclohexanone",
                "cyclohexanone, 4-(1,1-dimethylethyl)-",
                "dehydroacetic acid",
                "dialkyl ketone",
                "diketone",
                "fenchone",
                "hydroxycyclohexanone",
                "isophorone",
                "isophorone diisocyanate",
                "methyl 4-hydroxy-3-(3-methylbutanoyl)benzoate",
                "methyl ketone",
                "methyl propenyl ketone",
                "p-Ethylacetophenone",
                "p-menthadien-3-one",
                "raspberry ketone",
                "thujone",
                "triacetic acid"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (ACT)",
            "Butanone (MEK)",
            "Cyclohexanone (CYC)",
            "Diacetyl (DAC)",
            "Ethyl Methyl Ketone (EMK)",
            "Heptanone (HEP)",
            "Hexanone (HEX)",
            "Isobutyl Methyl Ketone (IBMK)",
            "Isophorone (IPH)",
            "Methyl Acetone (MAC)",
            "Methyl Amyl Ketone (MAK)",
            "Methyl Ethyl Ketone (MEK)",
            "Methyl Isobutyl Ketone (MIBK)",
            "Methyl n-Propyl Ketone (MPK)",
            "Methyl Phenyl Ketone (MPK)",
            "Methyl Propyl Ketone (MPK)",
            "Octanone (OCT)",
            "Pentan-2-one (PEN)",
            "Propanone (ACT)",
            "Propiophenone (PPH)",
            "Quinone (QUI)",
            "Triacetone Triperoxide (TATP)",
            "Undecanone (UND)",
            "Xanthone (XAN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "butanone",
                "cyclohexanone",
                "hexanone",
                "isophorone",
                "methyl isobutyl ketone",
                "pentan-2-one",
                "propiophenone",
                "quinone",
                "xanthone"
            ],
            "mismatches": [
                "Diacetyl (DAC)",
                "Ethyl Methyl Ketone (EMK)",
                "Heptanone (HEP)",
                "Isobutyl Methyl Ketone (IBMK)",
                "Methyl Acetone (MAC)",
                "Methyl Amyl Ketone (MAK)",
                "Methyl Ethyl Ketone (MEK)",
                "Methyl n-Propyl Ketone (MPK)",
                "Methyl Phenyl Ketone (MPK)",
                "Methyl Propyl Ketone (MPK)",
                "Octanone (OCT)",
                "Triacetone Triperoxide (TATP)",
                "Undecanone (UND)"
            ],
            "true_referents": [
                "1,3,5,6-tetrahydroxy-4,7,8-tri(3-methyl-2-butenyl)xanthone",
                "1,3-Diacetylpropane",
                "1-phenyl-2-hexanone",
                "2'-methyl-Propiophenone",
                "2-Methyl-3-heptanone",
                "2-Methyl-4-heptanone",
                "2-octanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methylene-2-octanone",
                "3-hexanone",
                "3-methylcyclohexanone",
                "3-octanone",
                "4-heptanone",
                "4-propoxy-2-butanone",
                "6-Undecanone",
                "Dioctylketone",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "acetone",
                "aminoacetone",
                "butanone",
                "cyclohexanone",
                "cyclohexanones",
                "diacetone alcohol",
                "diketone",
                "extended quinone",
                "hexanone",
                "isophorone",
                "isophorone diisocyanate",
                "m-quinone",
                "methyl ketone",
                "methyl propenyl ketone",
                "p-Hydroxypropiophenone",
                "pentan-2-one",
                "pentan-3-one",
                "propanones",
                "propiophenone",
                "quinone",
                "triptonoterpene",
                "triptonoterpenol",
                "undecan-2-one",
                "xanthone",
                "xanthones"
            ],
            "TP": 10,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (2-propanone)",
            "Butanone (methyl ethyl ketone)",
            "Pentan-2-one",
            "Hexan-3-one",
            "Heptan-4-one",
            "Octan-5-one",
            "Nonan-6-one",
            "Decan-7-one",
            "Undecan-8-one",
            "Dodecan-9-one",
            "Tridecan-10-one",
            "Tetradecan-11-one",
            "Pentadecan-12-one",
            "Hexadecan-13-one",
            "Heptadecan-14-one",
            "Octadecan-15-one",
            "Nonadecan-16-one",
            "Eicosan-17-one",
            "Docosan-18-one",
            "Tetracosan-19-one",
            "Hexacosan-20-one",
            "Octacosan-21-one",
            "Triacontan-22-one",
            "Tetratriacontan-23-one",
            "Pentatriacontan-24-one",
            "Phenylacetone (\u03b1-acetophenone)",
            "Methyl ethyl ketoxime",
            "Diethyl ketone",
            "Diacetone alcohol",
            "Methyl isopropyl ketone",
            "Cyclohexanone",
            "Acetoacetate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (2-propanone)",
                "Butanone (methyl ethyl ketone)",
                "Pentan-2-one"
            ],
            "mismatches": [
                "Hexan-3-one",
                "Heptan-4-one",
                "Octan-5-one",
                "Nonan-6-one",
                "Decan-7-one",
                "Undecan-8-one",
                "Dodecan-9-one",
                "Tridecan-10-one",
                "Tetradecan-11-one",
                "Pentadecan-12-one",
                "Hexadecan-13-one",
                "Heptadecan-14-one",
                "Octadecan-15-one",
                "Nonadecan-16-one",
                "Eicosan-17-one",
                "Docosan-18-one",
                "Tetracosan-19-one",
                "Hexacosan-20-one",
                "Octacosan-21-one",
                "Triacontan-22-one",
                "Tetratriacontan-23-one",
                "Pentatriacontan-24-one",
                "Phenylacetone (\u03b1-acetophenone)",
                "Methyl ethyl ketoxime",
                "Diethyl ketone",
                "Diacetone alcohol",
                "Methyl isopropyl ketone",
                "Cyclohexanone",
                "Acetoacetate"
            ],
            "true_referents": [
                "1,14-Pentadecadien-3-one",
                "1,5-Octadien-3-one",
                "1-Decen-3-one",
                "1-Hexadecen-3-one",
                "1-Tetradecen-3-one",
                "1-penten-3-one",
                "12Z-Nonadecen-9-one",
                "17beta,21beta-epoxyhopan-3-one",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-triacontanone",
                "3-Methyl-1-phenyl-1-butanone",
                "3-Methylhexan-2-one",
                "3-Methylpentadecan-2-one",
                "4-propoxy-2-butanone",
                "5-Octen-2-one",
                "6Z-Eicosen-11-one",
                "7-Tridecen-2-one",
                "7-octen-2-one",
                "7Z-Eicosen-11-one",
                "8-Nonen-2-one",
                "Heneicosan-2-one",
                "Heptacosane-6,8-dione",
                "Heptadecan-2-one",
                "Hexadec-8-en-2-one",
                "Hexadecan-2-one",
                "Hexadecan-3-one",
                "Nonan-3-one",
                "Nonan-4-one",
                "acetone",
                "butanone",
                "decan-2-one",
                "hentriacontan-16-one",
                "heptan-2-one",
                "heptan-3-one",
                "indan-1-one",
                "indan-2-one",
                "nonacosan-10-one",
                "nonan-2-one",
                "pentan-2-one",
                "pentan-3-one",
                "tridecan-2-one",
                "undecan-2-one"
            ],
            "TP": 3,
            "FP": 29,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "ketone",
        "domain": "chemistry",
        "response": [
            "Acetone (ACN)",
            "Acetophenone (ACPH)",
            "Butanone (BUT)",
            "Hexanone (HEX)",
            "Cyclohexanone (CYH)",
            "Methyl ethyl ketone (MEK)",
            "Methyl isobutyl ketone (MIBK)",
            "Diacetyl (DA)",
            "Dimethyl ketone (DMK)",
            "3-Hydroxy-2-butanone (3H2B)",
            "2-Butanone (2B)",
            "1-Hydroxy-2-propanone (1H2P)",
            "Ethyl methyl ketone (EMK)",
            "Isophorone (ISOPH)",
            "Mesityl oxide (MESOX)",
            "Dihydromyrcenone (DHM)",
            "Curcumenone (CURC)",
            "Dehydroacetic acid (DHAA)",
            "Indanone (IND)",
            "Tetralone (TET)",
            "Fluorenone (FLUOR)",
            "Acephenone (ACEPH)",
            "Oxindole (OXIND)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetone",
                "acetophenone",
                "butanone",
                "hexanone",
                "cyclohexanone",
                "methyl isobutyl ketone",
                "isophorone",
                "dehydroacetic acid",
                "indanone"
            ],
            "mismatches": [
                "Acetone (ACN)",
                "Acetophenone (ACPH)",
                "Butanone (BUT)",
                "Hexanone (HEX)",
                "Cyclohexanone (CYH)",
                "Methyl ethyl ketone (MEK)",
                "Diacetyl (DA)",
                "Dimethyl ketone (DMK)",
                "3-Hydroxy-2-butanone (3H2B)",
                "2-Butanone (2B)",
                "1-Hydroxy-2-propanone (1H2P)",
                "Ethyl methyl ketone (EMK)",
                "Mesityl oxide (MESOX)",
                "Dihydromyrcenone (DHM)",
                "Curcumenone (CURC)",
                "Indanone (IND)",
                "Tetralone (TET)",
                "Fluorenone (FLUOR)",
                "Acephenone (ACEPH)",
                "Oxindole (OXIND)"
            ],
            "true_referents": [
                "(+)-ascomindone D",
                "1,3-Diacetylpropane",
                "1,4-Dibromodiacetyl",
                "1-phenyl-2-hexanone",
                "2,3-bis(hydroxymethyl)-7-hydroxy-6-methoxy-1-tetralone",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-hydroxy-6-oxo-2,4-heptadienoic acid",
                "2-methyl-1-tetralone",
                "3-Hydroxy-1-indanone",
                "3-cyano-2-butanone",
                "3-hexanone",
                "3-methoxy-3-methyl-2-butanone",
                "3-methylcyclohexanone",
                "4-Hydroxy-3-methyl-2-butanone",
                "4-propoxy-2-butanone",
                "Butylone",
                "Curvulone B",
                "Curvulone C",
                "Ethyl isobutyl ketone",
                "Ethyl isopropyl ketone",
                "Methyl isobutyl ketone",
                "Oxindanac",
                "Viridicatumone A",
                "acetone",
                "acetone d6",
                "acetophenone",
                "acetophenones",
                "butanone",
                "cyclohexanone",
                "dehydroacetic acid",
                "dialkyl ketone",
                "dihydromyricetin",
                "dihydroxyacetone",
                "fluanisone",
                "fluoren-9-one",
                "fluoren-9-ones",
                "hexanone",
                "hydroxycyclohexanone",
                "indan-2-one oxime",
                "indanone",
                "indanones",
                "isophorone",
                "isophorone diisocyanate",
                "mesityl(piperidin-4-yl)methanone",
                "mesityl(piperidin-4-yl)methanone hydrochloride",
                "methyl ketone",
                "methyl propenyl ketone",
                "mexenone",
                "propiophenone",
                "teprenone"
            ],
            "TP": 9,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "ketone",
        "domain": "chemistry",
        "response": "[\n        {\n            \"Referent\": \"acetone\",\n            \"Canonical name\": \"(CH3)2CO\"\n        },\n        {\n            \"Referent\": \"diacetyl\",\n            \"Canonical name\": \"(CH3CO)2O\"\n        },\n        {\n            \"Referent\": \"dihydroxyacetone\",\n            \"Canonical name\": \"C3H6O2\"\n        },\n        {\n            \"Referent\": \"methylglyoxal\",\n            \"Canonical name\": \"C3H4O2\"\n        },\n        {\n            \"Referent\": \"pyruvic acid\",\n            \"Canonical name\": \"C3H4O3\"\n        },\n        {\n            \"Referent\": \"acetophenone\",\n            \"Canonical name\": \"(CH3)2C6H5\"\n        },\n        {\n            \"Referent\": \"benzaldehyde\",\n            \"Canonical name\": (CH3)2C6H3CHO\n        },\n        {\n            \"Referent\": \"2-butanone\",\n            \"Canonical name\": (CH3)2C4H6O\n        },\n        {\n            \"Referent\": \"methyl isopropyl ketone\",\n            \"Canonical name\": (CH3)2C5HIO\n        },\n        {\n            \"Referent\": \"methyl vinyl ketone\",\n            \"Canonical name\": (CH3)2C3H2O\n        },\n        {\n            \"Referent\": \"cyclopentanone\",\n            \"Canonical name\": (CH3)2C3H2CO\n        },\n        {\n            \"Referent\": \"2-hexanone\",\n            \"Canonical name\": (CH3)2C4H8O\n        },\n        {\n            \"Referent\": \"2-pentanone\",\n            \"Canonical name\": (CH3)2C3H4O\n        },\n        {\n            \"Referent\": \"3-pentanone\",\n            \"Canonical name\": (CH3)2C3H2O\n        },\n        {\n            \"Referent\": \"2-heptanone\",\n            \"Canonical name\": (CH3)2C3H2CO\n        },\n        {\n            \"Referent\": \"2-octanone\",\n            \"Canonical name\": (CH3)2C3H2CO\n        },\n        {\n            \"Referent\": \"3-octanone\",\n            \"Canonical name\": (CH3)2C3H2O\n        },\n        {\n            \"Referent\": \"2-nonanone\",\n            \"Canonical name\": (CH3)2C3H2CO\n        },\n        {\n            \"Referent\": \"2-undecanone\",\n            \"Canonical name\": (CH3)2C3H2CO\n        },\n        {\n            \"Referent\": \"3-undecanone\",\n            \"Canonical name\": (CH3)2C3H2O\n        },\n        {\n            \"Referent\": \"2-dodecanone\",\n            \"Canonical name\": (CH3)2C3H2CO\n        },\n        {\n            \"Referent\": \"3-dodecanone\",\n            \"Canonical name\": (CH3)2C3H2O\n        },\n        {\n            \"Referent\": \"3-hexen-2-one\",\n            \"Canonical name\": (CH3)2C4H6O\n        },\n        {\n            \"Referent\": \"3-hepten-2-one\",\n            \"Canonical name\": (CH3)2C4H6O\n        },\n        {\n            \"Referent\": \"3-octen-2-one\",\n            \"Canonical name\": (CH3)2C4H6O\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]