[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Glycerol (Glyc)",
            "Ethylene glycol (EG)",
            "1,2-Propanediol (1,2-Pr)",
            "1,3-Propanediol (1,3-Pr)",
            "1,2-Butanediol (1,2-Bu)",
            "1,3-Butanediol (1,3-Bu)",
            "1,4-Butanediol (1,4-Bu)",
            "2,3-Butanediol (2,3-Bu)",
            "Thiodiglycol (TDG)",
            "Diethylene glycol (DEG)",
            "Triethylene glycol (TEG)",
            "1,5-Pentanediol (1,5-Pe)",
            "1,6-Hexanediol (1,6-Hx)",
            "1,7-Heptanediol (1,7-Hp)",
            "1,8-Octanediol (1,8-Oc)",
            "1,9-Nonanediol (1,9-Nn)",
            "1,10-Decanediol (1,10-Dc)",
            "1,2-Cyclohexanediol (1,2-Chd)",
            "1,3-Cyclohexanediol (1,3-Chd)",
            "1,4-Cyclohexanediol (1,4-Chd)",
            "Resorcinol (Res)",
            "Hydroquinone (HQ)",
            "Dihydroxyacetone phosphate (DHAP)",
            "2,3-Butanedione monoxime (DMN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (EG)",
                "1,2-Propanediol (1,2-Pr)",
                "1,3-Propanediol (1,3-Pr)",
                "1,3-Butanediol (1,3-Bu)",
                "2,3-Butanediol (2,3-Bu)",
                "Thiodiglycol (TDG)",
                "Triethylene glycol (TEG)"
            ],
            "mismatches": [
                "Glycerol (Glyc)",
                "1,2-Butanediol (1,2-Bu)",
                "1,4-Butanediol (1,4-Bu)",
                "Diethylene glycol (DEG)",
                "1,5-Pentanediol (1,5-Pe)",
                "1,6-Hexanediol (1,6-Hx)",
                "1,7-Heptanediol (1,7-Hp)",
                "1,8-Octanediol (1,8-Oc)",
                "1,9-Nonanediol (1,9-Nn)",
                "1,10-Decanediol (1,10-Dc)",
                "1,2-Cyclohexanediol (1,2-Chd)",
                "1,3-Cyclohexanediol (1,3-Chd)",
                "1,4-Cyclohexanediol (1,4-Chd)",
                "Resorcinol (Res)",
                "Hydroquinone (HQ)",
                "Dihydroxyacetone phosphate (DHAP)",
                "2,3-Butanedione monoxime (DMN)"
            ],
            "true_referents": [
                "(-)-secoisolariciresinol",
                "(18R)-resolvin E3",
                "(2R,3S)-2-aminooctadec-4-ene-1,3-diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R)-monothioglycerol",
                "(R)-propane-1,2-diol",
                "(R,R)-hydrobenzoin",
                "1,1-dimethoxyethane",
                "1,2-dimethoxyethane",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,5-tetradecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,7-tetradecanediol",
                "1,9-decanediol",
                "2-aminooctadecene-1,3-diol",
                "2-hydroxypropyl dihydrogen phosphate",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "3beta-acetoxy-15alpha,22-dihydroxyhopane",
                "L-glycol",
                "butane-1,3-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-cyclohexane-1,2-diol",
                "cyclohexadienediol",
                "cyclohexane-1,2-diol",
                "decane-1,2-diol",
                "dimethoxymethane",
                "ethylene glycol",
                "glycol",
                "hydrobenzoin",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propane-1,3-diol",
                "propanediol",
                "thiodiglycol",
                "trans-3-ethenylcyclohexa-3,5-diene-1,2-diol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "1,2-Propanediol (Propylene glycol, PG)",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,5-Pentanediol",
            "1,6-Hexanediol",
            "Ethylene glycol dimethyl ether",
            "1,2-Cyclohexanediol",
            "1,3-Cyclohexanediol",
            "1,4-Cyclohexanediol",
            "1,5-Cyclohexanediol",
            "1,2-Ethanediol (Ethylene glycol)",
            "1,3-Benzenediol (Pyrocatechol)",
            "1,2-Benzenediol (Catechol)",
            "1,4-Benzenediol (Hydroquinone)",
            "2,3-Butanediol",
            "2,5-Hexanediol",
            "2,6-Dimethyl-1,3-benzenediol (Resorcinol)",
            "2,2'-Methylenebis(4-chlorophenol)",
            "2,3-Butanediol (2,3-Dihydroxybutane)",
            "3,4-Dihydroxybenzoic acid (Protocatechuic acid)",
            "3,5-Diiodothyronine",
            "3,4-Dihydroxyphenylalanine (DOPA)",
            "3,5-Dihydroxy-L-tyrosine",
            "1,2-Dimethoxyethane (DME)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,4-Butanediol",
                "2,3-Butanediol"
            ],
            "mismatches": [
                "Ethylene glycol (EG)",
                "1,2-Propanediol (Propylene glycol, PG)",
                "1,3-Butanediol",
                "1,5-Pentanediol",
                "1,6-Hexanediol",
                "Ethylene glycol dimethyl ether",
                "1,2-Cyclohexanediol",
                "1,3-Cyclohexanediol",
                "1,4-Cyclohexanediol",
                "1,5-Cyclohexanediol",
                "1,2-Ethanediol (Ethylene glycol)",
                "1,3-Benzenediol (Pyrocatechol)",
                "1,2-Benzenediol (Catechol)",
                "1,4-Benzenediol (Hydroquinone)",
                "2,5-Hexanediol",
                "2,6-Dimethyl-1,3-benzenediol (Resorcinol)",
                "2,2'-Methylenebis(4-chlorophenol)",
                "2,3-Butanediol (2,3-Dihydroxybutane)",
                "3,4-Dihydroxybenzoic acid (Protocatechuic acid)",
                "3,5-Diiodothyronine",
                "3,4-Dihydroxyphenylalanine (DOPA)",
                "3,5-Dihydroxy-L-tyrosine",
                "1,2-Dimethoxyethane (DME)"
            ],
            "true_referents": [
                "(10S)-Juvenile hormone III diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(6R)-5,6,7,8-tetrahydrobiopterin",
                "(6R)-L-threo-tetrahydrobiopterin",
                "(R)-propane-1,2-diol",
                "(S)-chlorphenesin",
                "(Z)-1,2-ethenediol",
                "1,2-bis(3,4-dimethoxyphenyl)propane-1,3-diol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-dihydroxybutan-2-one",
                "1,3-dodecanediol",
                "1,4-dodecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1-(3,4-dimethoxyphenyl)ethane-1,2-diol",
                "2,3-bis(4-hydroxyphenyl)-1,2-propanediol",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-hydroxyethyl salicylate",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "24,25-dihydroxydammar-20-en-3-one",
                "4'-chlorobiphenyl-2,3-diol",
                "DDT-2,3-dihydrodiol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "calcidiol 3-O-(beta-D-glucuronide)",
                "cis-1,2-dihydro-3-ethylcatechol",
                "cis-cyclohexane-1,2-diol",
                "cyclohex-3-ene-1,2-diol",
                "cyclohexane-1,2-diol",
                "diethylene glycol monoethyl ether",
                "diisopropanolamine",
                "ethanediol",
                "ethylene glycol",
                "ethylene glycol monododecyl ether",
                "hexane-1,6-diol",
                "hexane-2,5-diol",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 2,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (1,2-Ethanediol)",
            "Propylene glycol (1,2-Propanediol)",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2-Pentanediol",
            "1,3-Pentanediol",
            "1,4-Pentanediol",
            "1,5-Pentanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "1,4-Hexanediol",
            "1,5-Hexanediol",
            "1,6-Hexanediol",
            "1,2-Octanediol",
            "1,3-Octanediol",
            "1,4-Octanediol",
            "1,5-Octanediol",
            "1,6-Octanediol",
            "1,8-Octanediol",
            "1,2-Decanediol",
            "1,3-Decanediol",
            "1,4-Decanediol",
            "1,5-Decanediol",
            "1,10-Decanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (1,2-Ethanediol)",
                "1,3-Butanediol",
                "1,4-Butanediol",
                "1,6-Hexanediol",
                "1,2-Octanediol",
                "1,8-Octanediol",
                "1,2-Decanediol"
            ],
            "mismatches": [
                "Propylene glycol (1,2-Propanediol)",
                "1,2-Pentanediol",
                "1,3-Pentanediol",
                "1,4-Pentanediol",
                "1,5-Pentanediol",
                "1,2-Hexanediol",
                "1,3-Hexanediol",
                "1,4-Hexanediol",
                "1,5-Hexanediol",
                "1,3-Octanediol",
                "1,4-Octanediol",
                "1,5-Octanediol",
                "1,6-Octanediol",
                "1,3-Decanediol",
                "1,4-Decanediol",
                "1,5-Decanediol",
                "1,10-Decanediol"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,4-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2-methylene-1,4-butanediol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "decane-1,2-diol",
                "ethylene glycol",
                "ethylene glycol bis(2-aminoethyl)tetraacetate",
                "hexane-1,6-diol",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propanediol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene Glycol (EG)",
            "Propylene Glycol (PG)",
            "1,2-Propanediol",
            "1,3-Propanediol",
            "Glycerol (GLY)",
            "Butanediol (BDO)",
            "1,4-Butanediol",
            "2,3-Butanediol",
            "Pentanediol",
            "1,5-Pentanediol",
            "Hexanediol",
            "1,6-Hexanediol",
            "Catechol",
            "Pinacol",
            "Trehalose",
            "Sucrose",
            "Maltose",
            "Lactose",
            "Ribitol",
            "Xylitol",
            "Mannitol",
            "Sorbitol",
            "Inositol",
            "Tartaric Acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene Glycol (EG)",
                "1,2-Propanediol",
                "1,3-Propanediol",
                "Butanediol (BDO)",
                "1,4-Butanediol",
                "2,3-Butanediol",
                "Pinacol"
            ],
            "mismatches": [
                "Propylene Glycol (PG)",
                "Glycerol (GLY)",
                "Pentanediol",
                "1,5-Pentanediol",
                "Hexanediol",
                "1,6-Hexanediol",
                "Catechol",
                "Trehalose",
                "Sucrose",
                "Maltose",
                "Lactose",
                "Ribitol",
                "Xylitol",
                "Mannitol",
                "Sorbitol",
                "Inositol",
                "Tartaric Acid"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(6E)-8-hydroxygeraniol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dihydroxyphenazine N(5)-oxide",
                "1,6-dodecanediol",
                "1-O-dodecylglycerol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "2alpha-acetoxy-28-acetylrubiarboside G",
                "L-glycol",
                "N-icosadienoyl-1-O-beta-D-glucosyl-15-methylhexadecasphing-4-enine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-galactosyl-(1<->1')-N-(docosanoyl)hexadecasphingosine",
                "beta-bitter acid",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "butanediols",
                "cis-1,2-dihydro-3-ethylcatechol",
                "deoxyaconitine",
                "ethanediol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "inositol phosphosphingolipid",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "lavendiol",
                "maniladiol",
                "pinacol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "rubiarboside G 28-acetate",
                "tetradecanediol",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "Butane-1,3-diol",
            "Butane-1,4-diol",
            "Pentane-1,5-diol",
            "Hexane-1,6-diol",
            "Cyclohexane-1,2-diol",
            "Cyclohexane-1,3-diol",
            "Cyclohexane-1,4-diol",
            "1,2-Propanediol",
            "1,3-Propanediol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,2-Pentanediol",
            "1,4-Pentanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "Pinacol",
            "Mannitol",
            "Sorbitol",
            "Isosorbide",
            "Glycerol",
            "Dipropylene glycol",
            "Neopentyl glycol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (EG)",
                "Butane-1,3-diol",
                "Butane-1,4-diol",
                "Hexane-1,6-diol",
                "Cyclohexane-1,2-diol",
                "1,2-Propanediol",
                "1,3-Propanediol",
                "Pinacol",
                "Neopentyl glycol"
            ],
            "mismatches": [
                "Propylene glycol (PG)",
                "Pentane-1,5-diol",
                "Cyclohexane-1,3-diol",
                "Cyclohexane-1,4-diol",
                "1,2-Butanediol",
                "1,3-Butanediol",
                "1,2-Pentanediol",
                "1,4-Pentanediol",
                "1,2-Hexanediol",
                "1,3-Hexanediol",
                "Mannitol",
                "Sorbitol",
                "Isosorbide",
                "Glycerol",
                "Dipropylene glycol"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,4-tetradecanediol",
                "1,5-tetradecanediol",
                "2-methyl-1,2-butanediol",
                "2-methylpentane-2,4-diol",
                "2-phenyl-1,2-propanediol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-cyclohexane-1,2-diol",
                "cyclohex-3-ene-1,2-diol",
                "cyclohexane-1,2-diol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "hexane-2,5-diol",
                "lavendiol",
                "maniladiol",
                "neopentyl glycol",
                "nimodipine",
                "octane-1,2-diol",
                "pinacol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "Glycerol (Glycerin)",
            "Butylene glycol (BG)",
            "1,2-Butanediol (BDO)",
            "1,3-Butanediol",
            "1,4-Butanediol (BDO)",
            "1,2-Ethanediol (Ethylene glycol)",
            "1,2-Pentanediol",
            "1,2-Hexanediol",
            "2,3-Butanediol",
            "2-Methyl-1,3-butanediol",
            "1,2-Cyclohexanediol",
            "1,2-Octanediol",
            "1,3-Propanediol",
            "1,2-Propylene glycol (Propylene glycol)",
            "2,2-Dimethyl-1,3-propanediol",
            "1,2-Nonanediol",
            "1,2-Decanediol",
            "1,2-Dodecanediol",
            "1,3-Butanediol (Racemic)",
            "1,3-Pentanediol",
            "2,4-Hexanediol",
            "2,5-Hexanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "butane-1,3-diol",
                "1,4-butanediol",
                "1,2-dodecanediol",
                "butane-2,3-diol",
                "cyclohexane-1,2-diol",
                "octane-1,2-diol",
                "propane-1,3-diol",
                "1,2-hexanediol"
            ],
            "mismatches": [
                "propylene glycol",
                "glycerol",
                "butylene glycol",
                "1,2-butanediol",
                "1,2-pentanediol",
                "2-methyl-1,3-butanediol",
                "1,2-propylene glycol",
                "2,2-dimethyl-1,3-propanediol",
                "1,2-nonanediol",
                "1,2-decanediol",
                "1,3-butanediol (racemic)",
                "1,3-pentanediol",
                "2,4-hexanediol",
                "2,5-hexanediol"
            ],
            "true_referents": [
                "(2E)-2,6-dimethylocta-2,7-diene-1,6-diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R)-butane-1,3-diol",
                "1,2-dodecanediol",
                "1,2-hexacosanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "3-methylbutane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "butanediols",
                "cis-cyclohexane-1,2-diol",
                "cyclohexane-1,2-diol",
                "decane-1,2-diol",
                "ethanediol",
                "ethylene glycol",
                "glycol",
                "hexane-2,5-diol",
                "octane-1,2-diol",
                "octanediol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene Glycol (EG)",
            "Propylene Glycol (PG)",
            "Butanediol (BDO)",
            "Pentanediol (PDO)",
            "Hexanediol (HDO)",
            "Heptanediol (HPDO)",
            "Octanediol (ODO)",
            "Nonanediol (NDO)",
            "Decanediol (DDO)",
            "Undecanediol (UDO)",
            "Dodecanediol (D2DO)",
            "Tridecanediol (TDO)",
            "Tetradecanediol (TDDO)",
            "Pentadecanediol (PDDO)",
            "Hexadecanediol (HDDO)",
            "Heptadecanediol (HDDO)",
            "Octadecanediol (ODDO)",
            "Nonadecanediol (NDDO)",
            "Eicosanediol (EDO)",
            "Heneicosanediol (HEDO)",
            "Docosanediol (DODO)",
            "Tricosanediol (TDO)",
            "Tetracosanediol (TDDO)",
            "Pentacosanediol (PDDO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene Glycol (EG)",
                "Butanediol (BDO)",
                "Octanediol (ODO)",
                "Dodecanediol (D2DO)",
                "Tetradecanediol (TDDO)"
            ],
            "mismatches": [
                "Propylene Glycol (PG)",
                "Pentanediol (PDO)",
                "Hexanediol (HDO)",
                "Heptanediol (HPDO)",
                "Nonanediol (NDO)",
                "Decanediol (DDO)",
                "Undecanediol (UDO)",
                "Tridecanediol (TDO)",
                "Pentadecanediol (PDDO)",
                "Hexadecanediol (HDDO)",
                "Heptadecanediol (HDDO)",
                "Octadecanediol (ODDO)",
                "Nonadecanediol (NDDO)",
                "Eicosanediol (EDO)",
                "Heneicosanediol (HEDO)",
                "Docosanediol (DODO)",
                "Tricosanediol (TDO)",
                "Tetracosanediol (TDDO)",
                "Pentacosanediol (PDDO)"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "1,16-hexadecanediol",
                "1,2-docosanediol",
                "1,2-dodecanediol",
                "1,2-hexacosanediol",
                "1,2-hexadecanediol",
                "1,2-octacosanediol",
                "1,2-octadecanediol",
                "1,2-tetracosanediol",
                "1,2-tetradecanediol",
                "1,3-dodecanediol",
                "1,3-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "butanediol",
                "butanediols",
                "dodecanediol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "octadienediol",
                "octanediol",
                "propanediol",
                "tetracosane-1,3-diol",
                "tetradecanediol",
                "triethylene glycol"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "Glycerol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2-Pentanediol",
            "1,3-Pentanediol",
            "1,4-Pentanediol",
            "1,5-Pentanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "1,4-Hexanediol",
            "1,5-Hexanediol",
            "1,6-Hexanediol",
            "1,2-Heptanediol",
            "1,2-Octanediol",
            "1,2-Nonanediol",
            "1,2-Decanediol",
            "1,2-Dodecanediol",
            "1,2-Hexadecanediol",
            "1,2-Octadecanediol",
            "1,2-Eicosanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (EG)",
                "1,2-Butanediol",
                "1,3-Butanediol",
                "1,4-Butanediol",
                "1,2-Decanediol",
                "1,2-Dodecanediol",
                "1,2-Hexadecanediol",
                "1,2-Octanediol",
                "1,2-Octadecanediol",
                "1,6-Hexanediol"
            ],
            "mismatches": [
                "Propylene glycol (PG)",
                "Glycerol",
                "1,2-Pentanediol",
                "1,3-Pentanediol",
                "1,4-Pentanediol",
                "1,5-Pentanediol",
                "1,3-Hexanediol",
                "1,4-Hexanediol",
                "1,5-Hexanediol",
                "1,2-Heptanediol",
                "1,2-Nonanediol",
                "1,2-Eicosanediol"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "1,16-hexadecanediol",
                "1,2-docosanediol",
                "1,2-dodecanediol",
                "1,2-hexacosanediol",
                "1,2-hexadecanediol",
                "1,2-octacosanediol",
                "1,2-octadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,4-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "decane-1,2-diol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "octane-1,2-diol",
                "octanediol",
                "triethylene glycol"
            ],
            "TP": 10,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "Butane-1,4-diol",
            "Glycerol (Glycerin)",
            "1,2-Propanediol",
            "1,3-Propanediol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2-Pentanediol",
            "1,3-Pentanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "Catechol (1,2-dihydroxybenzene)",
            "Resorcinol (1,3-dihydroxybenzene)",
            "Hydroquinone (1,4-dihydroxybenzene)",
            "Sorbitol",
            "Xylitol",
            "Erythritol",
            "Mannitol",
            "1,2-Cyclohexanediol",
            "Polyethylene glycol (PEG)",
            "Diethylene glycol (DEG)",
            "Triethylene glycol (TEG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Butane-1,4-diol",
                "1,2-Propanediol",
                "1,3-Propanediol",
                "1,2-Butanediol",
                "1,3-Butanediol",
                "1,2-Hexanediol",
                "1,2-Cyclohexanediol",
                "Ethylene glycol",
                "Triethylene glycol"
            ],
            "mismatches": [
                "Propylene glycol (PG)",
                "Glycerol (Glycerin)",
                "1,3-Hexanediol",
                "1,2-Pentanediol",
                "1,3-Pentanediol",
                "Catechol (1,2-dihydroxybenzene)",
                "Resorcinol (1,3-dihydroxybenzene)",
                "Hydroquinone (1,4-dihydroxybenzene)",
                "Sorbitol",
                "Xylitol",
                "Erythritol",
                "Mannitol",
                "Polyethylene glycol (PEG)",
                "Diethylene glycol (DEG)"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R,R)-hydrobenzoin",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,5-tetradecanediol",
                "1,6-dihydroxyphenazine N(5)-oxide",
                "1-O-dodecylglycerol",
                "2,3-bis(4-hydroxyphenyl)-1,2-propanediol",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "L-erythro-sphingosine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "cis-1,2-dihydro-3-ethylcatechol",
                "cis-cyclohexane-1,2-diol",
                "cyclohexane-1,2-diol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "1,3-Propanediol (PDO)",
            "1,4-Butanediol (BDO)",
            "2,3-Butanediol",
            "1,5-Pentanediol",
            "1,6-Hexanediol",
            "1,2-Cyclohexanediol",
            "Glycerol",
            "Erythritol",
            "Xylitol",
            "Sorbitol",
            "Mannitol",
            "Pinacol",
            "Bisphenol A (BPA)",
            "Catechol",
            "Resorcinol",
            "Hydroquinone",
            "Dopamine",
            "Adrenaline (Epinephrine)",
            "Testosterone",
            "Estradiol",
            "Cortisol",
            "Vitamin C (Ascorbic acid)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pinacol"
            ],
            "mismatches": [
                "Ethylene glycol (EG)",
                "Propylene glycol (PG)",
                "1,3-Propanediol (PDO)",
                "1,4-Butanediol (BDO)",
                "2,3-Butanediol",
                "1,5-Pentanediol",
                "1,6-Hexanediol",
                "1,2-Cyclohexanediol",
                "Glycerol",
                "Erythritol",
                "Xylitol",
                "Sorbitol",
                "Mannitol",
                "Bisphenol A (BPA)",
                "Catechol",
                "Resorcinol",
                "Hydroquinone",
                "Dopamine",
                "Adrenaline (Epinephrine)",
                "Testosterone",
                "Estradiol",
                "Cortisol",
                "Vitamin C (Ascorbic acid)"
            ],
            "true_referents": [
                "(+)-homalomenol A",
                "(+)-homalomenol B",
                "(+)-phytocassane C",
                "(10S)-Juvenile hormone III diol",
                "(18R)-resolvin E3",
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(6E)-8-hydroxygeraniol",
                "(R,R)-hydrobenzoin",
                "(Z)-1,2-ethenediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dihydroxyphenazine N(5)-oxide",
                "1,6-dodecanediol",
                "16alpha-hydroxytestosterone",
                "19,28-didehydroxyrubiarbonol A",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-hydroxyethyl salicylate",
                "2-methyl-1,2-butanediol",
                "3,1'-dihydroxy-gamma-carotene",
                "L-erythro-sphingosine",
                "N-acyl-15-methylhexadecasphinganine-1-phosphoethanolamine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "bis(2-butoxyethyl)phthalate",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-1,2-dihydro-3-ethylcatechol",
                "cis-cyclohexane-1,2-diol",
                "cortistatin B",
                "cyclohexane-1,2-diol",
                "diisopropanolamine",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "hydrobenzoin",
                "hypodiol",
                "lavendiol",
                "maniladiol",
                "pinacol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "psychosine",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "sapropterin",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "1,3-Butanediol (1,3-BDO)",
            "1,4-Butanediol (1,4-BDO)",
            "2,3-Butanediol (2,3-BDO)",
            "1,2-Pentanediol (1,2-PeDO)",
            "1,5-Pentanediol (1,5-PeDO)",
            "Neopentyl glycol (NPG)",
            "1,6-Hexanediol (1,6-HDO)",
            "2,5-Hexanediol (2,5-HDO)",
            "1,2-Octanediol (1,2-ODO)",
            "1,8-Octanediol (1,8-ODO)",
            "1,10-Decanediol (1,10-DDO)",
            "1,12-Dodecanediol (1,12-DDDO)",
            "Bisphenol A (BPA)",
            "2,2-Dimethyl-1,3-propanediol (NPG)",
            "Catechol",
            "Resorcinol",
            "Hydroquinone (HQ)",
            "cis-1,2-Cyclohexanediol",
            "trans-1,2-Cyclohexanediol",
            "meso-Hydrobenzoin",
            "(2R,3R)-(-)-2,3-Butanediol",
            "(2S,3S)-(+)-2,3-Butanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "neopentyl glycol",
                "1,12-dodecanediol",
                "meso-hydrobenzoin",
                "cis-cyclohexane-1,2-diol",
                "trans-cyclohexane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol"
            ],
            "mismatches": [
                "propylene glycol",
                "1,2-pentanediol",
                "1,5-pentanediol",
                "1,6-hexanediol",
                "2,5-hexanediol",
                "1,2-octanediol",
                "1,8-octanediol",
                "1,10-decanediol",
                "bisphenol A",
                "2,2-dimethyl-1,3-propanediol",
                "catechol",
                "resorcinol",
                "hydroquinone",
                "(2R,3R)-(-)-2,3-butanediol",
                "(2S,3S)-(+)-2,3-butanediol"
            ],
            "true_referents": [
                "(18R)-resolvin E3",
                "(2R)-octane-1,2-diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(6E)-8-hydroxygeraniol",
                "(R)-butane-1,3-diol",
                "(R,R)-butane-2,3-diol",
                "(R,R)-hydrobenzoin",
                "(S)-butane-1,3-diol",
                "(S,S)-butane-2,3-diol",
                "1,12-dodecanediol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,4-tetradecanediol",
                "1,5-tetradecanediol",
                "1,6-dihydroxyphenazine N(5)-oxide",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "19,28-didehydroxyrubiarbonol A",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "bis(2-butoxyethyl)phthalate",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-1,2-dihydro-3-ethylcatechol",
                "cis-3-ethenylcyclohexa-3,5-diene-1,2-diol",
                "cis-cyclohexane-1,2-diol",
                "decane-1,2-diol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "hexane-2,5-diol",
                "hydrobenzoin",
                "meso-hydrobenzoin",
                "neopentyl glycol",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "trans-3-ethenylcyclohexa-3,5-diene-1,2-diol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (HOCH2CH2OH)",
            "Propylene glycol (CH3CH(OH)CH2OH)",
            "1,2-Butanediol (HOCH2CH(OH)CH2CH3)",
            "1,3-Butanediol (HOCH2CH2CH(OH)CH3)",
            "1,4-Butanediol (HOCH2CH2CH2CH2OH)",
            "Glycerol (HOCH2CH(OH)CH2OH)",
            "myo-Inositol (C6H6(OH)6)",
            "D-Mannitol (HOCH2(CHOH)4CH2OH)",
            "D-Glucitol (HOCH2(CHOH)4CH2OH)",
            "Catechol (C6H4(OH)2)",
            "Resorcinol (C6H4(OH)2)",
            "Hydroquinone (C6H4(OH)2)",
            "1,2-Cyclohexanediol (C6H10(OH)2)",
            "1,3-Cyclohexanediol (C6H10(OH)2)",
            "1,4-Cyclohexanediol (C6H10(OH)2)",
            "2,3-Butanediol (CH3CH(OH)CH(OH)CH3)",
            "1,2-Pentanediol (HOCH2CH(OH)CH2CH2CH3)",
            "1,5-Pentanediol (HOCH2CH2CH2CH2CH2OH)",
            "1,2-Hexanediol (HOCH2CH(OH)(CH2)3CH3)",
            "1,6-Hexanediol (HOCH2(CH2)4CH2OH)",
            "1,2-Octanediol (HOCH2CH(OH)(CH2)5CH3)",
            "1,8-Octanediol (HOCH2(CH2)6CH2OH)",
            "1,2-Decanediol (HOCH2CH(OH)(CH2)7CH3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (HOCH2CH2OH)",
                "1,2-Cyclohexanediol (C6H10(OH)2)",
                "1,6-Hexanediol (HOCH2(CH2)4CH2OH)",
                "1,8-Octanediol (HOCH2(CH2)6CH2OH)"
            ],
            "mismatches": [
                "Propylene glycol (CH3CH(OH)CH2OH)",
                "1,2-Butanediol (HOCH2CH(OH)CH2CH3)",
                "1,3-Butanediol (HOCH2CH2CH(OH)CH3)",
                "1,4-Butanediol (HOCH2CH2CH2CH2OH)",
                "Glycerol (HOCH2CH(OH)CH2OH)",
                "myo-Inositol (C6H6(OH)6)",
                "D-Mannitol (HOCH2(CHOH)4CH2OH)",
                "D-Glucitol (HOCH2(CHOH)4CH2OH)",
                "Catechol (C6H4(OH)2)",
                "Resorcinol (C6H4(OH)2)",
                "Hydroquinone (C6H4(OH)2)",
                "1,3-Cyclohexanediol (C6H10(OH)2)",
                "1,4-Cyclohexanediol (C6H10(OH)2)",
                "2,3-Butanediol (CH3CH(OH)CH(OH)CH3)",
                "1,2-Pentanediol (HOCH2CH(OH)CH2CH2CH3)",
                "1,5-Pentanediol (HOCH2CH2CH2CH2CH2OH)",
                "1,2-Hexanediol (HOCH2CH(OH)(CH2)3CH3)",
                "1,2-Octanediol (HOCH2CH(OH)(CH2)5CH3)",
                "1,2-Decanediol (HOCH2CH(OH)(CH2)7CH3)"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2E)-2,6-dimethylocta-2,7-diene-1,6-diol",
                "(2R,5R)-hexanediol",
                "(2S)-octane-1,2-diol",
                "(2S,5S)-hexanediol",
                "(3R,4R)-3,4-dihydroxycyclohexa-1,5-diene-1-carboxylic acid",
                "(4S)-2-methylpentane-2,4-diol",
                "(6E)-8-hydroxygeraniol",
                "(E)-4-hydroxynon-2-en-1-ol",
                "(R)-butane-1,3-diol",
                "(S)-butane-1,3-diol",
                "(S)-propane-1,2-diol",
                "(Z)-1,2-ethenediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,5-tetradecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2,3-bis(4-hydroxyphenyl)-1,2-propanediol",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-hydroxyethyl octadecanoate",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "3-ethenylcyclohexa-3,5-diene-1,2-diol",
                "6-(2-hydroxyethoxy)-6-oxohexanoic acid",
                "N-(2-hydroxyhexacosanoyl)-15-methylhexadecasphing-4-enine",
                "N-(2-hydroxyhexacosanoyl)phytosphingosine-1-phospho-(1D-myo-inositol)",
                "butanediol",
                "cis-1,2-dihydro-3-ethylcatechol",
                "cis-cyclohexane-1,2-diol",
                "cyclohex-3-ene-1,2-diol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "inositol phosphomannosylinositol-1-phosphodihydroceramide",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "octane-1,8-diol",
                "octanediol"
            ],
            "TP": 4,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "Glycerol (GLY)",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol (BDO)",
            "1,2-Pentanediol",
            "1,5-Pentanediol",
            "1,2-Hexanediol",
            "1,6-Hexanediol (HDO)",
            "1,2-Octanediol",
            "1,8-Octanediol",
            "1,2-Decanediol",
            "1,10-Decanediol",
            "Erythritol",
            "Threitol",
            "Arabitol",
            "Xylitol",
            "Mannitol",
            "Sorbitol",
            "Galactitol",
            "Inositol",
            "Deoxyribose",
            "Ribose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "1,2-butanediol",
                "1,3-butanediol",
                "1,4-butanediol",
                "1,2-octanediol",
                "octane-1,8-diol",
                "1,2-decanediol"
            ],
            "mismatches": [
                "propylene glycol",
                "glycerol",
                "1,2-pentanediol",
                "1,5-pentanediol",
                "1,6-hexanediol",
                "1,10-decanediol",
                "erythritol",
                "threitol",
                "arabitol",
                "xylitol",
                "mannitol",
                "sorbitol",
                "galactitol",
                "inositol",
                "deoxyribose",
                "ribose"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,4-dithiothreitol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "2-methyl-1,2-butanediol",
                "5-(4,5-dihydroxypentyl)uracil",
                "8,5'-cyclo-2'-deoxyadenosine",
                "8,5'-cyclo-2'-deoxyguanosine",
                "L-erythro-sphingosine",
                "L-glycol",
                "N-docosenoyl-15-methylhexadecasphing-4-enine-1-phosphocholine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphinganine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "decane-1,2-diol",
                "dithioerythritol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "inositol phosphosphingolipid",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "rubiarboside G 28-acetate",
                "rubiarboside G 28-al",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Glycerol (Gly)",
            "Erythritol",
            "Mannitol",
            "Sorbitol",
            "Xylitol",
            "Fructose-1,6-bisphosphate",
            "Cyclohexane-1,2-diol",
            "1,2-Ethanediol",
            "1,3-Propanediol",
            "1,4-Butanediol",
            "1,5-Pentanediol",
            "1,6-Hexanediol",
            "1,7-Heptanediol",
            "1,8-Octanediol",
            "1,9-Nonanediol",
            "1,10-Decanediol",
            "1,12-Dodecanediol",
            "1,3-Dihydroxy-2-methylpropane",
            "1,2-Dihydroxy-4-methylpentane",
            "1,3-Dihydroxy-5-methylhexane",
            "1,4-Dihydroxy-2-methylpentane",
            "1,5-Dihydroxy-3-methylhexane",
            "1,6-Dihydroxy-4-methylheptane",
            "1,7-Dihydroxy-5-methyloctane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclohexane-1,2-diol",
                "1,2-Ethanediol",
                "1,3-Propanediol",
                "1,4-Butanediol",
                "1,12-Dodecanediol"
            ],
            "mismatches": [
                "Glycerol (Gly)",
                "Erythritol",
                "Mannitol",
                "Sorbitol",
                "Xylitol",
                "Fructose-1,6-bisphosphate",
                "1,5-Pentanediol",
                "1,6-Hexanediol",
                "1,7-Heptanediol",
                "1,8-Octanediol",
                "1,9-Nonanediol",
                "1,10-Decanediol",
                "1,3-Dihydroxy-2-methylpropane",
                "1,2-Dihydroxy-4-methylpentane",
                "1,3-Dihydroxy-5-methylhexane",
                "1,4-Dihydroxy-2-methylpentane",
                "1,5-Dihydroxy-3-methylhexane",
                "1,6-Dihydroxy-4-methylheptane",
                "1,7-Dihydroxy-5-methyloctane"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(4S)-2-methylpentane-2,4-diol",
                "(Z)-1,2-ethenediol",
                "1'-hydroxy-demethylspheroidene",
                "1,12-dodecanediol",
                "1,2,3,4-tetrahydronaphthalene-2,3-diol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-diacetoxypropane",
                "1,3-dihydroxybutan-2-one",
                "1,3-dodecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,7-tetradecanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "1-hydroxy-3-methylbutan-2-one",
                "2-hydroxypropyl dihydrogen phosphate",
                "2-methylene-1,4-butanediol",
                "2-methylpentane-2,4-diol",
                "2-methylpropane-1,2-diol",
                "7-methyl-1,2-dihydronaphthalene-1,2-diol",
                "L-erythro-sphingosine",
                "L-glycol",
                "N-(2-hydroxyhexacosanoyl)phytosphingosine-1-phospho-(1D-myo-inositol)",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butane-1,4-diol",
                "butanediol",
                "cis-cyclohexane-1,2-diol",
                "cyclohexane-1,2-diol",
                "ethanediol",
                "ethanediol derivative",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "octane-1,8-diol",
                "octanediol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "trans-1,2,3,4-tetrahydronaphthalene-2,3-diol",
                "trans-cyclohexane-1,2-diol"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Butan-1,2-diol",
            "1,3-Butanediol",
            "2,3-Butanediol",
            "Pinacol (PNC)",
            "1,2-Propanediol (PROP)",
            "1,3-Propanediol (PDO)",
            "2,3-Propanediol",
            "But-2-ene-1,4-diol",
            "Catechin (C)",
            "Cholesterol (Chol)",
            "1,2-Cyclohexanediol",
            "1,4-Cyclohexanediol",
            "1,2-Cyclopentanediol",
            "D-mannitol (MAN)",
            "1,2-Decanediol",
            "1,10-Decanediol",
            "Dulcitol (DUL)",
            "Erythritol (Ery)",
            "Galactitol (GAL)",
            "1,2-Hexanediol",
            "1,6-Hexanediol",
            "Meso-erythritol (MERY)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-2,3-diol",
                "pinacol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "cyclohexane-1,2-diol",
                "decane-1,2-diol",
                "hexane-1,6-diol"
            ],
            "mismatches": [
                "2,3-propanediol",
                "but-2-ene-1,4-diol",
                "catechin (C)",
                "cholesterol (Chol)",
                "1,4-cyclohexanediol",
                "1,2-cyclopentanediol",
                "D-mannitol (MAN)",
                "1,10-decanediol",
                "dulcitol (DUL)",
                "erythritol (Ery)",
                "galactitol (GAL)",
                "1,2-hexanediol",
                "1,6-hexanediol",
                "meso-erythritol (MERY)"
            ],
            "true_referents": [
                "(+)-phytocassane C",
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(S)-chlorphenesin",
                "(S,S)-butane-2,3-diol",
                "1,2-diguaiacylpropane-1,3-diol",
                "1,2-hexadecanediol",
                "1,2-octacosanediol",
                "1,2-tetradecanediol",
                "1,3-diacetoxypropane",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2'-O-methylodoratol",
                "2,3-bis(4-hydroxyphenyl)-1,2-propanediol",
                "2-methyl-1,2-butanediol",
                "2-phenyl-1,2-propanediol",
                "4beta-hydroxycholesterol",
                "6alpha-hydroxycholestanol",
                "L-erythro-N-dodecanoylsphingosine",
                "L-erythro-sphingosine",
                "Man-1-6-Ins-1-P-Cer(d18:0/2-OH-26:0)",
                "Man-1-6-Ins-1-P-Cer(d18:0/2-OH-26:0)(1-)",
                "TCA-ethadyl",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphinganine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "but-2-yne-1,4-diol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-2,3-diol",
                "butanediol",
                "cardivin C",
                "cis-cyclohexane-1,2-diol",
                "cyclohexane-1,2-diol",
                "decane-1,2-diol",
                "ethylene glycol",
                "hexane-1,6-diol",
                "maniladiol",
                "meso-butane-2,3-diol",
                "octanediol",
                "phthiocerol A",
                "pinacol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "diol",
                "Canonical name": "diol"
            },
            {
                "Referent": "1,2-ethanediol",
                "Canonical name": "ethane-1,2-diol"
            },
            {
                "Referent": "1,3-propanediol",
                "Canonical name": "propane-1,3-diol"
            },
            {
                "Referent": "1,4-butanediol",
                "Canonical name": "butane-1,4-diol"
            },
            {
                "Referent": "1,5-pentanediol",
                "Canonical name": "pentane-1,5-diol"
            },
            {
                "Referent": "1,6-hexanediol",
                "Canonical name": "hexane-1,6-diol"
            },
            {
                "Referent": "1,7-heptanediol",
                "Canonical name": "heptane-1,7-diol"
            },
            {
                "Referent": "1,8-octanediol",
                "Canonical name": "octane-1,8-diol"
            },
            {
                "Referent": "1,9-nonanediol",
                "Canonical name": "nonane-1,9-diol"
            },
            {
                "Referent": "1,10-decanediol",
                "Canonical name": "decan-1,10-diol"
            },
            {
                "Referent": "1,11-undecanediol",
                "Canonical name": "undecane-1,11-diol"
            },
            {
                "Referent": "1,12-dodecanediol",
                "Canonical name": "dodecane-1,12-diol"
            },
            {
                "Referent": "1,13-tridecanediol",
                "Canonical name": "tridecane-1,13-diol"
            },
            {
                "Referent": "1,14-tetradecanediol",
                "Canonical name": "tetradecane-1,14-diol"
            },
            {
                "Referent": "1,15-pentadecanediol",
                "Canonical name": "pentadecane-1,15-diol"
            },
            {
                "Referent": "1,16-hexadecanediol",
                "Canonical name": "hexadecane-1,16-diol"
            },
            {
                "Referent": "1,17-heptadecanediol",
                "Canonical name": "heptadecane-1,17-diol"
            },
            {
                "Referent": "1,18-octadecanediol",
                "Canonical name": "octadecane-1,18-diol"
            },
            {
                "Referent": "1,19-nonadecanediol",
                "Canonical name": "nonadecane-1,19-diol"
            },
            {
                "Referent": "1,20-eicosanediol",
                "Canonical name": "eicosane-1,20-diol"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "hexane-1,6-diol",
                "1,16-hexadecanediol"
            ],
            "mismatches": [
                "diol",
                "ethane-1,2-diol",
                "propane-1,3-diol",
                "butane-1,4-diol",
                "pentane-1,5-diol",
                "heptane-1,7-diol",
                "octane-1,8-diol",
                "nonane-1,9-diol",
                "decan-1,10-diol",
                "undecane-1,11-diol",
                "dodecane-1,12-diol",
                "tridecane-1,13-diol",
                "tetradecane-1,14-diol",
                "pentadecane-1,15-diol",
                "heptadecane-1,17-diol",
                "octadecane-1,18-diol",
                "nonadecane-1,19-diol",
                "eicosane-1,20-diol"
            ],
            "true_referents": [
                "(2S,5S)-hexanediol",
                "(4S)-2-methylpentane-2,4-diol",
                "(5Z,11Z,14Z)-8,9-dihydroxyicosatrienoic acid",
                "(5Z,8R,9R,11Z,14Z)-8,9-dihydroxyicosatrienoic acid",
                "(5Z,8S,9S,11Z,14Z)-8,9-dihydroxyicosatrienoic acid",
                "(S)-butane-1,2-diol",
                "(S)-butane-1,3-diol",
                "(S)-propane-1,2-diol",
                "1,16-hexadecanediol",
                "1,2-hexadecanediol",
                "1,9-decanediol",
                "2-methylpentane-2,4-diol",
                "hexane-1,6-diol",
                "octane-1,8-diol"
            ],
            "TP": 2,
            "FP": 18,
            "FN": 0
        }
    }
]