[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "ethylene glycol (EG)",
            "1,2-propanediol (1,2-PD)",
            "1,3-propanediol (1,3-PD)",
            "1,2-butanediol (1,2-BD)",
            "1,3-butanediol (1,3-BD)",
            "1,4-butanediol (1,4-BD)",
            "diethylene glycol (DEG)",
            "triethylene glycol (TEG)",
            "thiodiglycol",
            "1,2-pentanediol",
            "1,3-pentanediol",
            "1,4-pentanediol",
            "1,5-pentanediol",
            "1,2-hexanediol",
            "1,3-hexanediol",
            "1,4-hexanediol",
            "1,6-hexanediol",
            "diethylene glycol monomethyl ether (DMM)",
            "diethylene glycol monoethyl ether (DEE)",
            "diethylene glycol monopropyl ether (DPP)",
            "diethylene glycol monobutyl ether (DnB)",
            "diethylene glycol monophenyl ether (DPh)",
            "diethylene glycol dibutyl ether (DBE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "diethylene glycol",
                "triethylene glycol",
                "thiodiglycol",
                "diethylene glycol monoethyl ether"
            ],
            "mismatches": [
                "1,4-butanediol (1,4-BD)",
                "1,2-pentanediol",
                "1,3-pentanediol",
                "1,4-pentanediol",
                "1,5-pentanediol",
                "1,2-hexanediol",
                "1,3-hexanediol",
                "1,4-hexanediol",
                "1,6-hexanediol",
                "diethylene glycol monomethyl ether (DMM)",
                "diethylene glycol monopropyl ether (DPP)",
                "diethylene glycol monobutyl ether (DnB)",
                "diethylene glycol monophenyl ether (DPh)",
                "diethylene glycol dibutyl ether (DBE)"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R)-monothioglycerol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,4-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butanediol",
                "diethylene glycol monoethyl ether",
                "ethylene glycol",
                "ethylene glycol monododecyl ether",
                "glycol",
                "hexane-1,6-diol",
                "monothioglycerol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propanediol",
                "thiodiglycol",
                "triethylene glycol",
                "triethylene glycol monomethyl ether"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "1,2-Propanediol (Propylene glycol, PG)",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2-Butanediol",
            "Glycerol (Glycerin, C3H8O3)",
            "1,2-Cyclohexanediol",
            "1,3-Cyclohexanediol",
            "1,4-Cyclohexanediol",
            "1,5-Pentanediol",
            "2,3-Pentanediol",
            "2,4-Pentanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "1,6-Hexanediol",
            "1,2-Heptanediol",
            "1,3-Heptanediol",
            "1,4-Heptanediol",
            "1,2-Octanediol",
            "1,3-Octanediol",
            "1,4-Octanediol",
            "1,2-Nonanediol",
            "1,3-Nonanediol",
            "1,4-Nonanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,3-Butanediol",
                "1,4-Butanediol",
                "1,2-Butanediol",
                "1,2-Cyclohexanediol",
                "1,6-Hexanediol",
                "1,2-Octanediol",
                "Ethylene glycol (EG)"
            ],
            "mismatches": [
                "1,2-Propanediol (Propylene glycol, PG)",
                "Glycerol (Glycerin, C3H8O3)",
                "1,3-Cyclohexanediol",
                "1,4-Cyclohexanediol",
                "1,5-Pentanediol",
                "2,3-Pentanediol",
                "2,4-Pentanediol",
                "1,2-Hexanediol",
                "1,3-Hexanediol",
                "1,2-Heptanediol",
                "1,3-Heptanediol",
                "1,4-Heptanediol",
                "1,3-Octanediol",
                "1,4-Octanediol",
                "1,2-Nonanediol",
                "1,3-Nonanediol",
                "1,4-Nonanediol"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R)-propane-1,2-diol",
                "1,2-dodecanediol",
                "1,2-hexacosanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-dodecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,4-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "cis-cyclohexane-1,2-diol",
                "cyclohex-3-ene-1,2-diol",
                "cyclohexane-1,2-diol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "1,2-Propanediol (Propylene glycol)",
            "1,3-Propanediol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2-Pentanediol",
            "1,3-Pentanediol",
            "1,4-Pentanediol",
            "1,5-Pentanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "1,4-Hexanediol",
            "1,5-Hexanediol",
            "1,6-Hexanediol",
            "1,2-Heptanediol",
            "1,3-Heptanediol",
            "1,4-Heptanediol",
            "1,5-Heptanediol",
            "1,6-Heptanediol",
            "1,7-Heptanediol",
            "1,2-Octanediol",
            "1,3-Octanediol",
            "1,4-Octanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (EG)",
                "1,3-Propanediol",
                "1,2-Butanediol",
                "1,3-Butanediol",
                "1,4-Butanediol",
                "1,2-Octanediol"
            ],
            "mismatches": [
                "1,2-Propanediol (Propylene glycol)",
                "1,2-Pentanediol",
                "1,3-Pentanediol",
                "1,4-Pentanediol",
                "1,5-Pentanediol",
                "1,2-Hexanediol",
                "1,3-Hexanediol",
                "1,4-Hexanediol",
                "1,5-Hexanediol",
                "1,6-Hexanediol",
                "1,2-Heptanediol",
                "1,3-Heptanediol",
                "1,4-Heptanediol",
                "1,5-Heptanediol",
                "1,6-Heptanediol",
                "1,7-Heptanediol",
                "1,3-Octanediol",
                "1,4-Octanediol"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(S)-propane-1,2-diol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-dodecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,4-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,6-tetradecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,7-tetradecanediol",
                "1,9-decanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "ethylene glycol",
                "hexane-1,6-diol",
                "octane-1,2-diol",
                "octanediol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "triethylene glycol"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene Glycol (EG)",
            "Propylene Glycol (PG)",
            "1,3-Propanediol",
            "1,4-Butanediol (BDO)",
            "Glycerol (GLY)",
            "Pentaerythritol",
            "Xylitol",
            "Mannitol",
            "Sorbitol",
            "Erythritol",
            "Threitol",
            "Ribitol",
            "Inositol",
            "Dulcitol",
            "Galactitol",
            "Quercidiol",
            "Diethylene Glycol (DEG)",
            "Triethylene Glycol (TEG)",
            "Polyethylene Glycol (PEG)",
            "Dipropylene Glycol (DPG)",
            "Trimethylolpropane (TMP)",
            "Neopentyl Glycol (NPG)",
            "2-Methyl-2,4-Pentanediol",
            "Hexylene Glycol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene Glycol (EG)",
                "Neopentyl Glycol (NPG)",
                "Triethylene Glycol (TEG)",
                "2-Methyl-2,4-Pentanediol"
            ],
            "mismatches": [
                "Propylene Glycol (PG)",
                "1,3-Propanediol",
                "1,4-Butanediol (BDO)",
                "Glycerol (GLY)",
                "Pentaerythritol",
                "Xylitol",
                "Mannitol",
                "Sorbitol",
                "Erythritol",
                "Threitol",
                "Ribitol",
                "Inositol",
                "Dulcitol",
                "Galactitol",
                "Quercidiol",
                "Diethylene Glycol (DEG)",
                "Polyethylene Glycol (PEG)",
                "Dipropylene Glycol (DPG)",
                "Trimethylolpropane (TMP)",
                "Hexylene Glycol"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(4S)-2-methylpentane-2,4-diol",
                "1,2-diguaiacylpropane-1,3-diol",
                "1,3-diacetoxypropane",
                "1,4-dithiothreitol",
                "1,4-tetradecanediol",
                "1-O-dodecylglycerol",
                "2-methylpentane-2,4-diol",
                "2-methylpropane-1,2-diol",
                "2alpha-acetoxy-28-acetylrubiarboside G",
                "L-erythro-sphingosine",
                "L-glycol",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphinganine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butane-1,4-diol",
                "butanediol",
                "cyathadiol",
                "daturadiol",
                "dithioerythritol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "inositol phosphosphingolipid",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "lavendiol",
                "neopentyl glycol",
                "odoratol",
                "pentaerythritol dinitrate",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "rubiarboside G 28-acetate",
                "triethylene glycol",
                "triethylene glycol monomethyl ether"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "1,3-Propanediol (PDO)",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2-Pentanediol",
            "1,5-Pentanediol",
            "1,3-Pentanediol",
            "2,3-Butanediol",
            "1,2-Hexanediol",
            "1,6-Hexanediol",
            "1,3-Hexanediol",
            "1,4-Hexanediol",
            "1,7-Heptanediol",
            "1,2-Octanediol",
            "1,8-Octanediol",
            "1,3-Octanediol",
            "2,2-Dimethyl-1,3-propanediol",
            "2-Methyl-2,4-pentanediol",
            "2,3-Pentanediol",
            "1,9-Nonanediol",
            "1,10-Decanediol",
            "1,12-Dodecanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "1,3-propanediol",
                "1,3-butanediol",
                "1,4-butanediol",
                "2,3-butanediol",
                "1,2-octanediol",
                "1,8-octanediol",
                "1,12-dodecanediol"
            ],
            "mismatches": [
                "propylene glycol",
                "1,2-butanediol",
                "1,2-pentanediol",
                "1,5-pentanediol",
                "1,3-pentanediol",
                "1,2-hexanediol",
                "1,6-hexanediol",
                "1,3-hexanediol",
                "1,4-hexanediol",
                "1,7-heptanediol",
                "1,3-octanediol",
                "2,2-dimethyl-1,3-propanediol",
                "2-methyl-2,4-pentanediol",
                "2,3-pentanediol",
                "1,9-nonanediol",
                "1,10-decanediol"
            ],
            "true_referents": [
                "(2E)-2,6-dimethylocta-2,7-diene-1,6-diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(4S)-2-methylpentane-2,4-diol",
                "1,12-dodecanediol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-dodecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,4-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,7-tetradecanediol",
                "1,9-decanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-methylpentane-2,4-diol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "triethylene glycol"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethanediol (Ethylene Glycol)",
            "Propylene Glycol (1,2-Propanediol)",
            "Butanediol (1,4-Butanediol)",
            "Glycerol (Glycerin)",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,2-Pentanediol",
            "2,3-Butanediol",
            "1,2-Hexanediol",
            "2,4-Hexanediol",
            "1,3-Pentanediol",
            "1,2-Cyclohexanediol",
            "1,2-Propylene Glycol Dicaprylate",
            "1,2-Ethanediol",
            "2,2-Dimethyl-1,3-propanediol",
            "1,3-Hexanediol",
            "1,4-Butanediol Dimethyl Ether",
            "1,2-Octanediol",
            "1,2-Nonanediol",
            "1,2-Decanediol",
            "2,3-Pentanediol",
            "1,3-Cyclopentanediol",
            "1,2-Phenylethanediol",
            "1,2-Dodecanediol",
            "1,2-Tetradecanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2-Butanediol",
                "1,3-Butanediol",
                "2,3-Butanediol",
                "1,2-Ethanediol",
                "1,2-Octanediol",
                "1,2-Dodecanediol",
                "1,2-Tetradecanediol"
            ],
            "mismatches": [
                "Ethanediol (Ethylene Glycol)",
                "Propylene Glycol (1,2-Propanediol)",
                "Butanediol (1,4-Butanediol)",
                "Glycerol (Glycerin)",
                "1,2-Pentanediol",
                "2,4-Hexanediol",
                "1,3-Pentanediol",
                "1,2-Cyclohexanediol",
                "1,2-Propylene Glycol Dicaprylate",
                "2,2-Dimethyl-1,3-propanediol",
                "1,3-Hexanediol",
                "1,4-Butanediol Dimethyl Ether",
                "1,2-Nonanediol",
                "1,2-Decanediol",
                "2,3-Pentanediol",
                "1,3-Cyclopentanediol",
                "1,2-Phenylethanediol"
            ],
            "true_referents": [
                "(2E)-2,6-dimethylocta-2,7-diene-1,6-diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(Z)-1,2-ethenediol",
                "1,2-dodecanediol",
                "1,2-hexacosanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,4-dodecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-cyclohexane-1,2-diol",
                "cyclohexane-1,2-diol",
                "decane-1,2-diol",
                "ethanediol",
                "ethanediol derivative",
                "ethylene glycol",
                "ethylene glycol dimethacrylate",
                "glycol",
                "octane-1,2-diol",
                "octanediol",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene Glycol (EG)",
            "Propylene Glycol (PG)",
            "Glycerol (G)",
            "1,2-Propanediol (1,2-PD)",
            "1,3-Propanediol (1,3-PD)",
            "1,2-Butanediol (1,2-BD)",
            "1,3-Butanediol (1,3-BD)",
            "1,4-Butanediol (1,4-BD)",
            "1,2-Pentanediol (1,2-PD)",
            "1,5-Pentanediol (1,5-PD)",
            "1,2-Hexanediol (1,2-HD)",
            "1,6-Hexanediol (1,6-HD)",
            "1,2-Heptanediol (1,2-HD)",
            "1,7-Heptanediol (1,7-HD)",
            "1,2-Octanediol (1,2-OD)",
            "1,8-Octanediol (1,8-OD)",
            "1,2-Nonanediol (1,2-ND)",
            "1,9-Nonanediol (1,9-ND)",
            "1,2-Decanediol (1,2-DD)",
            "1,10-Decanediol (1,10-DD)",
            "1,2-Undecanediol (1,2-UD)",
            "1,11-Undecanediol (1,11-UD)",
            "1,2-Dodecanediol (1,2-DD)",
            "1,12-Dodecanediol (1,12-DD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "1,2-dodecanediol",
                "1,12-dodecanediol"
            ],
            "mismatches": [
                "propylene glycol",
                "glycerol",
                "1,4-butanediol",
                "1,2-pentanediol",
                "1,5-pentanediol",
                "1,2-hexanediol",
                "1,2-heptanediol",
                "1,7-heptanediol",
                "1,2-octanediol",
                "1,8-octanediol",
                "1,2-nonanediol",
                "1,9-nonanediol",
                "1,2-decanediol",
                "1,10-decanediol",
                "1,2-undecanediol",
                "1,11-undecanediol"
            ],
            "true_referents": [
                "(1S,2S)-DDT-2,3-dihydrodiol",
                "(2R)-octane-1,2-diol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "1,10-dodecanediol",
                "1,11-dodecanediol",
                "1,12-dodecanediol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-dodecanediol",
                "1,4-dodecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,7-tetradecanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "2-aminooctadecene-1,3-diol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "L-glycol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butanediol",
                "decane-1,2-diol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "octanediol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propanediol",
                "triethylene glycol",
                "undecane-1,11-diol"
            ],
            "TP": 7,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Isopropanol",
            "Glycerol",
            "Propylene glycol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "1,2,3-Propanetriol",
            "1,2,4-Butanetriol",
            "1,2,3-Butanetriol",
            "1,2,3,4-Butanetetrol",
            "1,2,3,4,5-Pentanol",
            "1,2,3,4,6-Pentahexanol",
            "1,2,3,4,6-Pentapentanol",
            "1,2,3,4,6-Pentahexanol",
            "1,2,3,4,5,6-Hexanol",
            "1,2,3,4,5,6-Heptanol",
            "1,2,3,4,5,6,7-Octanol",
            "1,2,3,4,5,6,7,8-Nonanol",
            "1,2,3,4,5,6,7,8,9-Decanol",
            "1,2,3,4,5,6,7,8,9,10-Undecanol",
            "1,2,3,4,5,6,7,8,9,10,11-Dodecanol",
            "1,2,3,4,5,6,7,8,9,10,11,12-Tridecanol",
            "1,2,3,4,5,6,7,8,9,10,11,12,13-Tetradecanol",
            "1,2,3,4,5,6,7,8,9,10,11,12,13,14-Pentadecanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2-Butanediol",
                "1,3-Butanediol",
                "1,4-Butanediol",
                "Ethylene glycol (EG)"
            ],
            "mismatches": [
                "Isopropanol",
                "Glycerol",
                "Propylene glycol",
                "1,2,3-Propanetriol",
                "1,2,4-Butanetriol",
                "1,2,3-Butanetriol",
                "1,2,3,4-Butanetetrol",
                "1,2,3,4,5-Pentanol",
                "1,2,3,4,6-Pentahexanol",
                "1,2,3,4,6-Pentapentanol",
                "1,2,3,4,5,6-Hexanol",
                "1,2,3,4,5,6-Heptanol",
                "1,2,3,4,5,6,7-Octanol",
                "1,2,3,4,5,6,7,8-Nonanol",
                "1,2,3,4,5,6,7,8,9-Decanol",
                "1,2,3,4,5,6,7,8,9,10-Undecanol",
                "1,2,3,4,5,6,7,8,9,10,11-Dodecanol",
                "1,2,3,4,5,6,7,8,9,10,11,12-Tridecanol",
                "1,2,3,4,5,6,7,8,9,10,11,12,13-Tetradecanol",
                "1,2,3,4,5,6,7,8,9,10,11,12,13,14-Pentadecanol"
            ],
            "true_referents": [
                "(2R)-octane-1,2-diol",
                "(2R,5R)-hexanediol",
                "(2S)-octane-1,2-diol",
                "(4S)-2-methylpentane-2,4-diol",
                "(8E)-undeca-1,8-dien-5-yne-3,7-diol",
                "(R)-butane-1,3-diol",
                "1,10-dodecanediol",
                "1,11-dodecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,4-tetradecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1,9-dodecanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-methylpentane-2,4-diol",
                "2-methylpropane-1,2-diol",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "decane-1,2-diol",
                "ethylene glycol",
                "flavan-3,3',4,4',5,5',7-heptol",
                "glycol",
                "hexane-1,6-diol",
                "hexane-2,5-diol",
                "octane-1,8-diol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "triethylene glycol",
                "undecane-1,11-diol"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Diethylene glycol (DEG)",
            "Propylene glycol (PG)",
            "1,2-Propanediol",
            "1,3-Propanediol",
            "1,4-Butanediol",
            "1,5-Pentanediol",
            "1,6-Hexanediol",
            "1,2-Hexanediol",
            "1,3-Hexanediol",
            "1,4-Hexanediol",
            "Catechol (1,2-Dihydroxybenzene)",
            "Resorcinol (1,3-Dihydroxybenzene)",
            "Hydroquinone (1,4-Dihydroxybenzene)",
            "Cyclohexanediol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "2-Methyl-1,3-Propanediol",
            "2,3-Butanediol",
            "Tetrahydrofuran-2,5-diol",
            "Bisphenol A (2,2-bis(4-hydroxyphenyl)propane)",
            "1,2-Ethanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (EG)",
                "1,2-Propanediol",
                "1,3-Propanediol",
                "1,4-Butanediol",
                "1,2-Hexanediol",
                "1,2-Butanediol",
                "1,3-Butanediol",
                "2,3-Butanediol",
                "1,2-Ethanediol"
            ],
            "mismatches": [
                "Diethylene glycol (DEG)",
                "Propylene glycol (PG)",
                "1,5-Pentanediol",
                "1,3-Hexanediol",
                "1,4-Hexanediol",
                "Catechol (1,2-Dihydroxybenzene)",
                "Resorcinol (1,3-Dihydroxybenzene)",
                "Hydroquinone (1,4-Dihydroxybenzene)",
                "Cyclohexanediol",
                "2-Methyl-1,3-Propanediol",
                "Tetrahydrofuran-2,5-diol",
                "Bisphenol A (2,2-bis(4-hydroxyphenyl)propane)"
            ],
            "true_referents": [
                "(2R,4S)-2-methyl-2,4-dihydroxydihydrofuran-3-one",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R,R)-hydrobenzoin",
                "(Z)-1,2-ethenediol",
                "1,2-bis(3,4-dimethoxyphenyl)propane-1,3-diol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,4-dodecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dihydroxyphenazine N(5)-oxide",
                "1,6-dodecanediol",
                "2,3-bis(4-hydroxyphenyl)-1,2-propanediol",
                "2,5-furandimethanol",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-methylpropane-1,2-diol",
                "2-phenyl-1,2-propanediol",
                "bis(2-butoxyethyl)phthalate",
                "butane-1,2-diol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-1,2-dihydro-3-ethylcatechol",
                "cyclohexadienediol",
                "cyclohexane-1,2-diol",
                "ethanediol",
                "ethanediol derivative",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "hexane-2,5-diol",
                "propane-1,2-diol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 9,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "1,3-Propanediol (PDO)",
            "1,4-Butanediol (BDO)",
            "1,3-Butanediol",
            "2,3-Butanediol",
            "1,5-Pentanediol",
            "1,6-Hexanediol",
            "Neopentyl glycol",
            "Trimethylolpropane (TMP)",
            "Glycerol (Glycerin)",
            "Erythritol",
            "Xylitol",
            "Sorbitol",
            "Mannitol",
            "Maltitol",
            "Lactitol",
            "Isomalt",
            "Catechol",
            "Resorcinol",
            "Hydroquinone",
            "Pyrogallol",
            "Phloroglucinol",
            "Pinacol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "neopentyl glycol",
                "pinacol"
            ],
            "mismatches": [
                "propylene glycol (PG)",
                "1,3-propanediol (PDO)",
                "1,4-butanediol (BDO)",
                "1,3-butanediol",
                "2,3-butanediol",
                "1,5-pentanediol",
                "1,6-hexanediol",
                "trimethylolpropane (TMP)",
                "glycerol (glycerin)",
                "erythritol",
                "xylitol",
                "sorbitol",
                "mannitol",
                "maltitol",
                "lactitol",
                "isomalt",
                "catechol",
                "resorcinol",
                "hydroquinone",
                "pyrogallol",
                "phloroglucinol"
            ],
            "true_referents": [
                "(18R)-resolvin E3",
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(6E)-8-hydroxygeraniol",
                "(R,R)-hydrobenzoin",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-diacetoxypropane",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dihydroxyphenazine N(5)-oxide",
                "1,6-dodecanediol",
                "1-O-dodecylglycerol",
                "19,28-didehydroxyrubiarbonol A",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-methyl-1,2-butanediol",
                "2-methylpropane-1,2-diol",
                "8-Gingediol",
                "L-erythro-sphingosine",
                "L-glycol",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "cis-1,2-dihydro-3-ethylcatechol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "hydrobenzoin",
                "lavendiol",
                "maniladiol",
                "monobutyrin",
                "neopentyl glycol",
                "pinacol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "triethylene glycol",
                "triethylene glycol monomethyl ether",
                "veratrylglycerol beta-guaiacyl ether"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "1,3-Butanediol (1,3-BDO)",
            "2,3-Butanediol (2,3-BDO)",
            "1,4-Butanediol (1,4-BDO)",
            "1,5-Pentanediol (1,5-PDO)",
            "Neopentyl glycol (NPG)",
            "1,6-Hexanediol (1,6-HDO)",
            "2-Methyl-2,4-pentanediol (MPD)",
            "2-Ethyl-1,3-hexanediol (EHD)",
            "Diethylene glycol (DEG)",
            "Triethylene glycol (TEG)",
            "Tetraethylene glycol",
            "Dipropylene glycol (DPG)",
            "Tripropylene glycol (TPG)",
            "1,2-Pentanediol",
            "1,2-Hexanediol",
            "2,5-Hexanediol",
            "3-Methyl-1,3-butanediol",
            "3-Methyl-1,5-pentanediol",
            "2-Methyl-1,3-propanediol",
            "2-Methyl-2,3-butanediol",
            "2-Butyl-2-ethyl-1,3-propanediol",
            "2,2-Diethyl-1,3-propanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol",
                "neopentyl glycol",
                "triethylene glycol",
                "2,3-butanediol",
                "1,4-butanediol",
                "2-methyl-2,4-pentanediol",
                "3-methylbutane-1,2-diol"
            ],
            "mismatches": [
                "propylene glycol",
                "1,3-butanediol",
                "1,5-pentanediol",
                "1,6-hexanediol",
                "2-ethyl-1,3-hexanediol",
                "diethylene glycol",
                "tetraethylene glycol",
                "dipropylene glycol",
                "tripropylene glycol",
                "1,2-pentanediol",
                "1,2-hexanediol",
                "2,5-hexanediol",
                "3-methyl-1,5-pentanediol",
                "2-methyl-1,3-propanediol",
                "2-methyl-2,3-butanediol",
                "2-butyl-2-ethyl-1,3-propanediol",
                "2,2-diethyl-1,3-propanediol"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "1,2-dodecanediol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,3-tetradecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-methylpentane-2,4-diol",
                "2-methylpropane-1,2-diol",
                "2-phenyl-1,2-propanediol",
                "3-methylbutane-1,2-diol",
                "L-glycol",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butane-2,3-diol",
                "butanediol",
                "ethylene glycol",
                "glycol",
                "hexane-1,6-diol",
                "hexane-2,5-diol",
                "neopentyl glycol",
                "propane-1,3-diol",
                "propanediol",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "ethylene glycol (C2H6O2)",
            "1,2-propanediol (C3H8O2)",
            "1,3-propanediol (C3H8O2)",
            "1,2-butanediol (C4H10O2)",
            "1,3-butanediol (C4H10O2)",
            "1,4-butanediol (C4H10O2)",
            "2,3-butanediol (C4H10O2)",
            "1,2-pentanediol (C5H12O2)",
            "1,3-pentanediol (C5H12O2)",
            "1,4-pentanediol (C5H12O2)",
            "1,5-pentanediol (C5H12O2)",
            "2,3-pentanediol (C5H12O2)",
            "2,4-pentanediol (C5H12O2)",
            "3,4-pentanediol (C5H12O2)",
            "1,2-hexanediol (C6H14O2)",
            "1,3-hexanediol (C6H14O2)",
            "1,4-hexanediol (C6H14O2)",
            "1,5-hexanediol (C6H14O2)",
            "1,6-hexanediol (C6H14O2)",
            "2,3-hexanediol (C6H14O2)",
            "2,4-hexanediol (C6H14O2)",
            "2,5-hexanediol (C6H14O2)",
            "3,4-hexanediol (C6H14O2)",
            "3,5-hexanediol (C6H14O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethylene glycol (C2H6O2)",
                "1,3-propanediol (C3H8O2)"
            ],
            "mismatches": [
                "1,2-propanediol (C3H8O2)",
                "1,2-butanediol (C4H10O2)",
                "1,3-butanediol (C4H10O2)",
                "1,4-butanediol (C4H10O2)",
                "2,3-butanediol (C4H10O2)",
                "1,2-pentanediol (C5H12O2)",
                "1,3-pentanediol (C5H12O2)",
                "1,4-pentanediol (C5H12O2)",
                "1,5-pentanediol (C5H12O2)",
                "2,3-pentanediol (C5H12O2)",
                "2,4-pentanediol (C5H12O2)",
                "3,4-pentanediol (C5H12O2)",
                "1,2-hexanediol (C6H14O2)",
                "1,3-hexanediol (C6H14O2)",
                "1,4-hexanediol (C6H14O2)",
                "1,5-hexanediol (C6H14O2)",
                "1,6-hexanediol (C6H14O2)",
                "2,3-hexanediol (C6H14O2)",
                "2,4-hexanediol (C6H14O2)",
                "2,5-hexanediol (C6H14O2)",
                "3,4-hexanediol (C6H14O2)",
                "3,5-hexanediol (C6H14O2)"
            ],
            "true_referents": [
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(R)-propane-1,2-diol",
                "1,2-hexadecanediol",
                "1,2-tetradecanediol",
                "1,5-tetradecanediol",
                "1,6-dodecanediol",
                "2-methyl-1,2-butanediol",
                "2-methylene-1,4-butanediol",
                "2-phenyl-1,2-propanediol",
                "butanediol",
                "ethylene glycol",
                "glycol",
                "propane-1,3-diol",
                "propanediol"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Ethylene glycol (EG)",
            "Propylene glycol (PG)",
            "Butanediol (BD)",
            "Pentanediol (PD)",
            "Hexanediol (HD)",
            "Glycerol (GL)",
            "Erythritol (ER)",
            "Threitol (TR)",
            "Erythrulose (EL)",
            "Ribitol (RB)",
            "Arabitol (AB)",
            "Xylitol (XL)",
            "Mannitol (MT)",
            "Sorbitol (SB)",
            "Galactitol (GT)",
            "Inositol (IN)",
            "Deoxyribose (DR)",
            "Ribose (RB)",
            "Arabinose (AR)",
            "Xylose (XY)",
            "Galactose (GA)",
            "Glucose (GL)",
            "Mannose (MN)",
            "Fructose (FR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylene glycol (EG)",
                "Butanediol (BD)"
            ],
            "mismatches": [
                "Propylene glycol (PG)",
                "Pentanediol (PD)",
                "Hexanediol (HD)",
                "Glycerol (GL)",
                "Erythritol (ER)",
                "Threitol (TR)",
                "Erythrulose (EL)",
                "Ribitol (RB)",
                "Arabitol (AB)",
                "Xylitol (XL)",
                "Mannitol (MT)",
                "Sorbitol (SB)",
                "Galactitol (GT)",
                "Inositol (IN)",
                "Deoxyribose (DR)",
                "Ribose (RB)",
                "Arabinose (AR)",
                "Xylose (XY)",
                "Galactose (GA)",
                "Glucose (GL)",
                "Mannose (MN)",
                "Fructose (FR)"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(S)-styrene glycol",
                "1,2-hexadecanediol",
                "1,5-dodecanediol",
                "1,5-tetradecanediol",
                "1-(beta-D-xylosyl)-N-oleoylsphingosine",
                "1-O-dodecylglycerol",
                "2'-O-methylodoratol",
                "2-methyl-1,2-butanediol",
                "2alpha-acetoxy-28-acetylrubiarboside G",
                "5-(4,5-dihydroxypentyl)uracil",
                "8,5'-cyclo-2'-deoxyadenosine",
                "8,5'-cyclo-2'-deoxyguanosine",
                "L-1,4-dithiothreitol",
                "L-erythro-N-dodecanoylsphingosine",
                "L-erythro-sphingosine",
                "L-glycol",
                "N-tetracosadienoyl-D-galactosylsphingosine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphinganine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-glucosyl-(1<->1')-N-pentacosanoyl-14-methylhexadecasphingosine",
                "beta-D-glucosyl-(1<->1')-N-tricosanoyl-14-methylhexadecasphingosine",
                "beta-D-glucosyl-(1<->1')-N-tricosanoyl-15-methylhexadecasphinganine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butanediol",
                "butanediols",
                "dithioerythritol",
                "dodecanediol",
                "erythrodiol",
                "erythrono-1,4-lactone",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "inositol phosphodihydroceramide(1-)",
                "inositol phosphomannosylinositol-1-phosphodihydroceramide",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "rubiarbonone E 19-acetate",
                "rubiarboside G 28-acetate",
                "rubiarboside G 28-al",
                "triethylene glycol",
                "xylosyl-beta-D-ceramide(d18:1(4E))"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Glycerol (Glycerin)",
            "Erythritol",
            "Threitol",
            "Ribitol",
            "Arabitol",
            "Xylitol",
            "Dulcitol",
            "Galactitol",
            "Iditol",
            "Mannitol",
            "Sorbitol",
            "Inositol",
            "Cyclohexane-1,2-diol",
            "Cyclohexane-1,3-diol",
            "Cyclohexane-1,4-diol",
            "Cyclohexane-1,2,4-triol",
            "1,2,3-Propanetriol",
            "1,2,4-Butanetriol",
            "1,2,5-Pentanetriol",
            "1,2,6-Hexanetriol",
            "1,2,7-Heptanetriol",
            "1,2,8-Octanetriol",
            "1,2,9-Nonanetriol",
            "1,2,10-Decanetriol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclohexane-1,2-diol"
            ],
            "mismatches": [
                "Glycerol (Glycerin)",
                "Erythritol",
                "Threitol",
                "Ribitol",
                "Arabitol",
                "Xylitol",
                "Dulcitol",
                "Galactitol",
                "Iditol",
                "Mannitol",
                "Sorbitol",
                "Inositol",
                "Cyclohexane-1,3-diol",
                "Cyclohexane-1,4-diol",
                "Cyclohexane-1,2,4-triol",
                "1,2,3-Propanetriol",
                "1,2,4-Butanetriol",
                "1,2,5-Pentanetriol",
                "1,2,6-Hexanetriol",
                "1,2,7-Heptanetriol",
                "1,2,8-Octanetriol",
                "1,2,9-Nonanetriol",
                "1,2,10-Decanetriol"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R)-octane-1,2-diol",
                "(2R,5R)-hexanediol",
                "(2S, 3S, 4R)-2-[(2'R)-2'-hydroxyhexacosanoylamino]-1, 3, 4-octadecanetriol",
                "(2S, 3S, 4R)-2-[(2'R)-2'-hydroxypentacosanoylamino]-1, 3, 4-octadecanetriol",
                "(2S, 3S, 4R)-2-[(2'R)-2'-hydroxytricosanoylamino]-1, 3, 4-octadecanetriol",
                "(2S, 3S, 4R)-2-[(2R)-2-hydroxytetracosanoylamino]-1, 3, 4-octadecanetriol",
                "(R)-butane-1,3-diol",
                "1,2-diguaiacylpropane-1,3-diol",
                "1,3-diacetoxypropane",
                "1,4-dithiothreitol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "11-O-acetylcyathatriol",
                "2-methylpentane-2,4-diol",
                "2alpha-acetoxy-28-acetylrubiarboside G",
                "L-erythro-sphingosine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphinganine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butane-1,3-diol",
                "butane-1,4-diol",
                "butanediol",
                "cis-cyclohexane-1,2-diol",
                "cyclohex-3-ene-1,2-diol",
                "cyclohexane-1,2-diol",
                "dec-9-ene-1,2-diol",
                "decane-1,2-diol",
                "dithioerythritol",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "inositol phosphosphingolipid",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "octane-1,2-diol",
                "octane-1,8-diol",
                "odoratol",
                "propane-1,3-diol",
                "propane-1,3-diols",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "rubiarboside G 28-acetate",
                "rubiarboside G 28-al",
                "trans-cyclohexane-1,2-diol",
                "triethylene glycol"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            "Glycerol (GLY)",
            "Erythritol",
            "Threitol",
            "Arabitol",
            "Xylitol",
            "Ribitol",
            "Adonitol",
            "Ducitol",
            "Sorbitol",
            "Mannitol",
            "Galactitol",
            "Iditol",
            "Volemitol",
            "Isomaltol",
            "Dulcitol",
            "L-iditol",
            "Allitol",
            "Altitol",
            "Maltitol",
            "D-sorbitol",
            "L-sorbitol",
            "Myo-inositol",
            "Scyllo-inositol",
            "Chiro-inositol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Glycerol (GLY)",
                "Erythritol",
                "Threitol",
                "Arabitol",
                "Xylitol",
                "Ribitol",
                "Adonitol",
                "Ducitol",
                "Sorbitol",
                "Mannitol",
                "Galactitol",
                "Iditol",
                "Volemitol",
                "Isomaltol",
                "Dulcitol",
                "L-iditol",
                "Allitol",
                "Altitol",
                "Maltitol",
                "D-sorbitol",
                "L-sorbitol",
                "Myo-inositol",
                "Scyllo-inositol",
                "Chiro-inositol"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "1,2-diguaiacylpropane-1,3-diol",
                "1,3-diacetoxypropane",
                "1,4-dithiothreitol",
                "1-(beta-D-xylosyl)-N-oleoylsphingosine",
                "1-O-dodecylglycerol",
                "2'-O-methylodoratol",
                "2-methylene-1,4-butanediol",
                "2alpha-acetoxy-28-acetylrubiarboside G",
                "D-glucosylsphingosine",
                "DDT-2,3-dihydrodiol",
                "L-erythro-sphingosine",
                "L-glycol",
                "N-(2-hydroxyhexacosanoyl)phytosphingosine-1-phospho-(1D-myo-inositol)",
                "N-(2R-Hydroxyhexacosanoyl)-2S-amino-1,3S,4R-octadecanetriol",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphinganine",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1')-N-acylicosasphingosine",
                "beta-D-glucosyl-L-erythro-N-acylsphingosine",
                "butanediol",
                "dithioerythritol",
                "elongatol A",
                "elongatol E",
                "ethylene glycol",
                "ethylene glycol monophosphate",
                "glycol",
                "hexane-1,6-diol",
                "icosane-1,3-diol",
                "inositol phosphomannosylinositol-1-phospho-C20-phytoceramide",
                "inositol phosphomannosylinositol-1-phosphodihydroceramide",
                "inositol-1-phospho-N-acyl-(8E)-phytosphing-8-enine",
                "lavendiol",
                "octanediol",
                "odoratol",
                "propanediol",
                "rubianol-e 3-O-(6'-O-acetyl)-beta-D-glucopyranoside",
                "rubiarboside G 28-acetate",
                "rubiarboside G 28-al"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "diol",
        "domain": "chemistry",
        "response": [
            [
                "Referent",
                "Ethanol"
            ],
            [
                "Referent",
                "Propanol"
            ],
            [
                "Referent",
                "Butanol"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ethanol",
                "Propanol",
                "Butanol"
            ],
            "true_referents": [
                "(R)-butane-1,3-diol",
                "(R)-propane-1,2-diol",
                "butanediol",
                "ethylene glycol",
                "glycol",
                "propanediol"
            ],
            "TP": 0,
            "FP": 3,
            "FN": 0
        }
    }
]