[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "1,2,3-Propanetriol (Glycerol)",
            "1,2,3-Butanetriol",
            "1,2,4-Butanetriol",
            "1,2,3-Pentanetriol",
            "1,2,4-Pentanetriol",
            "1,2,5-Pentanetriol",
            "1,2,3-Hexanetriol",
            "1,2,4-Hexanetriol",
            "1,2,5-Hexanetriol",
            "1,2,6-Hexanetriol",
            "1,2,3-Heptanetriol",
            "1,2,4-Heptanetriol",
            "1,2,5-Heptanetriol",
            "1,2,6-Heptanetriol",
            "1,2,3-Octanetriol",
            "1,2,4-Octanetriol",
            "1,2,5-Octanetriol",
            "1,2,6-Octanetriol",
            "1,2,7-Octanetriol",
            "1,2,3-Nonanetriol",
            "1,2,4-Nonanetriol",
            "1,2,5-Nonanetriol",
            "1,2,6-Nonanetriol",
            "1,2,7-Nonanetriol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,3-Butanetriol",
                "1,2,4-Butanetriol"
            ],
            "mismatches": [
                "1,2,3-Propanetriol (Glycerol)",
                "1,2,3-Pentanetriol",
                "1,2,4-Pentanetriol",
                "1,2,5-Pentanetriol",
                "1,2,3-Hexanetriol",
                "1,2,4-Hexanetriol",
                "1,2,5-Hexanetriol",
                "1,2,6-Hexanetriol",
                "1,2,3-Heptanetriol",
                "1,2,4-Heptanetriol",
                "1,2,5-Heptanetriol",
                "1,2,6-Heptanetriol",
                "1,2,3-Octanetriol",
                "1,2,4-Octanetriol",
                "1,2,5-Octanetriol",
                "1,2,6-Octanetriol",
                "1,2,7-Octanetriol",
                "1,2,3-Nonanetriol",
                "1,2,4-Nonanetriol",
                "1,2,5-Nonanetriol",
                "1,2,6-Nonanetriol",
                "1,2,7-Nonanetriol"
            ],
            "true_referents": [
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol",
                "1-Octylglycerol",
                "2-amino-1,3,4-tetradecanetriol",
                "Glycerol 1-propanoate",
                "anisotanol A",
                "benzenetriol",
                "heptane-1,2,3-triol",
                "phytantriol"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (C3H8O3)",
            "Inositol (C6H12O6)",
            "Sorbitol (C6H14O6)",
            "Erythritol (C4H10O4)",
            "Mannitol (C6H14O6)",
            "Xylitol (C5H12O5)",
            "Ribitol (C5H12O5)",
            "Arabinitol (C5H12O5)",
            "Galactitol (C6H14O6)",
            "Dihydroxyacetone (C3H6O3)",
            "1,2,3-Propanetriol",
            "1,3,5-Trioxane",
            "1,3,6-Trioxocane",
            "1,2,4-Butanetriol",
            "1,3,5-Triol",
            "1,2,3-Butanetriol",
            "1,2,3-Propandiol",
            "1,3-Dihydroxy-2-propanone",
            "2,3,4-Trihydroxybutanal",
            "1,2,3-Trihydroxybenzene",
            "1,3,5-Trioxane-2,4-diol",
            "1,2,3-Trihydroxypropane",
            "3,4,5-Trihydroxybenzene-1,2-diol",
            "2,3,4-Trihydroxybutan-1-ol",
            "1,2,4-Trihydroxybenzene"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,3-Butanetriol",
                "1,2,4-Butanetriol",
                "1,2,3-Trihydroxybenzene",
                "Glycerol (C3H8O3)"
            ],
            "mismatches": [
                "Inositol (C6H12O6)",
                "Sorbitol (C6H14O6)",
                "Erythritol (C4H10O4)",
                "Mannitol (C6H14O6)",
                "Xylitol (C5H12O5)",
                "Ribitol (C5H12O5)",
                "Arabinitol (C5H12O5)",
                "Galactitol (C6H14O6)",
                "Dihydroxyacetone (C3H6O3)",
                "1,2,3-Propanetriol",
                "1,3,5-Trioxane",
                "1,3,6-Trioxocane",
                "1,3,5-Triol",
                "1,2,3-Propandiol",
                "1,3-Dihydroxy-2-propanone",
                "2,3,4-Trihydroxybutanal",
                "1,3,5-Trioxane-2,4-diol",
                "1,2,3-Trihydroxypropane",
                "3,4,5-Trihydroxybenzene-1,2-diol",
                "2,3,4-Trihydroxybutan-1-ol"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R)-2,3-Dihydroxypropyl nonadecanoate",
                "(2R,3R)-heptane-1,2,3-triol",
                "(4xi)-2-O-(4-hydroxybenzoyl)-6-O-(3,4,5-trihydroxybenzoyl)-D-ribo-hexopyranose",
                "(R)-glycerol 1-acetate",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,5-anhydro-D-fructose",
                "1-(1,2-dihexanoylphosphatidyl)inositol-5-phosphate",
                "1-(1,2-dioctanoylphosphatidyl)inositol",
                "1-O-(2-O-alpha-D-galactopyranosyl-alpha-D-glucopyranosyl)-glycerol",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-erucoylglycerol",
                "1-phosphatidyl-1D-myo-inositol 4,5-bisphosphate",
                "2,2,4-trihydroxybutanoic acid",
                "2,3,4-trihydroxbenzophenone",
                "2,3,4-trihydroxypentanoic acid",
                "2,3-dihydroxypropyl heptadecanoate",
                "2,3-dihydroxypropylicos-11-enoate",
                "2,4,5-Trihydroxytoluene",
                "2,4,5-trihydroxyphenylacetic acid",
                "2,4,6-trihydroxybenzaldehyde",
                "2,4,6-trihydroxybenzophenone",
                "2,6-O-bis(alpha-D-mannopyranosyl)-1-phosphatidyl-1D-myo-inositol",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "3-Methoxy-1,2-propanediol",
                "5alpha-androstane-3beta,6alpha,17beta-triol",
                "5alpha-androstane-3beta,7alpha,17beta-triol",
                "androst-5-ene-3beta,7alpha,17beta-triol",
                "arabidopside A",
                "benzene-1,2,3,4,5-pentol",
                "benzene-1,2,4-triol",
                "benzenetriol",
                "glycerol",
                "heptane-1,2,3-triol",
                "rubiarbonol A 3-O-beta-D-glucopyranosyl-(1->2)-beta-D-glucopyranoside"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "1,2,3-Triol (Glycerol)",
            "1,2,4-Butanetriol",
            "1,3,5-Pentanetriol",
            "2,3,4-Pentanetriol",
            "1,2,3-Propantriol",
            "1,3,5-Trihydroxybenzene (Phloroglucinol)",
            "1,2,3-Trihydroxypropane",
            "1,2,4-Trihydroxybutane",
            "1,2,3-Trihydroxycyclohexane",
            "1,2,4-Trihydroxycyclohexane",
            "1,3,5-Trihydroxycyclohexane",
            "1,2,3,4-Tetrahydroxybutane",
            "1,2,3,4,5-Pentahydroxypentane",
            "1,2,3,4,5,6-Hexahydroxyhexane",
            "1,2,3-Trihydroxy-4-methylpentane",
            "1,2,3-Trihydroxy-5-methylhexane",
            "1,2,3-Trihydroxy-6-methylheptane",
            "1,2,3-Trihydroxy-7-methyloctane",
            "1,2,3-Trihydroxy-8-methylnonane",
            "1,2,3-Trihydroxy-9-methyldecane",
            "1,2,3-Trihydroxy-10-methyldecane",
            "1,2,3-Trihydroxy-11-methyldodecane",
            "1,2,3-Trihydroxy-12-methyldodecane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,4-Butanetriol",
                "1,3,5-Pentanetriol",
                "phloroglucinol"
            ],
            "mismatches": [
                "1,2,3-Triol (Glycerol)",
                "2,3,4-Pentanetriol",
                "1,2,3-Propantriol",
                "1,2,3-Trihydroxypropane",
                "1,2,4-Trihydroxybutane",
                "1,2,3-Trihydroxycyclohexane",
                "1,2,4-Trihydroxycyclohexane",
                "1,3,5-Trihydroxycyclohexane",
                "1,2,3,4-Tetrahydroxybutane",
                "1,2,3,4,5-Pentahydroxypentane",
                "1,2,3,4,5,6-Hexahydroxyhexane",
                "1,2,3-Trihydroxy-4-methylpentane",
                "1,2,3-Trihydroxy-5-methylhexane",
                "1,2,3-Trihydroxy-6-methylheptane",
                "1,2,3-Trihydroxy-7-methyloctane",
                "1,2,3-Trihydroxy-8-methylnonane",
                "1,2,3-Trihydroxy-9-methyldecane",
                "1,2,3-Trihydroxy-10-methyldecane",
                "1,2,3-Trihydroxy-11-methyldodecane",
                "1,2,3-Trihydroxy-12-methyldodecane"
            ],
            "true_referents": [
                "(2R,3R)-heptane-1,2,3-triol",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol",
                "1-Hydroxy-3-(octanoyloxy)propan-2-yl decanoate",
                "2',4',6'-trihydroxyacetophenone",
                "2,2,4-trihydroxybutanoic acid",
                "2,3,4-trihydroxbenzophenone",
                "2,3,4-trihydroxypentanoic acid",
                "2,3-dihydroxypropyl 12-methyltridecanoate",
                "2,3-dihydroxypropyl heptadecanoate",
                "2,4,5-Trihydroxytoluene",
                "2,4,6-trihydroxybenzaldehyde",
                "2,4,6-trihydroxyphenylhexan-1-one",
                "2-acyl-4,6-diprenylphloroglucinol",
                "2-amino-1,3,4-tetradecanetriol",
                "5alpha-androstane-3beta,6alpha,17beta-triol",
                "benzenetriol",
                "heptane-1,2,3-triol",
                "methyl 3,4,5-trihydroxybenzoate",
                "phloroglucinol",
                "phytantriol"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (GLY)",
            "Mannitol (MNL)",
            "Sorbitol (SOR)",
            "Xylitol (XYL)",
            "Erythritol (ERY)",
            "Dulcitol (DUC)",
            "Galactitol (GAL)",
            "Inositol (INS)",
            "Quercitol (QCT)",
            "Ribitol (RIB)",
            "Myo-inositol phosphate (MIP)",
            "Phytic acid (IP6)",
            "Trehalose (TRE)",
            "Raffinose (RAF)",
            "Melibiose (MEL)",
            "Stachyose (STA)",
            "Fucose (FUC)",
            "Rhamnose (RHA)",
            "Sedoheptulose (SED)",
            "Psicose (PSI)",
            "Tagatose (TAG)",
            "Altrulose (ALT)",
            "Iditol (IDI)",
            "Volitol (VOL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "glycerol"
            ],
            "mismatches": [
                "Mannitol (MNL)",
                "Sorbitol (SOR)",
                "Xylitol (XYL)",
                "Erythritol (ERY)",
                "Dulcitol (DUC)",
                "Galactitol (GAL)",
                "Inositol (INS)",
                "Quercitol (QCT)",
                "Ribitol (RIB)",
                "Myo-inositol phosphate (MIP)",
                "Phytic acid (IP6)",
                "Trehalose (TRE)",
                "Raffinose (RAF)",
                "Melibiose (MEL)",
                "Stachyose (STA)",
                "Fucose (FUC)",
                "Rhamnose (RHA)",
                "Sedoheptulose (SED)",
                "Psicose (PSI)",
                "Tagatose (TAG)",
                "Altrulose (ALT)",
                "Iditol (IDI)",
                "Volitol (VOL)"
            ],
            "true_referents": [
                "(R)-edelfosine",
                "(S)-edelfosine",
                "1,3,5-pentanetriol",
                "1,5-anhydro-D-fructose",
                "1-(1,2-dihexanoylphosphatidyl)inositol-5-phosphate",
                "1-(1,2-dioctanoylphosphatidyl)inositol",
                "1-(D-glucopyranosyloxy)-3-hydroxypropan-2-yl D-galactopyranoside",
                "1-(D-glucopyranosyloxy)-3-hydroxypropan-2-yl L-fucopyranoside",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-archaetidyl-D-myo-inositol",
                "1-erucoylglycerol",
                "1-phosphatidyl-1D-myo-inositol 3,5-bisphosphate",
                "1-phosphatidyl-1D-myo-inositol 3-phosphate",
                "1-phosphatidyl-1D-myo-inositol 5-phosphate",
                "2',3'-secoguanosine",
                "2,6-O-bis(alpha-D-mannopyranosyl)-1-phosphatidyl-1D-myo-inositol",
                "2-(D-glucopyranosyloxy)-3-hydroxypropyl L-fucopyranoside",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-O-(alpha-D-mannopyranosyl)-1-phosphatidyl-1D-myo-inositol",
                "2-O-(beta-D-glucosyl)glycerol",
                "2-deoxypentose",
                "2alpha,3beta,23alpha-trihydroxyurs-12-en-28-oic acid 28-O-beta-D-glucopyranoside",
                "N-(2R-Hydroxyhexacosanoyl)-2S-amino-1,3S,4R-octadecanetriol",
                "POB-PE",
                "PON-PE",
                "Sphingofungin D",
                "TAG(18:3n3/14:0/22:6n3)",
                "angelitriol",
                "aurafuron A",
                "batilol",
                "benzene-1,2,3,4,5-pentol",
                "beta-D-erythrofuranose",
                "beta-chrysopine",
                "deoxycohumulone",
                "desmethylxanthohumol",
                "fruticoside A",
                "galactosylglycerol",
                "glyceride",
                "glycerol",
                "glycerol phosphate",
                "mono-beta-D-galactosyl diacylglycerol",
                "phosphatidic acid",
                "phosphatidic acid (16:0/18:1)",
                "phosphatidylinositol mannoside",
                "pyriculol",
                "quercetin 3-O-(2'',3''-digalloyl)-beta-D-galactopyranoside",
                "rel-2alpha,3alpha,23-trihydroxy-19-oxo-18,19-seco-urs-11,13(18)-dien-28-oic acid",
                "rubiarbonol A 3-O-beta-D-glucopyranosyl-(1->2)-beta-D-glucopyranoside",
                "rubiarbonol A 7-acetate",
                "rubiarbonol L"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (C3H8O3)",
            "1,2,3-Propanetriol",
            "1,2,3-Butanetriol",
            "1,2,4-Butanetriol",
            "1,3,5-Cyclohexanetriol",
            "1,2,3-Cyclopropanetriol",
            "1,2,3-Cyclopentanetriol",
            "1,2,3-Cycloheptanetriol",
            "1,2,3-Cyclooctanetriol",
            "1,2,3-Cyclononanetriol",
            "1,2,3-Cyclodecanetriol",
            "1,2,3-Cycloundecanetriol",
            "1,2,3-Cyclododecanetriol",
            "1,2,3-Cyclotridecanetriol",
            "1,2,3-Cyclotetradecanetriol",
            "1,2,3-Cyclopentadecanetriol",
            "1,2,3-Cyclohexadecanetriol",
            "1,2,3-Cycloheptadecanetriol",
            "1,2,3-Cyclooctadecanetriol",
            "1,2,3-Cyclononadecanetriol",
            "1,2,3-Cycloeicosanetriol",
            "1,2,3-Cycloheneicosanetriol",
            "1,2,3-Cyclodocosanetriol",
            "1,2,3-Cyclotricosanetriol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,3-Butanetriol",
                "1,2,4-Butanetriol",
                "glycerol"
            ],
            "mismatches": [
                "1,2,3-Propanetriol",
                "1,3,5-Cyclohexanetriol",
                "1,2,3-Cyclopropanetriol",
                "1,2,3-Cyclopentanetriol",
                "1,2,3-Cycloheptanetriol",
                "1,2,3-Cyclooctanetriol",
                "1,2,3-Cyclononanetriol",
                "1,2,3-Cyclodecanetriol",
                "1,2,3-Cycloundecanetriol",
                "1,2,3-Cyclododecanetriol",
                "1,2,3-Cyclotridecanetriol",
                "1,2,3-Cyclotetradecanetriol",
                "1,2,3-Cyclopentadecanetriol",
                "1,2,3-Cyclohexadecanetriol",
                "1,2,3-Cycloheptadecanetriol",
                "1,2,3-Cyclooctadecanetriol",
                "1,2,3-Cyclononadecanetriol",
                "1,2,3-Cycloeicosanetriol",
                "1,2,3-Cycloheneicosanetriol",
                "1,2,3-Cyclodocosanetriol",
                "1,2,3-Cyclotricosanetriol"
            ],
            "true_referents": [
                "(2S, 3S, 4R)-2-[(2'R)-2'-hydroxypentacosanoylamino]-1, 3, 4-octadecanetriol",
                "(2S, 3S, 4R)-2-[(2R)-2-hydroxytetracosanoylamino]-1, 3, 4-octadecanetriol",
                "(R)-glycerol 1-acetate",
                "1,2,3-Tris(1-ethoxyethoxy)propane",
                "1,2,3-butanetriol",
                "1,2,3-trilinolenoylglycerol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol",
                "11-O-acetylcyathatriol",
                "2-amino-1,3,4-tetradecanetriol",
                "3-Methoxy-1,2-propanediol",
                "benzenetriol",
                "cyathatriol",
                "glycerol",
                "heptane-1,2,3-triol",
                "phytantriol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (C3H8O3)",
            "1,2,3-Propanetriol (C3H8O3)",
            "Glycerin (C3H8O3)",
            "Ribitol (C5H12O5)",
            "Arabitol (C5H12O5)",
            "Xylitol (C5H12O5)",
            "Mannitol (C6H14O6)",
            "Sorbitol (C6H14O6)",
            "Galactitol (C6H14O6)",
            "Dulcitol (C6H14O6)",
            "Inositol (C6H12O6)",
            "Triacetin (C9H14O5)",
            "Trimethylolpropane (C6H14O3)",
            "1,2,3-Butanetriol (C4H10O3)",
            "1,2,4-Butanetriol (C4H10O3)",
            "1,2,3-Pentanetriol (C5H12O3)",
            "1,2,3-Hexanetriol (C6H14O3)",
            "1,2,3-Butanetriol (C4H10O3)",
            "1,2,3-Cyclopropanetriol (C6H10O3)",
            "1,2,3-Propane-1,2,3-triol (C3H8O3)",
            "1,2,3-Pentanetriol (C5H12O3)",
            "1,2,3-Hexanetriol (C6H14O3)",
            "1,2,3-Octanetriol (C8H18O3)",
            "1,2,3-Nonanetriol (C9H20O3)",
            "1,2,3-Decanetriol (C10H22O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "glycerol",
                "triacetin",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol"
            ],
            "mismatches": [
                "1,2,3-propanetriol",
                "glycerin",
                "ribitol",
                "arabitol",
                "xylitol",
                "mannitol",
                "sorbitol",
                "galactitol",
                "dulcitol",
                "inositol",
                "trimethylolpropane",
                "1,2,3-pentanetriol",
                "1,2,3-hexanetriol",
                "1,2,3-cyclopropanetriol",
                "1,2,3-propane-1,2,3-triol",
                "1,2,3-octanetriol",
                "1,2,3-nonanetriol",
                "1,2,3-decanetriol"
            ],
            "true_referents": [
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(2R,3R)-heptane-1,2,3-triol",
                "(2S, 3S, 4R)-2-[(2R)-2-hydroxytetracosanoylamino]-1, 3, 4-octadecanetriol",
                "(4xi)-2-O-(4-hydroxybenzoyl)-6-O-(3,4,5-trihydroxybenzoyl)-D-ribo-hexopyranose",
                "(R)-glycerol 1-acetate",
                "1,2,3-Tris(1-ethoxyethoxy)propane",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,2-di-(13-methyltetradecanoyl)-3-(13-methyltetradecyl)glycerol",
                "1,3,5-pentanetriol",
                "1,5-anhydro-D-fructose",
                "1-(1,2-dihexanoylphosphatidyl)inositol-5-phosphate",
                "1-(1,2-dioctanoylphosphatidyl)inositol",
                "1-Hydroxy-3-(octanoyloxy)propan-2-yl decanoate",
                "1-O-(2-O-alpha-D-galactopyranosyl-alpha-D-glucopyranosyl)-glycerol",
                "1-O-(4-O-alpha-D-glucoopyranosyl-beta-D-galactopyranosyl)-glycerol",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-phosphatidyl-1D-myo-inositol 4,5-bisphosphate",
                "2,6-O-bis(alpha-D-mannopyranosyl)-1-phosphatidyl-1D-myo-inositol",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-acyl-4,6-diprenylphloroglucinol",
                "2-amino-1,3,4-tetradecanetriol",
                "6-pentadecylbenzene-1,2,4-triol",
                "arabidopside A",
                "benzene-1,2,4-triol",
                "benzenetriol",
                "glycerol",
                "heptane-1,2,3-triol",
                "rubiarbonol A 3-O-beta-D-glucopyranosyl-(1->2)-beta-D-glucopyranoside",
                "triacetin",
                "tricin 4'-O-(erythro-beta-guaiacylglyceryl) ether 9''-O-beta-D-glucopyranoside"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (Gly)",
            "Erythritol (Ery)",
            "Threitol (Thr)",
            "Pentaerythritol (Pent)",
            "1,2,3-Propanetriol (123-Pro)",
            "1,2,4-Butanetriol (124-But)",
            "1,2,3-Butanetriol (123-But)",
            "1,2,3-Pentanetriol (123-Pent)",
            "2,3,4-Pentanetriol (234-Pent)",
            "1,2,3-Hexanetriol (123-Hex)",
            "1,2,4-Hexanetriol (124-Hex)",
            "1,3,5-Hexanetriol (135-Hex)",
            "1,2,3-Heptanetriol (123-Hept)",
            "1,2,4-Heptanetriol (124-Hept)",
            "1,3,5-Heptanetriol (135-Hept)",
            "1,2,3-Octanetriol (123-Oct)",
            "1,2,4-Octanetriol (124-Oct)",
            "1,3,5-Octanetriol (135-Oct)",
            "1,2,3-Nonanetriol (123-Non)",
            "1,2,4-Nonanetriol (124-Non)",
            "1,3,5-Nonanetriol (135-Non)",
            "1,2,3-Decanetriol (123-Dec)",
            "1,2,4-Decanetriol (124-Dec)",
            "1,3,5-Decanetriol (135-Dec)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,3-Butanetriol",
                "1,2,4-Butanetriol",
                "1,2,3-Heptanetriol",
                "Glycerol"
            ],
            "mismatches": [
                "Erythritol",
                "Threitol",
                "Pentaerythritol",
                "1,2,3-Propanetriol",
                "1,2,3-Pentanetriol",
                "2,3,4-Pentanetriol",
                "1,2,3-Hexanetriol",
                "1,2,4-Hexanetriol",
                "1,3,5-Hexanetriol",
                "1,2,4-Heptanetriol",
                "1,3,5-Heptanetriol",
                "1,2,3-Octanetriol",
                "1,2,4-Octanetriol",
                "1,3,5-Octanetriol",
                "1,2,3-Nonanetriol",
                "1,2,4-Nonanetriol",
                "1,3,5-Nonanetriol",
                "1,2,3-Decanetriol",
                "1,2,4-Decanetriol",
                "1,3,5-Decanetriol"
            ],
            "true_referents": [
                "(2R,3R)-heptane-1,2,3-triol",
                "(2S, 3S, 4R)-2-[(2R)-2-hydroxytetracosanoylamino]-1, 3, 4-octadecanetriol",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol",
                "1-Octylglycerol",
                "1-decanoyl-3-oleoylglycerol",
                "1-erucoylglycerol",
                "2,4,5-Trimethoxytoluene",
                "2-amino-1,3,4-tetradecanetriol",
                "3-Methoxy-1,2-propanediol",
                "Ins-1-P-Cer(t18:0/2-OH-24:0)",
                "N-threonyl-glycosylphosphatidylinositolethanolamine",
                "benzene-1,2,3,4,5-pentol",
                "benzenetriol",
                "glyceride",
                "glycerol",
                "glycerol phosphate",
                "heptane-1,2,3-triol",
                "thiomarinol G"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol",
            "1,2,3-Propanetriol",
            "Erythritol",
            "1,2,4-Butanetriol",
            "1,2,3-Butanetriol",
            "1,2,3-Hexanetriol",
            "1,2,3-Pentanetriol",
            "1,2,3-Heptanetriol",
            "1,2,3-Octanetriol",
            "1,2,3-Nonanetriol",
            "1,2,3-Decanetriol",
            "1,2,3-Undecanetriol",
            "1,2,3-Dodecanetriol",
            "1,2,3-Tridecanetriol",
            "1,2,3-Tetradecanetriol",
            "1,2,3-Pentadecanetriol",
            "1,2,3-Hexadecanetriol",
            "1,2,3-Heptadecanetriol",
            "1,2,3-Octadecanetriol",
            "1,2,3-Nonadecanetriol",
            "1,2,3-Eicosanetriol",
            "1,2,3-Docosanetriol",
            "1,2,3-Tetracosanetriol",
            "1,2,3-Hexacosanetriol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycerol",
                "1,2,4-Butanetriol",
                "1,2,3-Butanetriol"
            ],
            "mismatches": [
                "1,2,3-Propanetriol",
                "Erythritol",
                "1,2,3-Hexanetriol",
                "1,2,3-Pentanetriol",
                "1,2,3-Heptanetriol",
                "1,2,3-Octanetriol",
                "1,2,3-Nonanetriol",
                "1,2,3-Decanetriol",
                "1,2,3-Undecanetriol",
                "1,2,3-Dodecanetriol",
                "1,2,3-Tridecanetriol",
                "1,2,3-Tetradecanetriol",
                "1,2,3-Pentadecanetriol",
                "1,2,3-Hexadecanetriol",
                "1,2,3-Heptadecanetriol",
                "1,2,3-Octadecanetriol",
                "1,2,3-Nonadecanetriol",
                "1,2,3-Eicosanetriol",
                "1,2,3-Docosanetriol",
                "1,2,3-Tetracosanetriol",
                "1,2,3-Hexacosanetriol"
            ],
            "true_referents": [
                "(2S, 3S, 4R)-2-[(2R)-2-hydroxytetracosanoylamino]-1, 3, 4-octadecanetriol",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,2-diicosatetraenoyl-3-docosahexaenoyl-sn-glycerol",
                "1,3,5-pentanetriol",
                "1-Eicosadienoyl-2-docosahexaenoyl-sn-glycero-3-phosphoethanolamine",
                "1-decanoyl-3-oleoylglycerol",
                "1-erucoylglycerol",
                "1-octadecanoyl-2-eicosanoyl-sn-glycero-3-phosphoethanolamine",
                "1-tetracosanoylglycerol",
                "2-amino-1,3,4-tetradecanetriol",
                "3-Methoxy-1,2-propanediol",
                "N-(2R-Hydroxyhexacosanoyl)-2S-amino-1,3S,4R-octadecanetriol",
                "benzenetriol",
                "diglycerol",
                "glyceride",
                "glycerol",
                "heptane-1,2,3-triol",
                "phytantriol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "triol",
        "domain": "chemistry",
        "response": "",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (1,2,3-Propanetriol)",
            "Butanetriol (1,2,3-Butanetriol)",
            "Pentanetriol (1,2,3-Pentanetriol)",
            "Hexanetriol (1,2,6-Hexanetriol)",
            "Trimethylolpropane (TMP)",
            "Trimethylolethane (TME)",
            "Phloroglucinol (1,3,5-Trihydroxybenzene)",
            "Pyrogallol (1,2,3-Trihydroxybenzene)",
            "Hydroxytyrosol (3,4-DHPEA-EtOH)",
            "Gallic acid (3,4,5-Trihydroxybenzoic acid)",
            "Epigallocatechin (EGC)",
            "Epicatechin gallate (ECG)",
            "Epigallocatechin gallate (EGCG)",
            "Myo-inositol",
            "Pinacol (2,3-Dimethyl-2,3-butanediol)",
            "Glyceraldehyde",
            "Dihydroxyacetone (DHA)",
            "Erythritol",
            "Xylitol",
            "Sorbitol",
            "Mannitol",
            "Inositol",
            "Propane-1,2,3-triol",
            "Butane-1,2,3-triol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "phloroglucinol",
                "pyrogallol",
                "glycerol",
                "1,2,3-butanetriol"
            ],
            "mismatches": [
                "Glycerol (1,2,3-Propanetriol)",
                "Pentanetriol (1,2,3-Pentanetriol)",
                "Hexanetriol (1,2,6-Hexanetriol)",
                "Trimethylolpropane (TMP)",
                "Trimethylolethane (TME)",
                "Hydroxytyrosol (3,4-DHPEA-EtOH)",
                "Gallic acid (3,4,5-Trihydroxybenzoic acid)",
                "Epigallocatechin (EGC)",
                "Epicatechin gallate (ECG)",
                "Epigallocatechin gallate (EGCG)",
                "Myo-inositol",
                "Pinacol (2,3-Dimethyl-2,3-butanediol)",
                "Glyceraldehyde",
                "Dihydroxyacetone (DHA)",
                "Erythritol",
                "Xylitol",
                "Sorbitol",
                "Mannitol",
                "Inositol",
                "Propane-1,2,3-triol",
                "Butane-1,2,3-triol"
            ],
            "true_referents": [
                "(+)-catechin-3-O-gallate",
                "(+)-epicatechin-3-O-gallate",
                "(-)-catechin-3-O-gallate",
                "(-)-epicatechin-3-O-gallate",
                "(-)-epicatechin-5-gallate",
                "(-)-epigallocatechin 3-gallate",
                "(2R,3R)-heptane-1,2,3-triol",
                "(R)-glycerol 1-acetate",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol",
                "1-(1,2-dioctanoylphosphatidyl)inositol",
                "1-(D-glucopyranosyloxy)-3-hydroxypropan-2-yl D-galactopyranoside",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-archaetidyl-D-myo-inositol",
                "1-erucoylglycerol",
                "1-phosphatidyl-1D-myo-inositol",
                "2,3-dihydroxypropyl heptadecanoate",
                "2,4,5-Trimethoxytoluene",
                "2,4,6-trihydroxybenzaldehyde",
                "2-acyl-4,6-diprenylphloroglucinol",
                "2-amino-1,3,4-tetradecanetriol",
                "2alpha,3alpha,23-trihydroxyolean-12-en-28-oic acid",
                "3-(Acetyloxy)-2-hydroxypropyl octadecanoate",
                "3-Methoxy-1,2-propanediol",
                "3-O-(alpha-L-oleandrosyl)oleandolide",
                "C-glycosylphytoceramide",
                "alkylglycerol",
                "benzene-1,2,4-triol",
                "benzenetriol",
                "diacylglycerol 2-trimethylaminoethylphosphonate",
                "diphosphatidyl propylene glycol",
                "epicatechin 3-O-(3'-O-methylgallate)",
                "glycerol",
                "glycophytoceramide",
                "glycosylglycerol",
                "heptane-1,2,3-triol",
                "phloroglucinol",
                "phosphatidylinositol",
                "phosphatidylinositol mannoside",
                "phosphoinositide",
                "phytantriol",
                "pyriculol",
                "pyrogallol",
                "triethanolamine"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (propane-1,2,3-triol)",
            "1,2,4-Butanetriol",
            "2-Hydroxymethyl-1,3-propanediol",
            "1,2,6-Hexanetriol",
            "3-Methyl-1,3,5-pentanetriol",
            "1,2,3-Pentanetriol",
            "2-Ethyl-2-(hydroxymethyl)-1,3-propanediol",
            "2,2-Bis(hydroxymethyl)-1,3-propanediol",
            "1,2,3-Heptanetriol",
            "2,2-Dimethyl-1,3-propanediol (neopentyl glycol)",
            "Trimethylolpropane (TMP)",
            "2-Amino-2-(hydroxymethyl)-1,3-propanediol (TRIS)",
            "Phloroglucinol (1,3,5-trihydroxybenzene)",
            "Pyrogallol (1,2,3-trihydroxybenzene)",
            "Hydroxyhydroquinone (1,2,4-trihydroxybenzene)",
            "3,4,5-Trihydroxybenzoic acid (gallic acid)",
            "2,3,4-Trihydroxybutyric acid (erythronic acid)",
            "2,3,5-Trihydroxyhexanoic acid",
            "2,4,5-Trihydroxypentanoic acid (apionic acid)",
            "3,7,11,15-Tetramethyl-1,2,3-hexadecanetriol (phytantriol)",
            "2-C-Methyl-D-erythritol",
            "Panthenol (provitamin B5)",
            "Tromethamine (THAM)",
            "Serinol (2-amino-1,3-propanediol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,4-Butanetriol",
                "Phloroglucinol (1,3,5-trihydroxybenzene)",
                "Pyrogallol (1,2,3-trihydroxybenzene)",
                "2,3,4-Trihydroxybutyric acid (erythronic acid)",
                "3,7,11,15-Tetramethyl-1,2,3-hexadecanetriol (phytantriol)"
            ],
            "mismatches": [
                "Glycerol (propane-1,2,3-triol)",
                "2-Hydroxymethyl-1,3-propanediol",
                "1,2,6-Hexanetriol",
                "3-Methyl-1,3,5-pentanetriol",
                "1,2,3-Pentanetriol",
                "2-Ethyl-2-(hydroxymethyl)-1,3-propanediol",
                "2,2-Bis(hydroxymethyl)-1,3-propanediol",
                "1,2,3-Heptanetriol",
                "2,2-Dimethyl-1,3-propanediol (neopentyl glycol)",
                "Trimethylolpropane (TMP)",
                "2-Amino-2-(hydroxymethyl)-1,3-propanediol (TRIS)",
                "Hydroxyhydroquinone (1,2,4-trihydroxybenzene)",
                "3,4,5-Trihydroxybenzoic acid (gallic acid)",
                "2,3,5-Trihydroxyhexanoic acid",
                "2,4,5-Trihydroxypentanoic acid (apionic acid)",
                "2-C-Methyl-D-erythritol",
                "Panthenol (provitamin B5)",
                "Tromethamine (THAM)",
                "Serinol (2-amino-1,3-propanediol)"
            ],
            "true_referents": [
                "(-)-catechin-3-O-gallate",
                "(2S, 3S, 4R)-2-[(2'R)-2'-hydroxypentacosanoylamino]-1, 3, 4-octadecanetriol",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "1,3,5-pentanetriol",
                "1-alkyl-2,3-diacylglycerol",
                "1-erucoylglycerol",
                "1-lauroyl-2-oleoyl-sn-glycerol",
                "2,2,4-trihydroxybutanoic acid",
                "2,3,4-trihydroxbenzophenone",
                "2,3,4-trihydroxypentanoic acid",
                "2,3-dihydroxypropyl (Z)-10-methyloctadec-9-enoate",
                "2,3-dihydroxypropyl 12-methyltridecanoate",
                "2,3-dilinolenoyl-sn-glycerol",
                "2,3-dilinoleoyl-sn-glycerol",
                "2,4,5-Trimethoxytoluene",
                "2,4,5-trihydroxyphenylacetic acid",
                "2,4,6-trihydroxybenzaldehyde",
                "2,4,6-trihydroxybenzophenone",
                "2,5-dihydroxy-3-phenyl-6-(3,4,5-trihydroxyphenyl)-1,4-benzoquinone",
                "2-acyl-4,6-diprenylphloroglucinol",
                "2-amino-1,3,4-tetradecanetriol",
                "3-(4-Hydroxy-3-methoxyphenyl)-1,2-propanediol 2-O-(galloyl-glucoside)",
                "3-Methoxy-1,2-propanediol",
                "9,10,18-trihydroxyoctadecanoic acid",
                "Glycerol 1-propanoate",
                "N-tris(hydroxymethyl)methylglycine",
                "alkylglycerol",
                "benzenetriol",
                "diacylglycerol 2-trimethylaminoethylphosphonate",
                "glycerol",
                "heptane-1,2,3-triol",
                "phloroglucinol",
                "phosphatidyl-N,N-dimethylethanolamine",
                "phytantriol",
                "pyriculol",
                "pyrogallol",
                "thiomarinol G",
                "triethanolamine"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (C3H8O3)",
            "Erythritol (C4H10O4)",
            "Threitol (C4H10O3)",
            "Ribitol (C5H12O5)",
            "Xylitol (C5H12O5)",
            "Arabitol (C5H12O5)",
            "Mannitol (C6H14O6)",
            "Galactitol (C6H14O6)",
            "Iditol (C6H14O6)",
            "Allitol (C6H14O6)",
            "Dulcitol (C6H14O6)",
            "Sorbitol (C6H14O6)",
            "myo-Inositol (C6H12O6)",
            "scyllo-Inositol (C6H12O6)",
            "muco-Inositol (C6H12O6)",
            "epi-Inositol (C6H12O6)",
            "cis-Inositol (C6H12O6)",
            "allo-Inositol (C6H12O6)",
            "Perseitol (C7H16O7)",
            "Volemitol (C7H16O7)",
            "Glycero-D-gulo-heptitol (C7H16O7)",
            "Sedoheptitol (C7H16O7)",
            "D-Glycero-D-manno-heptitol (C7H16O7)",
            "D-Glycero-L-manno-heptitol (C7H16O7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "glycerol"
            ],
            "mismatches": [
                "Erythritol",
                "Threitol",
                "Ribitol",
                "Xylitol",
                "Arabitol",
                "Mannitol",
                "Galactitol",
                "Iditol",
                "Allitol",
                "Dulcitol",
                "Sorbitol",
                "myo-Inositol",
                "scyllo-Inositol",
                "muco-Inositol",
                "epi-Inositol",
                "cis-Inositol",
                "allo-Inositol",
                "Perseitol",
                "Volemitol",
                "Glycero-D-gulo-heptitol",
                "Sedoheptitol",
                "D-Glycero-D-manno-heptitol",
                "D-Glycero-L-manno-heptitol"
            ],
            "true_referents": [
                "(+)-(7S,8S)-guaiacylglycerol-beta-vanillic acid ether",
                "(1R)-1,5-anhydro-1-[(3S,4S,5R)-3-(hexacosanoylamino)-4,5-dihydroxynonadecyl]-D-galactitol",
                "(4xi)-2-O-(4-hydroxybenzoyl)-6-O-(3,4,5-trihydroxybenzoyl)-D-ribo-hexopyranose",
                "(R)-glycerol 1-acetate",
                "1,3,5-pentanetriol",
                "1,5-anhydro-D-fructose",
                "1-(1,2-dioctanoylphosphatidyl)inositol",
                "1-O-(2-O-alpha-D-galactopyranosyl-alpha-D-glucopyranosyl)-glycerol",
                "1-O-(4-O-alpha-D-glucoopyranosyl-beta-D-galactopyranosyl)-glycerol",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(alpha-D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-archaetidyl-D-myo-inositol",
                "1-erucoylglycerol",
                "1-monohexosyl-2,3-diacylglycerol",
                "1-octanoyl-3-(beta-D-galactosyl)-sn-glycerol",
                "1-phosphatidyl-1D-myo-inositol",
                "2,6-O-bis(alpha-D-mannopyranosyl)-1-phosphatidyl-1D-myo-inositol",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-acyl-4,6-diprenylphloroglucinol",
                "6-(N-acetyl-alpha-D-glucosaminyl)-1-phosphatidyl-1D-myo-inositol",
                "6-(alpha-D-glucosaminyl)-1-phosphatidyl-1D-myo-inositol",
                "6-O-(N-acetyl-D-glucosaminyl)-1-phosphatidyl-1D-myo-inositol",
                "N-(2R-Hydroxyhexacosanoyl)-2S-amino-1,3S,4R-octadecanetriol",
                "arabidopside A",
                "benzene-1,2,3,4,5-pentol",
                "benzene-1,2,3,4-tetrol",
                "glycerol",
                "glycosylglycerol",
                "rubiarbonol A 3-O-beta-D-glucopyranosyl-(1->2)-beta-D-glucopyranoside"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "Glycerol (Gly)",
            "1,2,3-Propanetriol",
            "Trihydroxypropane",
            "1,2,3-Trihydroxypropane",
            "Propan-1,2,3-triol",
            "Glycerin",
            "Trihydric alcohol",
            "1,2,3-Trihydroxypropane",
            "Propanetriol",
            "Trihydroxyalkane",
            "Trihydroxypropyl alcohol",
            "1,2,3-Trihydroxypropyl alcohol",
            "Glyceritol",
            "Glycyl alcohol",
            "Glyceryl alcohol",
            "Glycerite",
            "Trihydroxypropanal",
            "Propanetriol-1,2,3",
            "Trihydroxypropyl group",
            "Trihydroxyalkyl group",
            "Trihydroxymethyl group",
            "Trihydroxymethanyl group",
            "Trihydroxymethyl moiety",
            "Trihydroxypropyl moiety"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2,3-Propanetriol",
                "Propan-1,2,3-triol",
                "Glycerin"
            ],
            "mismatches": [
                "Glycerol (Gly)",
                "Trihydroxypropane",
                "1,2,3-Trihydroxypropane",
                "Trihydric alcohol",
                "Trihydroxyalkane",
                "Trihydroxypropyl alcohol",
                "1,2,3-Trihydroxypropyl alcohol",
                "Glyceritol",
                "Glycyl alcohol",
                "Glyceryl alcohol",
                "Glycerite",
                "Trihydroxypropanal",
                "Propanetriol-1,2,3",
                "Trihydroxypropyl group",
                "Trihydroxyalkyl group",
                "Trihydroxymethyl group",
                "Trihydroxymethanyl group",
                "Trihydroxymethyl moiety",
                "Trihydroxypropyl moiety"
            ],
            "true_referents": [
                "(2R,3R)-heptane-1,2,3-triol",
                "1,2,3-butanetriol",
                "1,2,4-butanetriol",
                "2,2,4-trihydroxybutanoic acid",
                "2,3,4-trihydroxy-6-(hydroxymethyl)-5-methylbenzylacohol",
                "2,3,4-trihydroxypentanoic acid",
                "2,3-Dihydroxypropyl octadec-9-enoate",
                "2,3-dihydroxypropyl 12-methyltridecanoate",
                "2,3-dihydroxypropyl heptadecanoate",
                "2,4,5-Trihydroxytoluene",
                "3-Methoxy-1,2-propanediol",
                "9,10,18-trihydroxyoctadecanoic acid",
                "Glycerol 1-propanoate",
                "benzene-1,2,4-triol",
                "benzenetriol",
                "diglycerol",
                "glucosylglycerol",
                "glyceride",
                "glycerol",
                "glycerol mono(keto-meromycolate)",
                "glycerol phosphate",
                "heptane-1,2,3-triol",
                "methyl 3,4,5-trihydroxybenzoate"
            ],
            "TP": 3,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "triol",
        "domain": "chemistry",
        "response": "[\n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triolein (TO)\", \n  \"Triole",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            "1,3,5-Triol (1,3,5-trihydroxycyclohexane)",
            "2\u03b1,3\u03b2,16\u03b2-Triol (2\u03b1,3\u03b2,16\u03b2-trihydroxy-5\u03b2-androstan-17-one)",
            "2\u03b1,5\u03b1,10\u03b2-Triol (2\u03b1,5\u03b1,10\u03b2-trihydroxy-5\u03b1-androstan-17-one)",
            "3\u03b1,7\u03b1,12\u03b1-Triol (3\u03b1,7\u03b1,12\u03b1-trihydroxy-5\u03b2-cholan-24-oic acid)",
            "\u03b1-Eleostearic triol (9-hydroxy-10,13-dioxo-11-octadecaenoic acid)",
            "Betulinic triol (3\u03b2,28,29-trihydroxy-20(29)-lupen-30-oic acid)",
            "Castasterone triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
            "Cholecalciferol triol (1,3,25-trihydroxy-vitamin D3)",
            "Cholesterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-cholestan-7-one)",
            "Cycloartenol triol (4,4,14\u03b1-trimethyl-3\u03b2,9\u03b2,19-trihydroxy-24Z-\u039422-cholesten-7-one)",
            "Epibrassinolide triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
            "Ergosterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-ergostan-7-one)",
            "24-Epiheterochromin triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
            "28-Homobrassinolide triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
            "Typhasterol triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
            "Sitosterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-sitostan-7-one)",
            "Stigmasterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-stigmastan-7-one)",
            "Ursadiol triol (3\u03b2,20,22-trihydroxy-urs-12-en-28-oic acid)",
            "Vernolic triol (9-hydroxy-10,13-dioxo-11-octadecaenoic acid)",
            "Zymosterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-cholestan-7-one)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "1,3,5-Triol (1,3,5-trihydroxycyclohexane)",
                "2\u03b1,3\u03b2,16\u03b2-Triol (2\u03b1,3\u03b2,16\u03b2-trihydroxy-5\u03b2-androstan-17-one)",
                "2\u03b1,5\u03b1,10\u03b2-Triol (2\u03b1,5\u03b1,10\u03b2-trihydroxy-5\u03b1-androstan-17-one)",
                "3\u03b1,7\u03b1,12\u03b1-Triol (3\u03b1,7\u03b1,12\u03b1-trihydroxy-5\u03b2-cholan-24-oic acid)",
                "\u03b1-Eleostearic triol (9-hydroxy-10,13-dioxo-11-octadecaenoic acid)",
                "Betulinic triol (3\u03b2,28,29-trihydroxy-20(29)-lupen-30-oic acid)",
                "Castasterone triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
                "Cholecalciferol triol (1,3,25-trihydroxy-vitamin D3)",
                "Cholesterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-cholestan-7-one)",
                "Cycloartenol triol (4,4,14\u03b1-trimethyl-3\u03b2,9\u03b2,19-trihydroxy-24Z-\u039422-cholesten-7-one)",
                "Epibrassinolide triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
                "Ergosterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-ergostan-7-one)",
                "24-Epiheterochromin triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
                "28-Homobrassinolide triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
                "Typhasterol triol (2,3,22,23-tetrahydroxy-24-nor-5\u03b2-cholan-16,22-lactone)",
                "Sitosterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-sitostan-7-one)",
                "Stigmasterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-stigmastan-7-one)",
                "Ursadiol triol (3\u03b2,20,22-trihydroxy-urs-12-en-28-oic acid)",
                "Vernolic triol (9-hydroxy-10,13-dioxo-11-octadecaenoic acid)",
                "Zymosterol triol (3\u03b2,5\u03b1,6\u03b2-trihydroxy-cholestan-7-one)"
            ],
            "true_referents": [
                "(24R)-1alpha,24-dihydroxy-22-oxavitamin D3",
                "(25R)-7alpha,26-dihydroxycholesterol",
                "(3beta,16alpha)-13,28-epoxyoleanane-3,16,30-triol",
                "1,2-dicaproyl-3-oleoylglycerol",
                "1,2-dioleoyl-3-beta-D-galactosylglycerol",
                "1-arachidonoyl-3-oleoylglycerol",
                "1-decanoyl-3-oleoylglycerol",
                "1-linolenoyl-3-oleoylglycerol",
                "13,14,15,16-tetranorlabdane-8alpha,12,18-triol",
                "1alpha,25-dihydroxy-2beta-(1,3-dihydroxypropoxy)vitamin D3",
                "1alpha,25-dihydroxy-2beta-(3-hydroxypropoxy)vitamin D3",
                "1alpha,25-dihydroxy-2beta-(4-hydroxybutoxy)vitamin D3",
                "2,4,5-Trihydroxytoluene",
                "2,4,6-trihydroxyphenylhexan-1-one",
                "2alpha,3beta,23alpha-trihydroxyurs-12-en-28-oic acid 28-O-beta-D-glucopyranoside",
                "3-O-(alpha-L-oleandrosyl)oleandolide",
                "3beta,15alpha,22-trihydroxyhopane",
                "5alpha-androstane-3beta,6alpha,17beta-triol",
                "5alpha-androstane-3beta,7alpha,17beta-triol",
                "6-pentadecylbenzene-1,2,4-triol",
                "7alpha,26-dihydroxycholesterol",
                "androst-5-ene-3alpha,16beta,17beta-triol",
                "androst-5-ene-3beta,7alpha,17beta-triol",
                "benzene-1,2,4-triol",
                "heptane-1,2,3-triol",
                "rel-hopan-27-al-6beta,11alpha,22-triol",
                "stigmastane-3beta,5alpha,6beta-triol"
            ],
            "TP": 0,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "triol",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "triol",
                "Canonical name": "triol"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "triol"
            ],
            "true_referents": [
                "benzene-1,2,4-triol",
                "heptane-1,2,3-triol",
                "hopane-6beta,7beta,22-triol"
            ],
            "TP": 0,
            "FP": 1,
            "FN": 0
        }
    }
]