[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TG)",
            "Phospholipid",
            "Wax",
            "Sphingolipid",
            "Cholesterol ester",
            "Glycerol",
            "Lecithin",
            "Sphingomyelin",
            "Glycolipid",
            "Eicosanoid",
            "Diacylglycerol (DAG)",
            "Monoacylglycerol",
            "Plasmalogen",
            "Oleic acid",
            "Palmitic acid",
            "Linoleic acid",
            "Arachidonic acid",
            "Docosahexaenoic acid (DHA)",
            "Eicosapentaenoic acid (EPA)",
            "Stearic acid",
            "Lauric acid",
            "Myristic acid",
            "Capric acid",
            "Caprylic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triglyceride",
                "Phospholipid",
                "Wax",
                "Sphingolipid",
                "Sphingomyelin",
                "Glycolipid",
                "Monoacylglycerol",
                "Oleic acid",
                "Linoleic acid",
                "Arachidonic acid",
                "Docosahexaenoic acid"
            ],
            "mismatches": [
                "Triglyceride (TG)",
                "Cholesterol ester",
                "Glycerol",
                "Lecithin",
                "Eicosanoid",
                "Diacylglycerol (DAG)",
                "Plasmalogen",
                "Palmitic acid",
                "Eicosapentaenoic acid (EPA)",
                "Stearic acid",
                "Lauric acid",
                "Myristic acid",
                "Capric acid",
                "Caprylic acid"
            ],
            "true_referents": [
                "6-Methyl caprylic acid",
                "8-propionyl caprylic acid",
                "9-oxo capric acid",
                "Lauryl oleate",
                "Palmitic acid(d3)",
                "Physalien",
                "acacic acid",
                "aminophospholipid",
                "arachidonic acid",
                "cholesteryl ester",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "docosahexaenoic acid",
                "glyceric acid",
                "glyceride",
                "glycolipid",
                "glycosphingolipid",
                "linoleic acid",
                "monoacylglycerol",
                "monooleoylglycerol",
                "myristoleic acid",
                "octacosapentaenoic acid",
                "oleic acid",
                "phosphatidylcholine",
                "phospholipid",
                "prostaglandin",
                "sarmentologenin",
                "sphingolipid",
                "sphingomyelin",
                "sphingosine",
                "stearolic acid",
                "triglyceride",
                "trimethyl acrylic acid",
                "wax",
                "wax ester"
            ],
            "TP": 11,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Acetic acid ethyl ester (Ethyl acetate)",
            "Butyric acid methyl ester (Methyl butyrate)",
            "Caprylic acid ethyl ester (Ethyl caprylate)",
            "Decanoic acid methyl ester (Methyl caprate)",
            "Dodecanoic acid ethyl ester (Ethyl laurate)",
            "Eicosanoic acid methyl ester (Methyl arachidate)",
            "Hexanoic acid ethyl ester (Ethyl caproate)",
            "Lauric acid methyl ester (Methyl dodecylate)",
            "Linoleic acid ethyl ester (Ethyl linoleate)",
            "Myristic acid ethyl ester (Ethyl myristate)",
            "Oleic acid methyl ester (Methyl oleate)",
            "Palmitic acid ethyl ester (Ethyl palmitate)",
            "Palmitoleic acid ethyl ester (Ethyl palmitoleate)",
            "Pentanoic acid ethyl ester (Ethyl valerate)",
            "Phenyl acetate",
            "Propionic acid ethyl ester (Ethyl propionate)",
            "Stearic acid ethyl ester (Ethyl stearate)",
            "Tetradecanoic acid methyl ester (Methyl myristate)",
            "Triglyceride (Triacylglycerol)",
            "Valeric acid ethyl ester (Ethyl pentanoate)",
            "Zeaxanthin dipalmitate",
            "Zinc stearate",
            "Glyceryl trioleate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl butyrate",
                "Methyl arachidate",
                "Ethyl laurate",
                "Ethyl linoleate",
                "Ethyl myristate",
                "Ethyl palmitoleate",
                "Ethyl propionate",
                "Triglyceride",
                "Ethyl pentanoate"
            ],
            "mismatches": [
                "Acetic acid ethyl ester (Ethyl acetate)",
                "Caprylic acid ethyl ester (Ethyl caprylate)",
                "Decanoic acid methyl ester (Methyl caprate)",
                "Hexanoic acid ethyl ester (Ethyl caproate)",
                "Lauric acid methyl ester (Methyl dodecylate)",
                "Oleic acid methyl ester (Methyl oleate)",
                "Palmitic acid ethyl ester (Ethyl palmitate)",
                "Pentanoic acid ethyl ester (Ethyl valerate)",
                "Phenyl acetate",
                "Stearic acid ethyl ester (Ethyl stearate)",
                "Tetradecanoic acid methyl ester (Methyl myristate)",
                "Zeaxanthin dipalmitate",
                "Zinc stearate",
                "Glyceryl trioleate"
            ],
            "true_referents": [
                "1-O-(phenylacetyl)glycerol",
                "3-methyl-tetradecanoic acid",
                "Ethyl pentanoate",
                "Glyceryl lactooleate",
                "Lauryl myristoleate",
                "Methyl butyrate",
                "Methyl stearate",
                "Oleyl palmitate",
                "Stearidonic Acid ethyl ester",
                "alpha-ethyl valeric acid",
                "ethyl hexanoate",
                "ethyl laurate",
                "ethyl linoleate",
                "ethyl myristate",
                "ethyl palmitoleate",
                "ethyl propionate",
                "fatty acid ethyl ester",
                "glyceride",
                "meso-zeaxanthin",
                "methyl arachidate",
                "methyl decanoate",
                "methyl myristoleate",
                "methyl oleate",
                "propionic acid",
                "propyl acetate",
                "triglyceride",
                "zeaxanthin",
                "zeaxanthin bis(beta-D-glucoside)"
            ],
            "TP": 9,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triacylglycerol (TAG)",
            "Diacylglycerol (DAG)",
            "Monoacylglycerol (MAG)",
            "Wax ester",
            "Phosphatidylcholine",
            "Phosphatidylethanolamine",
            "Phosphatidylserine",
            "Phosphatidylinositol",
            "Phosphatidic acid",
            "Sphingomyelin",
            "Cerebroside",
            "Ganglioside",
            "Cholesteryl ester",
            "Acylcarnitine",
            "Acetyl-CoA",
            "Propionyl-CoA",
            "Butyryl-CoA",
            "Palmitoyl-CoA",
            "Stearoyl-CoA",
            "Oleoyl-CoA",
            "Linoleoyl-CoA",
            "Arachidonoyl-CoA",
            "Eicosapentaenoyl-CoA",
            "Docosahexaenoyl-CoA"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Monoacylglycerol (MAG)",
                "Wax ester",
                "Phosphatidylcholine",
                "Phosphatidylethanolamine",
                "Phosphatidic acid",
                "Sphingomyelin",
                "Cerebroside",
                "Ganglioside",
                "Cholesteryl ester",
                "Propionyl-CoA",
                "Butyryl-CoA",
                "Palmitoyl-CoA",
                "Stearoyl-CoA",
                "Oleoyl-CoA",
                "Linoleoyl-CoA",
                "Arachidonoyl-CoA"
            ],
            "mismatches": [
                "Triacylglycerol (TAG)",
                "Diacylglycerol (DAG)",
                "Phosphatidylserine",
                "Phosphatidylinositol",
                "Acylcarnitine",
                "Acetyl-CoA",
                "Eicosapentaenoyl-CoA",
                "Docosahexaenoyl-CoA"
            ],
            "true_referents": [
                "3-substituted propionyl-CoA",
                "L-alpha-Phosphatidylcholine",
                "acetoacetyl-CoA",
                "arachidonoyl-CoA",
                "butyryl-CoA",
                "cerebroside",
                "cholesteryl ester",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "dioleoyl phosphatidylethanolamine",
                "docosahexaenoic acid",
                "fatty acylcarnitine",
                "ganglioside",
                "linoleoyl-CoA",
                "lysophosphatidylserine",
                "monoacylglycerol",
                "monooleoylglycerol",
                "oleoyl-CoA",
                "palmitoyl-CoA",
                "phosphatidic acid",
                "phosphatidic acid (16:0/18:1)",
                "phosphatidylcholine",
                "phosphatidylethanolamine",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "propionyl-CoA",
                "sphingolipid",
                "sphingomyelin",
                "stearoyl-CoA",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax ester"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triacylglycerol (TAG)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin",
            "Ceramide",
            "Cholesteryl ester",
            "Glyceryl monooleate",
            "Glyceryl dilaurate",
            "Methyl palmitate",
            "Ethyl oleate",
            "Butyl stearate",
            "Cetyl palmitate",
            "Isopropyl myristate",
            "Retinyl palmitate",
            "Tocopheryl acetate",
            "Linoleyl acetate",
            "Oleyl alcohol",
            "Waxes (e.g., beeswax)",
            "Cutin",
            "Suberin",
            "Sucrose polyester",
            "Prostaglandin ester"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl palmitate",
                "Ethyl oleate",
                "Ceramide",
                "Cholesteryl ester",
                "Retinyl palmitate",
                "Sphingomyelin"
            ],
            "mismatches": [
                "Triacylglycerol (TAG)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Glyceryl monooleate",
                "Glyceryl dilaurate",
                "Butyl stearate",
                "Cetyl palmitate",
                "Isopropyl myristate",
                "Tocopheryl acetate",
                "Linoleyl acetate",
                "Oleyl alcohol",
                "Waxes (e.g., beeswax)",
                "Cutin",
                "Suberin",
                "Sucrose polyester",
                "Prostaglandin ester"
            ],
            "true_referents": [
                "Linoleyl oleate",
                "Methyl palmitate",
                "Oleyl palmitate",
                "Prostaglandin a1 ethyl ester",
                "Sucrose monopalmitate",
                "Sucrose monostearate",
                "Tocopheronic acid",
                "abacopterin A",
                "alpha-tocopheronolactone",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1)-ceramide",
                "blazein",
                "butyl octadecanoate",
                "ceramide",
                "cholesteryl ester",
                "dilauroyl phosphatidylglycerol",
                "disuccinimidyl suberate",
                "ethyl oleate",
                "isopropyl palmitate",
                "monoacylglycerol",
                "monooleoylglycerol",
                "oleyl acetate",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "polyoxyl 40 stearate",
                "prostaglandin E2 1-glyceryl ester",
                "protectin",
                "retinyl palmitate",
                "sphingolipid",
                "sphingomyelin",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax",
                "wax ester"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Ethyl oleate (EO)",
            "Methyl linoleate (ML)",
            "Glyceryl tristearate (Tristearin)",
            "Glyceryl trioleate (Triolein)",
            "Methyl palmitate (MP)",
            "Ethyl stearate (ES)",
            "Butyl stearate (BS)",
            "Isopropyl myristate (IPM)",
            "Propylene glycol monostearate (PGMS)",
            "Cetyl palmitate (CP)",
            "Glyceryl monostearate (GMS)",
            "Glyceryl monolaurate (GML)",
            "Methyl laurate (MLA)",
            "Ethyl palmitate (EP)",
            "Octyl palmitate (OP)",
            "Glyceryl monopalmitate (GMP)",
            "Glyceryl trilaurate (Trilaurin)",
            "Isopropyl palmitate (IPP)",
            "Butyl laurate (BL)",
            "Ethyl laurate (EL)",
            "Methyl stearate (MS)",
            "Glyceryl tripalmitate (Tripalmitin)",
            "Ethyl caprylate (EC)",
            "Butyl oleate (BO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl oleate (EO)",
                "Methyl linoleate (ML)",
                "Methyl palmitate (MP)",
                "Methyl laurate (MLA)",
                "Octyl palmitate (OP)",
                "Isopropyl palmitate (IPP)",
                "Ethyl laurate (EL)",
                "Methyl stearate (MS)",
                "Butyl oleate (BO)"
            ],
            "mismatches": [
                "Glyceryl tristearate (Tristearin)",
                "Glyceryl trioleate (Triolein)",
                "Ethyl stearate (ES)",
                "Butyl stearate (BS)",
                "Isopropyl myristate (IPM)",
                "Propylene glycol monostearate (PGMS)",
                "Cetyl palmitate (CP)",
                "Glyceryl monostearate (GMS)",
                "Glyceryl monolaurate (GML)",
                "Ethyl palmitate (EP)",
                "Glyceryl monopalmitate (GMP)",
                "Glyceryl trilaurate (Trilaurin)",
                "Butyl laurate (BL)",
                "Glyceryl tripalmitate (Tripalmitin)",
                "Ethyl caprylate (EC)"
            ],
            "true_referents": [
                "1,2,3-tripalmitoleoylglycerol",
                "1-monopalmitoylglycerol",
                "1-monostearoylglycerol",
                "3-hydroxylaurate",
                "Elaidyl palmitate",
                "Ethylene glycol distearate",
                "Methyl palmitate",
                "Methyl stearate",
                "Myristoleyl laurate",
                "Oleyl laurate",
                "Propylene glycol stearate",
                "butyrate ester",
                "decyl palmitate",
                "ethyl decanoate",
                "ethyl laurate",
                "ethyl oleate",
                "isomyristate",
                "isopropyl palmitate",
                "methyl laurate",
                "methyl linoleate",
                "n-butyl oleate",
                "octyl palmitate",
                "triolein",
                "tristearoylglycerol"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TG)",
            "Phospholipid (PL)",
            "Sphingolipid (SL)",
            "Glycerolipid (GL)",
            "Fatty Acid Methyl Ester (FAME)",
            "Butyl Stearate (BS)",
            "Ethyl Laurate (EL)",
            "Methyl Palmitate (MP)",
            "Isopropyl Myristate (IPM)",
            "Octyl Palmitate (OP)",
            "Benzyl Oleate (BO)",
            "Decyl Oleate (DO)",
            "Propyl Linoleate (PLi)",
            "Hexyl Stearate (HS)",
            "Coco-Caprylate (CC)",
            "Cetyl Palmitate (CP)",
            "Lauryl Acetate (LA)",
            "Ethyl Myristate (EM)",
            "Methyl Stearate (MS)",
            "Glyceryl Monostearate (GMS)",
            "Glyceryl Trioleate (GTO)",
            "Caprylic Acid Triglyceride (CAT)",
            "Palmitic Acid Ethyl Ester (PAEE)",
            "Methyl Ricinoleate (MR)",
            "Capric Acid Triglyceride (CATG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triglyceride (TG)",
                "Phospholipid (PL)",
                "Sphingolipid (SL)",
                "Glycerolipid (GL)",
                "Fatty Acid Methyl Ester (FAME)",
                "Ethyl Laurate (EL)",
                "Methyl Palmitate (MP)",
                "Octyl Palmitate (OP)",
                "Decyl Oleate (DO)",
                "Propyl Linoleate (PLi)",
                "Ethyl Myristate (EM)",
                "Methyl Stearate (MS)"
            ],
            "mismatches": [
                "Butyl Stearate (BS)",
                "Isopropyl Myristate (IPM)",
                "Benzyl Oleate (BO)",
                "Hexyl Stearate (HS)",
                "Coco-Caprylate (CC)",
                "Cetyl Palmitate (CP)",
                "Lauryl Acetate (LA)",
                "Glyceryl Monostearate (GMS)",
                "Glyceryl Trioleate (GTO)",
                "Caprylic Acid Triglyceride (CAT)",
                "Palmitic Acid Ethyl Ester (PAEE)",
                "Methyl Ricinoleate (MR)",
                "Capric Acid Triglyceride (CATG)"
            ],
            "true_referents": [
                "1,2,3-tripalmitoleoylglycerol",
                "1-capryloyl-3-oleoylglycerol",
                "1-monostearoylglycerol",
                "2-Hydroxypropyl stearate",
                "6-Methyl caprylic acid",
                "8-propionyl caprylic acid",
                "Lauryl oleate",
                "Methyl palmitate",
                "Methyl stearate",
                "acryloyl-CoA",
                "butyrate ester",
                "decyl oleate",
                "decyl palmitate",
                "ethyl laurate",
                "ethyl myristate",
                "fatty acid ethyl ester",
                "fatty acid methyl ester",
                "glyceride",
                "glycerolipid",
                "glycerophospholipid",
                "isomyristate",
                "n-butyl oleate",
                "octyl palmitate",
                "phosphatidylcholine",
                "phospholipid",
                "propyl linoleate",
                "ricinoleate",
                "sphingolipid",
                "sphingosine",
                "tetratriacontanoic acid",
                "triglyceride"
            ],
            "TP": 12,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triacylglycerol (TAG)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Phosphatidic acid (PA)",
            "Phosphatidylglycerol (PG)",
            "Cardiolipin (CL)",
            "Sphingomyelin (SM)",
            "Ceramide (Cer)",
            "Glycosphingolipid (GSL)",
            "Cerebroside (Cer)",
            "Ganglioside (Gang)",
            "Monoacylglycerol (MAG)",
            "Diacylglycerol (DAG)",
            "Polyunsaturated fatty acid esters of hydroxy fatty acids (PUFA-HFAs)",
            "Ethyl oleate (EO)",
            "Methyl linoleate (ML)",
            "Methyl palmitate (MP)",
            "Ethyl stearate (ES)",
            "Ethyl palmitate (EP)",
            "Methyl myristate (MM)",
            "Methyl stearate (MS)",
            "Ethyl myristate (EM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Phosphatidylcholine",
                "Phosphatidylethanolamine",
                "Phosphatidylinositol",
                "Phosphatidic acid",
                "Phosphatidylglycerol",
                "Cardiolipin",
                "Sphingomyelin",
                "Ceramide",
                "Glycosphingolipid",
                "Cerebroside",
                "Ganglioside",
                "Monoacylglycerol",
                "Diacylglycerol",
                "Ethyl oleate",
                "Methyl linoleate",
                "Methyl palmitate",
                "Methyl stearate",
                "Ethyl myristate"
            ],
            "mismatches": [
                "Triacylglycerol (TAG)",
                "Phosphatidylserine (PS)",
                "Polyunsaturated fatty acid esters of hydroxy fatty acids (PUFA-HFAs)",
                "Ethyl stearate (ES)",
                "Ethyl palmitate (EP)",
                "Methyl myristate (MM)"
            ],
            "true_referents": [
                "C20 ceramide",
                "Elaidyl palmitate",
                "Methyl palmitate",
                "Methyl stearate",
                "Myristoleyl myristate",
                "cardiolipin",
                "ceramide",
                "cerebroside",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "ethyl myristate",
                "ethyl oleate",
                "ganglioside",
                "glycosphingolipid",
                "hydroxy polyunsaturated fatty acid",
                "methyl linoleate",
                "monoacylglycerol",
                "monooleoylglycerol",
                "omega-hydroxy fatty ester",
                "phosphatidic acid",
                "phosphatidic acid (16:0/18:1)",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phosphoglycosphingolipid",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Methyl oleate",
            "Ethyl stearate",
            "Butyl palmitate",
            "Isopropyl linoleate",
            "Glyceryl trilinoleate",
            "Methyl linolenate",
            "Ethyl arachidate",
            "Butyl behenate",
            "Isopropyl myristate",
            "Glyceryl tripalmitate",
            "Methyl ricinoleate",
            "Ethyl laurate",
            "Butyl oleate",
            "Isopropyl linolenate",
            "Glyceryl tristearate",
            "Methyl arachidate",
            "Ethyl behenate",
            "Butyl myristate",
            "Isopropyl palmitate",
            "Glyceryl trioleate",
            "Methyl myristate",
            "Ethyl linoleate",
            "Butyl stearate",
            "Isopropyl oleate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl oleate",
                "Methyl linolenate",
                "Ethyl arachidate",
                "Ethyl laurate",
                "Isopropyl palmitate",
                "Methyl arachidate",
                "Ethyl linoleate"
            ],
            "mismatches": [
                "Ethyl stearate",
                "Butyl palmitate",
                "Isopropyl linoleate",
                "Glyceryl trilinoleate",
                "Butyl behenate",
                "Isopropyl myristate",
                "Glyceryl tripalmitate",
                "Methyl ricinoleate",
                "Butyl oleate",
                "Isopropyl linolenate",
                "Glyceryl tristearate",
                "Ethyl behenate",
                "Butyl myristate",
                "Glyceryl trioleate",
                "Methyl myristate",
                "Butyl stearate",
                "Isopropyl oleate"
            ],
            "true_referents": [
                "1,2,3-trilinoleoylglycerol",
                "1,2,3-tripalmitoleoylglycerol",
                "Glyceryl lactooleate",
                "Isopropyl octanoate",
                "Myristoleyl myristate",
                "Oleyl behenate",
                "Oleyl palmitate",
                "Oleyl stearate",
                "butyl octadecanoate",
                "butyl octanoate",
                "ethyl arachidate",
                "ethyl laurate",
                "ethyl linoleate",
                "isooctyl laurate",
                "isopropyl ester",
                "isopropyl palmitate",
                "methyl arachidate",
                "methyl behenate",
                "methyl linolenate",
                "methyl myristoleate",
                "methyl oleate",
                "propyl linoleate",
                "ricinoleate",
                "tristearoylglycerol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride",
            "Methyl stearate (MS)",
            "Ethyl palmitate (EP)",
            "Propyl oleate",
            "Butyl linoleate",
            "Glyceryl trioleate",
            "Glyceryl tristearate",
            "Dimethyl adipate",
            "Diethyl sebacate",
            "Dipropyl laurate",
            "Dibutyl phthalate (DBP)",
            "Isopropyl myristate",
            "Lauryl acetate",
            "Myristyl propionate",
            "Palmitoyl chloride",
            "Stearoyl-CoA",
            "Oleyl alcohol",
            "Linoleic acid ethyl ester",
            "Arachidyl benzoate",
            "Caprylic acid methyl ester",
            "Cetearyl alcohol",
            "Squalene acetate",
            "Phytanic acid ester",
            "Lauric acid ethyl ester"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triglyceride",
                "Methyl stearate",
                "Dimethyl adipate",
                "Dibutyl phthalate",
                "Stearoyl-CoA"
            ],
            "mismatches": [
                "Ethyl palmitate (EP)",
                "Propyl oleate",
                "Butyl linoleate",
                "Glyceryl trioleate",
                "Glyceryl tristearate",
                "Diethyl sebacate",
                "Dipropyl laurate",
                "Isopropyl myristate",
                "Lauryl acetate",
                "Myristyl propionate",
                "Palmitoyl chloride",
                "Oleyl alcohol",
                "Linoleic acid ethyl ester",
                "Arachidyl benzoate",
                "Caprylic acid methyl ester",
                "Cetearyl alcohol",
                "Squalene acetate",
                "Phytanic acid ester",
                "Lauric acid ethyl ester"
            ],
            "true_referents": [
                "6-Methyl caprylic acid",
                "Diisopropyl phthalate",
                "Dimethyl adipate",
                "Elaidyl palmitate",
                "Glyceryl lactooleate",
                "Lauryl oleate",
                "Linoleyl oleate",
                "Methyl stearate",
                "Myristoleyl myristate",
                "Oleyl laurate",
                "Palmitoleyl stearate",
                "arachidyl oleate",
                "cholesteryl acetate",
                "dibutyl phthalate",
                "dimethyl sebacate",
                "ethyl linoleate",
                "fatty acid methyl ester",
                "fatty acid phytyl ester",
                "glyceride",
                "isopropyl palmitate",
                "oleyl acetate",
                "propyl octanoate",
                "squalene",
                "stearoyl-CoA",
                "triglyceride",
                "tristearoylglycerol"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TG)",
            "Phospholipid",
            "Cholesteryl ester",
            "Wax ester",
            "Glycerophospholipid",
            "Sphingolipid",
            "Ceramide",
            "Diglyceride (DG)",
            "Monoglyceride (MG)",
            "Lecithin",
            "Plasmalogen",
            "Cardiolipin",
            "Sphingomyelin",
            "Glycosphingolipid",
            "Sterol ester",
            "Acylglycerol",
            "Lysophospholipid",
            "Platelet-activating factor (PAF)",
            "Cerebroside",
            "Ganglioside",
            "Prostaglandin",
            "Leukotriene",
            "Thromboxane",
            "Isoprostane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triglyceride",
                "Phospholipid",
                "Cholesteryl ester",
                "Wax ester",
                "Glycerophospholipid",
                "Sphingolipid",
                "Ceramide",
                "Diglyceride",
                "Cardiolipin",
                "Sphingomyelin",
                "Glycosphingolipid",
                "Sterol ester",
                "Cerebroside",
                "Ganglioside",
                "Prostaglandin",
                "Leukotriene",
                "Thromboxane",
                "Isoprostane"
            ],
            "mismatches": [
                "Triglyceride (TG)",
                "Diglyceride (DG)",
                "Monoglyceride (MG)",
                "Lecithin",
                "Plasmalogen",
                "Acylglycerol",
                "Lysophospholipid",
                "Platelet-activating factor (PAF)"
            ],
            "true_referents": [
                "1,3-diglyceride",
                "1-monoglyceride",
                "F2-isoprostane",
                "PA(PGF1alpha/a-25:0)",
                "Physalien",
                "aminophospholipid",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1)-ceramide",
                "cardiolipin",
                "ceramide",
                "cerebroside",
                "cholesteryl ester",
                "diglyceride",
                "dihexadecanoylglycerol",
                "ganglioside",
                "glyceride",
                "glycerophosphoglycerol",
                "glycerophospholipid",
                "glycosphingolipid",
                "isoprostane",
                "leukotriene",
                "leukotriene E4",
                "lysophosphatidylcholine",
                "lysophosphatidylglycerol",
                "monoacylglycerol",
                "phosphatidylcholine",
                "phosphoglycosphingolipid",
                "phospholipid",
                "prostaglandin",
                "sarmentologenin",
                "sphingolipid",
                "sphingomyelin",
                "sphingosine",
                "steroid ester",
                "sterol ester",
                "thromboxane",
                "thromboxanes A",
                "triglyceride",
                "wax ester"
            ],
            "TP": 18,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride",
            "Phospholipid",
            "Wax ester",
            "Cholesteryl ester",
            "Vitamin A ester (Retinyl ester)",
            "Vitamin D ester",
            "Vitamin E ester (Tocopheryl ester)",
            "Vitamin K ester",
            "Monoacylglycerol (MAG)",
            "Diacylglycerol (DAG)",
            "Triacylglycerol (TAG)",
            "Sphingolipid",
            "Glycosphingolipid",
            "Ganglioside",
            "Cerebroside",
            "Sterol ester",
            "Fatty acid methyl ester (FAME)",
            "Fatty acid ethyl ester (FAEE)",
            "Polyunsaturated fatty acid ester (PUFA ester)",
            "Omega-3 fatty acid ester",
            "Omega-6 fatty acid ester",
            "Prostaglandin ester",
            "Leukotriene ester",
            "Thromboxane ester"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triglyceride",
                "Phospholipid",
                "Wax ester",
                "Cholesteryl ester",
                "Retinyl ester",
                "Monoacylglycerol",
                "Diacylglycerol",
                "Triacylglycerol",
                "Sphingolipid",
                "Glycosphingolipid",
                "Ganglioside",
                "Cerebroside",
                "Sterol ester",
                "Fatty acid methyl ester",
                "Fatty acid ethyl ester"
            ],
            "mismatches": [
                "Vitamin D ester",
                "Vitamin E ester (Tocopheryl ester)",
                "Vitamin K ester",
                "Polyunsaturated fatty acid ester (PUFA ester)",
                "Omega-3 fatty acid ester",
                "Omega-6 fatty acid ester",
                "Prostaglandin ester",
                "Leukotriene ester",
                "Thromboxane ester"
            ],
            "true_referents": [
                "Prostaglandin a1 ethyl ester",
                "Tocopheronic acid",
                "all-trans-retinyl ester",
                "cerebroside",
                "cholesteryl ester",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "fatty acid ester",
                "fatty acid ethyl ester",
                "fatty acid methyl ester",
                "ganglioside",
                "glyceride",
                "glycosphingolipid",
                "leukotriene E4 methyl ester",
                "monoacylglycerol",
                "monooleoylglycerol",
                "phosphatidylcholine",
                "phosphoglycosphingolipid",
                "phospholipid",
                "polyunsaturated fatty ester",
                "prostaglandin E2 1-glyceryl ester",
                "retinyl ester",
                "sphingolipid",
                "sphingosine",
                "steroid ester",
                "sterol ester",
                "thromboxanes A",
                "thromboxanes B",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax ester"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Ethyl butyrate (C6H12O2)",
            "Methyl salicylate (C8H8O3)",
            "Isoamyl acetate (C7H14O2)",
            "Ethyl acetate (C4H8O2)",
            "Benzyl acetate (C9H10O2)",
            "Geranyl acetate (C12H20O2)",
            "Linalyl acetate (C12H20O2)",
            "Citronellyl acetate (C12H22O2)",
            "Isobutyl acetate (C6H12O2)",
            "Ethyl propionate (C5H10O2)",
            "Ethyl caproate (C8H16O2)",
            "Ethyl caprylate (C10H20O2)",
            "Ethyl laurate (C14H28O2)",
            "Ethyl palmitate (C18H36O2)",
            "Ethyl stearate (C20H40O2)",
            "Isopropyl myristate (C17H34O2)",
            "Glyceryl tristearate (C57H110O6)",
            "Glyceryl tripalmitate (C51H98O6)",
            "Triacetin (C9H14O6)",
            "Polyvinyl acetate (C4H6O2)n",
            "Cellulose acetate (C6H7O5)n",
            "Diethyl phthalate (C12H14O4)",
            "Dimethyl phthalate (C10H10O4)",
            "Dibutyl phthalate (C16H22O4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl butyrate",
                "Geranyl acetate",
                "Ethyl propionate",
                "Ethyl laurate",
                "Triacetin",
                "Dibutyl phthalate"
            ],
            "mismatches": [
                "Methyl salicylate",
                "Isoamyl acetate",
                "Ethyl acetate",
                "Benzyl acetate",
                "Linalyl acetate",
                "Citronellyl acetate",
                "Isobutyl acetate",
                "Ethyl caproate",
                "Ethyl caprylate",
                "Ethyl palmitate",
                "Ethyl stearate",
                "Isopropyl myristate",
                "Glyceryl tristearate",
                "Glyceryl tripalmitate",
                "Polyvinyl acetate",
                "Cellulose acetate",
                "Diethyl phthalate",
                "Dimethyl phthalate"
            ],
            "true_referents": [
                "(15Z,18Z,21Z,24Z,27Z)-triacontapentaenoate",
                "(E)-16-octadecenoic acid methyl ester",
                "(R)-linalyl acetate",
                "(S)-linalyl acetate",
                "1,2,3-tripalmitoleoylglycerol",
                "1-(alpha-Methyl-4-(2-methylpropyl)benzeneacetate)-beta-D-Glucopyranuronic acid",
                "2-ethylhexyl acetate",
                "4,4'-diapolycopen-4-al",
                "6-((Z)-14-hydroxypentadec-8-en-1-yl)salicylic acid",
                "Diisopropyl phthalate",
                "Ethyl (E)-2-dodecenoate",
                "Ethylene glycol distearate",
                "Fauronyl acetate",
                "benzylideneacetone",
                "citronellol",
                "citronellol acetate",
                "decyl palmitate",
                "dibutyl phthalate",
                "ethyl acetoacetate",
                "ethyl butyrate",
                "ethyl laurate",
                "ethyl propionate",
                "geranyl acetate",
                "hexyl acetate",
                "isoamyl isobutyrate",
                "isoamyl propanoate",
                "isobutyric acid",
                "isomyristate",
                "isopropyl salicylate",
                "monohexyl phthalate",
                "octyl acetate",
                "propionate",
                "saturated fatty ester C40H80O2",
                "triacetin"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Ethyl acetate (EtOAc)",
            "Methyl oleate",
            "Glyceryl trioleate (Triolein)",
            "Glyceryl tripalmitate (Tripalmitin)",
            "Glyceryl tristearate (Tristearin)",
            "Methyl stearate",
            "Ethyl linoleate",
            "Isopropyl myristate (IPM)",
            "Butyl stearate",
            "Cetyl palmitate",
            "Myristyl myristate",
            "Propyl laurate",
            "Hexyl laurate",
            "Octyl palmitate",
            "Decyl oleate",
            "Dodecyl stearate",
            "Tetradecyl myristate",
            "Hexadecyl palmitate",
            "Octadecyl oleate",
            "Eicosyl stearate",
            "Docosyl palmitate",
            "Tetracosyl myristate",
            "Hexacosyl stearate",
            "Octacosyl oleate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl oleate",
                "Triolein",
                "Methyl stearate",
                "Ethyl linoleate",
                "Octyl palmitate",
                "Decyl oleate"
            ],
            "mismatches": [
                "Ethyl acetate (EtOAc)",
                "Glyceryl tripalmitate (Tripalmitin)",
                "Glyceryl tristearate (Tristearin)",
                "Isopropyl myristate (IPM)",
                "Butyl stearate",
                "Cetyl palmitate",
                "Myristyl myristate",
                "Propyl laurate",
                "Hexyl laurate",
                "Dodecyl stearate",
                "Tetradecyl myristate",
                "Hexadecyl palmitate",
                "Octadecyl oleate",
                "Eicosyl stearate",
                "Docosyl palmitate",
                "Tetracosyl myristate",
                "Hexacosyl stearate",
                "Octacosyl oleate"
            ],
            "true_referents": [
                "1,2,3-tripalmitoleoylglycerol",
                "1-O-hexacosyl oleate",
                "Methyl stearate",
                "Myristoleyl myristate",
                "Oleyl laurate",
                "Oleyl palmitate",
                "butyl octadecanoate",
                "decyl oleate",
                "decyl palmitate",
                "dodecyl palmitate",
                "ethyl acetoacetate",
                "ethyl laurate",
                "ethyl linoleate",
                "hexacosanol",
                "isomyristate",
                "methyl oleate",
                "octacosanoate",
                "octadecanoic acid",
                "octyl palmitate",
                "stearyl palmitate",
                "triolein",
                "tristearoylglycerol"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": "[\n  \"Glycerol triacetate (Triacetin)\", \n  \"Glycerol monopalmitate\", \n  \"Glycerol monostearate\", \n  \"Glycerol monoleate\", \n  \"Glycerol dioleate\", \n  \"Glycerol distearate\", \n  \"Glycerol trioleate\", \n  \"Glycerol trilinoleate\", \n  \"Glycerol trilinolenate\", \n  \"Triolein\", \n  \"Trioleyl phosphate\", \n  \"Trioleyl citrate\", \n  \"Trioleyl tartrate\", \n  \"Trioleyl succinate\", \n  \"Trioleyl lactate\", \n  \"Trioleyl adipate\", \n  \"Trioleyl phosphate\", \n  \"Trioleyl citrate\", \n  \"Trioleyl tartrate\", \n  \"Trioleyl succinate\", \n  \"Trioleyl lactate\", \n  \"Trioleyl adipate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\", \n  \"Glyceryl trioleate\",",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Glycerol trioleate (GTO)",
            "Glycerol tristearate",
            "Triacetin (Glycerol triacetate)",
            "Glycerol trilaurate",
            "Glycerol triarachidate",
            "Glycerol tripalmitate",
            "Glycerol tricaprylate",
            "Glycerol tricaprate",
            "Glycerol triundecylenate",
            "Glycerol triheneicosate",
            "Isopropyl myristate",
            "Isopropyl palmitate",
            "Isopropyl stearate",
            "Diisopropyl adipate",
            "Dioctyl adipate",
            "Dioctyl succinate",
            "Dibutyl phthalate",
            "Dioctyl phthalate",
            "Diethyl phthalate",
            "Dibutyl sebacate",
            "Dioctyl sebacate",
            "Dioctyl maleate",
            "Dioctyl fumarate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triacetin (Glycerol triacetate)",
                "Isopropyl palmitate",
                "Diisopropyl adipate",
                "Dibutyl phthalate"
            ],
            "mismatches": [
                "Glycerol trioleate (GTO)",
                "Glycerol tristearate",
                "Glycerol trilaurate",
                "Glycerol triarachidate",
                "Glycerol tripalmitate",
                "Glycerol tricaprylate",
                "Glycerol tricaprate",
                "Glycerol triundecylenate",
                "Glycerol triheneicosate",
                "Isopropyl myristate",
                "Isopropyl stearate",
                "Dioctyl adipate",
                "Dioctyl succinate",
                "Diethyl phthalate",
                "Dibutyl sebacate",
                "Dioctyl sebacate",
                "Dioctyl maleate",
                "Dioctyl fumarate"
            ],
            "true_referents": [
                "1,2,3-tripalmitoleoylglycerol",
                "1,2-dicaproyl-3-palmitoylglycerol",
                "1-capryloyl-3-oleoylglycerol",
                "3-hydroxylaurate",
                "Dibutyl adipate",
                "Dibutyl decanedioate",
                "Diethyl succinate",
                "Diisopropyl adipate",
                "Diisopropyl phthalate",
                "Glycerol 1-propanoate diacetate",
                "Glycerol triundecanoate",
                "Octadecyl fumarate",
                "Triethylene glycol bis(2-ethylhexanoate)",
                "dibutyl phthalate",
                "dimethyl sebacate",
                "dipentyl phthalate",
                "ethyl arachidate",
                "isopropyl palmitate",
                "triacetin",
                "triradylglycerol",
                "tristearoylglycerol"
            ],
            "TP": 4,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "lipid",
        "domain": "chemistry",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]