[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TG)",
            "Phosphatidylcholine (PC)",
            "Cholesterol",
            "Sphingomyelin (SM)",
            "Glycolipid",
            "Plasmalogen (PL)",
            "Lipid A",
            "Eicosanoid",
            "Cardiolipin (CL)",
            "Lecithin",
            "Bile acid",
            "Steroid hormone",
            "Ceramide (Cer)",
            "Ganglioside",
            "Wax",
            "Lipopolysaccharide (LPS)",
            "Triacylglycerol (TAG)",
            "Phosphatidylinositol (PI)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Diacylglycerol (DAG)",
            "Monoglyceride (MG)",
            "Oleic acid",
            "Lanosterol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Glycolipid",
                "Lipid A",
                "Bile acid",
                "Steroid hormone",
                "Ganglioside",
                "Wax",
                "Oleic acid",
                "Lanosterol"
            ],
            "mismatches": [
                "Triglyceride (TG)",
                "Phosphatidylcholine (PC)",
                "Sphingomyelin (SM)",
                "Plasmalogen (PL)",
                "Eicosanoid",
                "Cardiolipin (CL)",
                "Lecithin",
                "Ceramide (Cer)",
                "Lipopolysaccharide (LPS)",
                "Triacylglycerol (TAG)",
                "Phosphatidylinositol (PI)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Diacylglycerol (DAG)",
                "Monoglyceride (MG)"
            ],
            "true_referents": [
                "(+)-copalol",
                "(+)-pulegone",
                "(+)-trans-Pulegol",
                "1-monoglyceride",
                "23-hydroxy steroid",
                "C20 ceramide",
                "alpha-D-galactosyl-(1->3)-lipopolysaccharide",
                "bile acid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "ganglioside",
                "glucosyllipopolysaccharide",
                "glyceride",
                "glycolipid",
                "glycosphingolipid",
                "lanosterol",
                "lipid A",
                "lipopolysaccharide",
                "monoacylglycerol",
                "oleic acid",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phospholipid",
                "prostaglandin",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "steroid",
                "steroid hormone",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax",
                "wax ester"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglycerides (TG)",
            "Phospholipids",
            "Cholesterol",
            "Steroids",
            "Fatty acids",
            "Waxes",
            "Glycolipids",
            "Sphingolipids",
            "Cholesteryl esters",
            "Lecithin (Phosphatidylcholine)",
            "Phosphatidylethanolamine",
            "Phosphatidylinositol",
            "Phosphatidylserine",
            "Cardiolipin",
            "Sphingomyelin",
            "Ceramides",
            "Gangliosides",
            "Eicosanoids",
            "Prostaglandins",
            "Leukotrienes",
            "Thromboxanes",
            "Endocannabinoids",
            "Dopamine",
            "Lipoproteins",
            "Very-low-density lipoprotein (VLDL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Cholesteryl esters",
                "Phosphatidylethanolamine",
                "Phosphatidylinositol",
                "Cardiolipin",
                "Sphingomyelin",
                "Glycolipids",
                "Sphingolipids",
                "Ceramides",
                "Gangliosides",
                "Prostaglandins",
                "Leukotrienes",
                "Thromboxanes",
                "Endocannabinoids"
            ],
            "mismatches": [
                "Triglycerides (TG)",
                "Phospholipids",
                "Steroids",
                "Fatty acids",
                "Waxes",
                "Lecithin (Phosphatidylcholine)",
                "Phosphatidylserine",
                "Ceramides",
                "Eicosanoids",
                "Dopamine",
                "Lipoproteins",
                "Very-low-density lipoprotein (VLDL)"
            ],
            "true_referents": [
                "C20 ceramide",
                "D-dopa",
                "Delta(9)-tetrahydrocannabinol",
                "Delta(9)-tetrahydrocannabinolic acid",
                "anabolic androgenic steroid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "cholesteryl ester",
                "dioleoyl phosphatidylethanolamine",
                "endocannabinoid",
                "essential fatty acid",
                "fatty acid",
                "ganglioside",
                "glyceride",
                "glycolipid",
                "glycosphingolipid",
                "leukotriene",
                "leukotriene E4",
                "lipopeptide",
                "lipoprotein cholesterol",
                "low-density lipoprotein cholesterol",
                "lysophosphatidylserine",
                "oleic acid",
                "phosphatidylcholine",
                "phosphatidylethanolamine",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phospholipid",
                "prostaglandin",
                "prostanoid",
                "sphingolipid",
                "sphingomyelin",
                "sphingosine",
                "steroid",
                "steroid hormone",
                "thromboxane",
                "thromboxanes A",
                "triglyceride",
                "wax",
                "wax ester"
            ],
            "TP": 14,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triacylglycerol (TAG)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin (SM)",
            "Cholesterol",
            "Cholesteryl ester",
            "Ceramide",
            "Glycosylceramide",
            "Sphingolipid",
            "Ganglioside",
            "Cardiolipin",
            "Phosphatidic acid (PA)",
            "Lysophosphatidic acid (LPA)",
            "Lysophosphatidylcholine (LPC)",
            "Diacylglycerol (DAG)",
            "Eicosanoid",
            "Prostaglandin",
            "Leukotriene",
            "Thromboxane",
            "Oxysterol",
            "Fatty acid",
            "Wax ester"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Cholesteryl ester",
                "Ceramide",
                "Glycosylceramide",
                "Sphingolipid",
                "Ganglioside",
                "Cardiolipin",
                "Prostaglandin",
                "Leukotriene",
                "Thromboxane",
                "Oxysterol",
                "Fatty acid",
                "Wax ester"
            ],
            "mismatches": [
                "Triacylglycerol (TAG)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Sphingomyelin (SM)",
                "Phosphatidic acid (PA)",
                "Lysophosphatidic acid (LPA)",
                "Lysophosphatidylcholine (LPC)",
                "Diacylglycerol (DAG)",
                "Eicosanoid"
            ],
            "true_referents": [
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1)-ceramide",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "cholesteryl ester",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "essential fatty acid",
                "fatty acid",
                "ganglioside",
                "glycosylceramide",
                "leukotriene",
                "leukotriene E4",
                "lysophosphatidic acid",
                "lysophosphatidic acids",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "oleic acid",
                "oxysterol",
                "phosphatidic acid",
                "phosphatidic acid (16:0/18:1)",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "prostaglandin",
                "sphingolipid",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "sphingosine",
                "thromboxane",
                "thromboxanes A",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax ester"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (CHOL)",
            "Triacylglycerol (TAG)",
            "Phosphatidylcholine (PC)",
            "Sphingomyelin (SM)",
            "Ceramide (CER)",
            "Glycolipid (GL)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Cardiolipin (CL)",
            "Docosahexaenoic acid (DHA)",
            "Eicosapentaenoic acid (EPA)",
            "Linoleic acid (LA)",
            "Oleic acid (OA)",
            "Palmitic acid (PA)",
            "Stearic acid (SA)",
            "Arachidonic acid (ARA)",
            "Prostaglandin E2 (PGE2)",
            "Leukotriene B4 (LTB4)",
            "Sphingosine (SPH)",
            "Diacylglycerol (DAG)",
            "Lysophosphatidylcholine (LPC)",
            "Wax esters (WE)",
            "Sebum (SEB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol (CHOL)",
                "Triacylglycerol (TAG)",
                "Phosphatidylcholine (PC)",
                "Sphingomyelin (SM)",
                "Ceramide (CER)",
                "Glycolipid (GL)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Cardiolipin (CL)",
                "Docosahexaenoic acid (DHA)",
                "Linoleic acid (LA)",
                "Oleic acid (OA)",
                "Palmitic acid (PA)",
                "Arachidonic acid (ARA)",
                "Prostaglandin E2 (PGE2)",
                "Leukotriene B4 (LTB4)",
                "Sphingosine (SPH)",
                "Lysophosphatidylcholine (LPC)",
                "Wax esters (WE)"
            ],
            "mismatches": [
                "Eicosapentaenoic acid (EPA)",
                "Stearic acid (SA)",
                "Diacylglycerol (DAG)",
                "Sebum (SEB)"
            ],
            "true_referents": [
                "C20 ceramide",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "arachidonic acid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "dimethyl sebacate",
                "docosahexaenoic acid",
                "glycolipid",
                "glycophospholipid",
                "leukotriene B4",
                "linoleic acid",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "octacosapentaenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "prostaglandin E2",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "sphingosine",
                "sphingosine(1+)",
                "stearolic acid",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax ester"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (CHO)",
            "Triglyceride (TG)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylserine (PS)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin (SM)",
            "Ceramide (Cer)",
            "Glycosphingolipid (GSL)",
            "Lysophosphatidylcholine (LPC)",
            "Lysophosphatidylethanolamine (LPE)",
            "Cardiolipin (CL)",
            "Diacylglycerol (DAG)",
            "Monoacylglycerol (MAG)",
            "Fatty Acid (FA)",
            "Eicosanoid",
            "Prostaglandin (PG)",
            "Leukotriene (LT)",
            "Thromboxane (TX)",
            "Steroid",
            "Bile Acid",
            "Lipoprotein",
            "Phosphatidic Acid (PA)",
            "Isoprenoid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol (CHO)",
                "Triglyceride (TG)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylinositol (PI)",
                "Sphingomyelin (SM)",
                "Ceramide (Cer)",
                "Glycosphingolipid (GSL)",
                "Lysophosphatidylcholine (LPC)",
                "Lysophosphatidylethanolamine (LPE)",
                "Cardiolipin (CL)",
                "Monoacylglycerol (MAG)",
                "Prostaglandin (PG)",
                "Leukotriene (LT)",
                "Thromboxane (TX)",
                "Steroid",
                "Bile Acid",
                "Phosphatidic Acid (PA)",
                "Isoprenoid"
            ],
            "mismatches": [
                "Phosphatidylserine (PS)",
                "Diacylglycerol (DAG)",
                "Fatty Acid (FA)",
                "Eicosanoid",
                "Lipoprotein"
            ],
            "true_referents": [
                "C20 ceramide",
                "androsterone",
                "bile acid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "fatty acid",
                "glyceride",
                "glycosphingolipid",
                "isoprene",
                "isoprenoid",
                "isoprenoid phosphate",
                "leukotriene",
                "leukotriene E4",
                "lipopeptide",
                "lipoprotein cholesterol",
                "low-density lipoprotein cholesterol",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "lysophosphatidylethanolamine",
                "lysophosphatidylethanolamine (0:0/18:2)",
                "monoacylglycerol",
                "monooleoylglycerol",
                "octadecanoic acid",
                "phosphatidic acid",
                "phosphatidic acid (16:0/18:1)",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phosphoglycosphingolipid",
                "prostaglandin",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "steroid",
                "steroid hormone",
                "thromboxane",
                "thromboxane anion",
                "triglyceride"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Phospholipids (PL)",
            "Triglycerides (TG)",
            "Cholesterol (CH)",
            "Sphingolipids (SL)",
            "Glycolipids (GL)",
            "Fatty acids (FA)",
            "Steroids (ST)",
            "Lecithin (LEC)",
            "Ceramides (CER)",
            "Arachidonic acid (AA)",
            "Docosahexaenoic acid (DHA)",
            "Linoleic acid (LA)",
            "Palmitic acid (PA)",
            "Oleic acid (OA)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Cholesteryl esters (CE)",
            "Cardiolipin (CL)",
            "Fat-soluble vitamins (FSV)",
            "Eicosapentaenoic acid (EPA)",
            "Stearic acid (SA)",
            "Myristic acid (MA)",
            "Capric acid (CA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Sphingolipids (SL)",
                "Glycolipids (GL)",
                "Fatty acids (FA)",
                "Steroids (ST)",
                "Ceramides (CER)",
                "Arachidonic acid (AA)",
                "Docosahexaenoic acid (DHA)",
                "Linoleic acid (LA)",
                "Oleic acid (OA)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Cholesteryl esters (CE)",
                "Cardiolipin (CL)"
            ],
            "mismatches": [
                "Phospholipids (PL)",
                "Triglycerides (TG)",
                "Lecithin (LEC)",
                "Palmitic acid (PA)",
                "Phosphatidylserine (PS)",
                "Fat-soluble vitamins (FSV)",
                "Eicosapentaenoic acid (EPA)",
                "Stearic acid (SA)",
                "Myristic acid (MA)",
                "Capric acid (CA)"
            ],
            "true_referents": [
                "10-hydroxycapric acid",
                "5-Hydroxycapric acid",
                "C20 ceramide",
                "Fattiviracin FV-9",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "Tocopheronic acid",
                "amino fatty acid",
                "anabolic androgenic steroid",
                "arachidonic acid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "cholesteryl ester",
                "docosahexaenoic acid",
                "fatty acid",
                "glyceride",
                "glycolipid",
                "glycosphingolipid",
                "linoleic acid",
                "myristoleic acid",
                "octacosapentaenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylserine (18:0/22:6)",
                "phospholipid",
                "sphingolipid",
                "sphingosine",
                "stearolic acid",
                "steroid",
                "steroid hormone",
                "trienoic fatty acid",
                "triglyceride",
                "vitamin A"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (Chol)",
            "Triglycerides (TG)",
            "Phospholipids (PL)",
            "Sphingolipids (SL)",
            "Glycolipids (GL)",
            "Diglycerides (DG)",
            "Monoglycerides (MG)",
            "Ceramides (Cer)",
            "Prostaglandins (PG)",
            "Leukotrienes (LT)",
            "Thromboxanes (TX)",
            "Lipopolysaccharides (LPS)",
            "Cardiolipins (CL)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Sterol esters (SE)",
            "Waxes (Wax)",
            "Omega-3 fatty acids (\u03c9-3)",
            "Omega-6 fatty acids (\u03c9-6)",
            "Saturated Fatty Acids (SFA)",
            "Monounsaturated Fatty Acids (MUFA)",
            "Polyunsaturated Fatty Acids (PUFA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cholesterol",
                "triglyceride",
                "sphingolipid",
                "glycolipid",
                "diglyceride",
                "prostaglandin",
                "leukotriene",
                "thromboxane",
                "lipopolysaccharide",
                "cardiolipin",
                "phosphatidylcholine",
                "phosphatidylethanolamine",
                "phosphatidylserine",
                "phosphatidylinositol",
                "sterol ester",
                "wax",
                "omega-3 fatty acid",
                "omega-6 fatty acid",
                "saturated fatty acid",
                "monounsaturated fatty acid",
                "polyunsaturated fatty acid"
            ],
            "mismatches": [
                "monoglycerides (MG)",
                "ceramides (Cer)"
            ],
            "true_referents": [
                "1,3-diglyceride",
                "1-monoglyceride",
                "2,3,4-saturated fatty acid",
                "2,3,4-saturated fatty acid(1-)",
                "C20 ceramide",
                "alpha-D-galactosyl-(1->3)-lipopolysaccharide",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "cholesteryl ester",
                "diglyceride",
                "glucosyllipopolysaccharide",
                "glyceride",
                "glycolipid",
                "glycosphingolipid",
                "leukotriene",
                "leukotriene E4",
                "lipopolysaccharide",
                "monoacylglycerol",
                "monounsaturated fatty acid",
                "octacosapentaenoic acid",
                "omega-3 fatty acid",
                "omega-6 fatty acid",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phospholipid",
                "polyunsaturated fatty acid",
                "prostaglandin",
                "saturated fatty acid",
                "sphingolipid",
                "sphingosine",
                "sterol",
                "sterol ester",
                "thromboxane",
                "thromboxanes A",
                "triglyceride",
                "unsaturated fatty acid",
                "wax",
                "wax ester"
            ],
            "TP": 21,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglycerides",
            "Phospholipids",
            "Cholesterol",
            "Sphingolipids",
            "Waxes",
            "Steroids",
            "Fatty acids",
            "Glycolipids",
            "Lipoproteins",
            "Ceramides",
            "Eicosanoids",
            "Lipopolysaccharides",
            "Plasmalogens",
            "Glycerophospholipids",
            "Lipid droplets",
            "Lipid bilayers",
            "Chylomicrons",
            "Lipid rafts",
            "Lipid peroxides",
            "Lipid metabolism",
            "Lipidomics",
            "Lipid signaling",
            "Lipid rafts",
            "Lipidomics"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Glycolipids",
                "Lipopolysaccharides",
                "Glycerophospholipids"
            ],
            "mismatches": [
                "Triglycerides",
                "Phospholipids",
                "Sphingolipids",
                "Waxes",
                "Steroids",
                "Fatty acids",
                "Lipoproteins",
                "Ceramides",
                "Eicosanoids",
                "Plasmalogens",
                "Lipid droplets",
                "Lipid bilayers",
                "Chylomicrons",
                "Lipid rafts",
                "Lipid peroxides",
                "Lipid metabolism",
                "Lipidomics",
                "Lipid signaling"
            ],
            "true_referents": [
                "C20 ceramide",
                "D-glucosyllipopolysaccharide",
                "Physalien",
                "a phosphatidylcholine hydroperoxide",
                "anabolic androgenic steroid",
                "ceramide",
                "cholesterol",
                "essential fatty acid",
                "fatty acid",
                "glucosyllipopolysaccharide",
                "glyceride",
                "glycerolipid",
                "glycerophosphoglycerols",
                "glycerophospholipid",
                "glycolipid",
                "glycosphingolipid",
                "linoleic acid hydroperoxide",
                "lipid As",
                "lipid hydroperoxide",
                "lipid micelle",
                "lipopeptide",
                "lipopolysaccharide",
                "lipoprotein cholesterol",
                "low-density lipoprotein cholesterol",
                "oleic acid",
                "phosphatidic acid",
                "phosphatidylcholine",
                "phospholipid",
                "prostaglandin",
                "prostanoid",
                "sarmentologenin",
                "sphingolipid",
                "sphingomyelin",
                "sphingosine",
                "steroid",
                "steroid hormone",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "wax",
                "wax ester"
            ],
            "TP": 4,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TAG)",
            "Phosphatidylcholine (PC)",
            "Cholesterol",
            "Sphingomyelin",
            "Ceramide",
            "Phosphatidylserine (PS)",
            "Phosphatidylethanolamine (PE)",
            "Eicosapentaenoic acid (EPA)",
            "Docosahexaenoic acid (DHA)",
            "Oleic acid",
            "Palmitic acid",
            "Stearic acid",
            "Linoleic acid",
            "Arachidonic acid",
            "Waxes",
            "Glycolipids",
            "Glycerolipids",
            "Glycerophospholipids",
            "Sphingolipids",
            "Steroids",
            "Vitamin D",
            "Vitamin E",
            "Vitamin K",
            "Lanosterol",
            "Retinoic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Sphingomyelin",
                "Ceramide",
                "Docosahexaenoic acid",
                "Oleic acid",
                "Linoleic acid",
                "Arachidonic acid",
                "Glycolipids",
                "Glycerolipids",
                "Glycerophospholipids",
                "Sphingolipids",
                "Vitamin D",
                "Lanosterol"
            ],
            "mismatches": [
                "Triglyceride (TAG)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylserine (PS)",
                "Phosphatidylethanolamine (PE)",
                "Eicosapentaenoic acid (EPA)",
                "Palmitic acid",
                "Stearic acid",
                "Waxes",
                "Steroids",
                "Vitamin E",
                "Vitamin K",
                "Retinoic acid"
            ],
            "true_referents": [
                "Palmitic acid(d3)",
                "Tocopheronic acid",
                "alpha-tocopheronolactone",
                "anabolic androgenic steroid",
                "arachidonic acid",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1)-ceramide",
                "beta-Tocopheryl quinone",
                "ceramide",
                "cholesterol",
                "docosahexaenoic acid",
                "glyceride",
                "glycerolipid",
                "glycerophosphoglycerols",
                "glycerophospholipid",
                "glycolipid",
                "glycosphingolipid",
                "lanosterol",
                "linoleic acid",
                "octacosapentaenoic acid",
                "oleic acid",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylserine (18:0/22:6)",
                "sphingolipid",
                "sphingomyelin",
                "sphingosine",
                "stearolic acid",
                "steroid",
                "steroid hormone",
                "triglyceride",
                "vitamin D",
                "vitamin D5",
                "wax",
                "wax ester"
            ],
            "TP": 13,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (CHEBI:16113)",
            "Triglyceride (CHEBI:17855)",
            "Phosphatidylcholine (CHEBI:16038)",
            "Sphingomyelin (CHEBI:17636)",
            "Ceramide (CHEBI:17761)",
            "Prostaglandin E2 (CHEBI:15551)",
            "Arachidonic acid (CHEBI:15843)",
            "Docosahexaenoic acid (CHEBI:36005)",
            "Eicosapentaenoic acid (CHEBI:28364)",
            "Cardiolipin (CHEBI:28494)",
            "Ganglioside GM1 (CHEBI:50699)",
            "Leukotriene B4 (CHEBI:15647)",
            "Platelet-activating factor (CHEBI:16595)",
            "Diacylglycerol (CHEBI:18035)",
            "Phosphatidylethanolamine (CHEBI:16038)",
            "Phosphatidylserine (CHEBI:16337)",
            "Steroid hormone (CHEBI:26962)",
            "Wax ester (CHEBI:35756)",
            "Glycosphingolipid (CHEBI:33563)",
            "Fatty acid (CHEBI:35366)",
            "Lysophosphatidylcholine (CHEBI:18348)",
            "Sphingosine (CHEBI:16393)",
            "Vitamin D (CHEBI:27300)",
            "Bile acid (CHEBI:3098)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol (CHEBI:16113)",
                "Triglyceride (CHEBI:17855)",
                "Sphingomyelin (CHEBI:17636)",
                "Ceramide (CHEBI:17761)",
                "Prostaglandin E2 (CHEBI:15551)",
                "Arachidonic acid (CHEBI:15843)",
                "Docosahexaenoic acid (CHEBI:36005)",
                "Cardiolipin (CHEBI:28494)",
                "Ganglioside GM1 (CHEBI:50699)",
                "Leukotriene B4 (CHEBI:15647)",
                "Steroid hormone (CHEBI:26962)",
                "Wax ester (CHEBI:35756)",
                "Glycosphingolipid (CHEBI:33563)",
                "Fatty acid (CHEBI:35366)",
                "Lysophosphatidylcholine (CHEBI:18348)",
                "Sphingosine (CHEBI:16393)",
                "Vitamin D (CHEBI:27300)",
                "Bile acid (CHEBI:3098)"
            ],
            "mismatches": [
                "Phosphatidylcholine (CHEBI:16038)",
                "Eicosapentaenoic acid (CHEBI:28364)",
                "Platelet-activating factor (CHEBI:16595)",
                "Diacylglycerol (CHEBI:18035)",
                "Phosphatidylethanolamine (CHEBI:16038)",
                "Phosphatidylserine (CHEBI:16337)"
            ],
            "true_referents": [
                "(5Z,7E,9E,14Z,17Z)-icosapentaenoic acid",
                "24,25-Dihydroxyvitamin D",
                "C21-steroid hormone",
                "PA(2:0/PGF1alpha)",
                "PA(PGF1alpha/a-25:0)",
                "arachidonic acid",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1)-ceramide",
                "bile acid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "diacylglycerol-O(34:1)",
                "docosahexaenoic acid",
                "eicosa-5,8,11,14,17-pentaenoic acid",
                "fatty acid",
                "fatty acid anion 19:0",
                "ganglioside GM1",
                "glyceride",
                "glycosphingolipid",
                "leukotriene B4",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "phosphatidylcholine (P-16:0/18:3)",
                "phosphatidylethanolamine (P-16:0/18:2)",
                "phosphatidylserine (18:0/22:6)",
                "phosphoglycosphingolipid",
                "prostaglandin E2",
                "sphingomyelin",
                "sphingomyelin 34:0",
                "sphingosine",
                "sphingosine(1+)",
                "steroid hormone",
                "triglyceride",
                "vitamin D",
                "wax ester"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TG)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin (SM)",
            "Cholesterol (Chol)",
            "Cholesteryl ester (CE)",
            "Ceramide (Cer)",
            "Glucosylceramide (GlcCer)",
            "Galactosylceramide (GalCer)",
            "Lactosylceramide (LacCer)",
            "Ganglioside GM3",
            "Ganglioside GM2",
            "Ganglioside GM1",
            "Sulfatide (ST)",
            "Plasmalogen",
            "Cardiolipin (CL)",
            "Lysophosphatidylcholine (LPC)",
            "Lysophosphatidylethanolamine (LPE)",
            "Monoacylglycerol (MAG)",
            "Diacylglycerol (DAG)",
            "Wax ester",
            "Sterol ester"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triglyceride (TG)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Sphingomyelin (SM)",
                "Cholesterol (Chol)",
                "Cholesteryl ester (CE)",
                "Ceramide (Cer)",
                "Glucosylceramide (GlcCer)",
                "Galactosylceramide (GalCer)",
                "Lactosylceramide (LacCer)",
                "Ganglioside GM3",
                "Ganglioside GM2",
                "Ganglioside GM1",
                "Sulfatide (ST)",
                "Cardiolipin (CL)",
                "Lysophosphatidylcholine (LPC)",
                "Lysophosphatidylethanolamine (LPE)",
                "Monoacylglycerol (MAG)",
                "Wax ester",
                "Sterol ester"
            ],
            "mismatches": [
                "Plasmalogen",
                "Diacylglycerol (DAG)"
            ],
            "true_referents": [
                "C20 ceramide",
                "C24 Sulfatide",
                "Lactosylceramide (d18:1/12:0)",
                "Physalien",
                "aminophospholipid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "cholesteryl ester",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "galactosylceramide",
                "ganglioside GM1",
                "ganglioside GM2 (2:0)",
                "ganglioside GM3",
                "glucosylceramide",
                "glyceride",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "lysophosphatidylethanolamine",
                "lysophosphatidylethanolamine (0:0/18:2)",
                "monoacylglycerol",
                "monooleoylglycerol",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "sarmentologenin",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "steroid ester",
                "sterol ester",
                "triglyceride",
                "wax ester"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (C27H46O)",
            "Phosphatidylcholine (PC)",
            "Triacylglycerol (TAG)",
            "Sphingomyelin (SM)",
            "Fatty acid (FA)",
            "Steroid hormone (e.g., Estrogen, Testosterone)",
            "Wax ester",
            "Prostaglandin (PG)",
            "Leukotriene (LT)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Cardiolipin (CL)",
            "Ceramide (Cer)",
            "Glycolipid (e.g., Ganglioside)",
            "Lipoprotein (e.g., HDL, LDL, VLDL)",
            "Vitamin A (Retinol)",
            "Vitamin D (Calciferol)",
            "Vitamin E (Tocopherol)",
            "Vitamin K (Phylloquinone)",
            "Bile acid (e.g., Cholic acid, Chenodeoxycholic acid)",
            "Monoacylglycerol (MAG)",
            "Diacylglycerol (DAG)",
            "Phosphatidylglycerol (PG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Phosphatidylcholine",
                "Sphingomyelin",
                "Fatty acid",
                "Steroid hormone",
                "Wax ester",
                "Prostaglandin",
                "Leukotriene",
                "Phosphatidylethanolamine",
                "Phosphatidylserine",
                "Phosphatidylinositol",
                "Cardiolipin",
                "Ceramide",
                "Glycolipid",
                "Vitamin A",
                "Vitamin D",
                "Bile acid",
                "Monoacylglycerol",
                "Phosphatidylglycerol"
            ],
            "mismatches": [
                "Cholesterol (C27H46O)",
                "Triacylglycerol (TAG)",
                "Vitamin E (Tocopherol)",
                "Vitamin K (Phylloquinone)",
                "Diacylglycerol (DAG)",
                "Lipoprotein (e.g., HDL, LDL, VLDL)"
            ],
            "true_referents": [
                "(24S,25)-epoxy-7alpha-hydroxycholesterol",
                "(E,E)-Boviquinone 3",
                "C20 ceramide",
                "Tocopheronic acid",
                "alhpa-tocopheronic acid",
                "alpha-tocopheronolactone",
                "beta-Tocopheryl quinone",
                "beta-carotene",
                "bile acid",
                "cardiolipin",
                "ceramide",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "estradiol",
                "fatty acid",
                "ganglioside",
                "glycolipid",
                "high-density lipoprotein cholesterol",
                "leukotriene",
                "leukotriene E4",
                "lipoprotein cholesterol",
                "low-density lipoprotein cholesterol",
                "monoacylglycerol",
                "monooleoylglycerol",
                "multiorthoquinone",
                "octadecanoic acid",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "prostaglandin",
                "retinol",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "steroid",
                "steroid hormone",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride",
                "vitamin A",
                "vitamin D",
                "vitamin D5",
                "wax ester"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (CHOL)",
            "Triglyceride (TG)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin (SM)",
            "Diacylglycerol (DAG)",
            "Monoacylglycerol (MAG)",
            "Fatty Acid (FA)",
            "Palmitic Acid (PA)",
            "Stearic Acid (SA)",
            "Oleic Acid (OA)",
            "Linoleic Acid (LA)",
            "Arachidonic Acid (AA)",
            "Eicosapentaenoic Acid (EPA)",
            "Docosahexaenoic Acid (DHA)",
            "Cardiolipin (CL)",
            "Ganglioside (GM)",
            "Ceramide (Cer)",
            "Phosphatidic Acid (PA)",
            "Lysophosphatidylcholine (LPC)",
            "Lysophosphatidylethanolamine (LPE)",
            "Lysophosphatidylserine (LPS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol (CHOL)",
                "Triglyceride (TG)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Sphingomyelin (SM)",
                "Monoacylglycerol (MAG)",
                "Fatty Acid (FA)",
                "Oleic Acid (OA)",
                "Linoleic Acid (LA)",
                "Arachidonic Acid (AA)",
                "Docosahexaenoic Acid (DHA)",
                "Cardiolipin (CL)",
                "Ceramide (Cer)",
                "Phosphatidic Acid (PA)",
                "Lysophosphatidylcholine (LPC)",
                "Lysophosphatidylethanolamine (LPE)"
            ],
            "mismatches": [
                "Diacylglycerol (DAG)",
                "Palmitic Acid (PA)",
                "Stearic Acid (SA)",
                "Eicosapentaenoic Acid (EPA)",
                "Ganglioside (GM)",
                "Lysophosphatidylserine (LPS)"
            ],
            "true_referents": [
                "C20 ceramide",
                "Ganglioside GM1 (18:1/12:0)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "arachidonic acid",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "diacylglycerol-O(34:1)",
                "diarachidonoylglycerol",
                "docosahexaenoic acid",
                "fatty acid",
                "glyceride",
                "linoleic acid",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "lysophosphatidylethanolamine",
                "lysophosphatidylethanolamine (0:0/18:2)",
                "lysophosphatidylserine",
                "monoacylglycerol",
                "monooleoylglycerol",
                "octacosapentaenoic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "phosphatidic acid",
                "phosphatidic acid (16:0/18:1)",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "stearolic acid",
                "triglyceride"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Cholesterol (Chol)",
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Sphingomyelin (SM)",
            "Triacylglycerol (TAG)",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Lysophosphatidylcholine (LPC)",
            "Lysophosphatidylethanolamine (LPE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Glycosphingolipid",
            "Ceramide",
            "Sphingosine",
            "Glycophospholipid",
            "Lipopolysaccharide (LPS)",
            "Lipoteichoic acid (LTA)",
            "Cardiolipin",
            "Phosphatidylglycerol (PG)",
            "Phosphatidylglycerophosphate (PGP)",
            "Sphingomyelinase",
            "Phospholipase A2",
            "Lipid A",
            "Glycosphingolipid-anchored protein",
            "Sphingosine-1-phosphate (S1P)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol (Chol)",
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Sphingomyelin (SM)",
                "Triacylglycerol (TAG)",
                "Lysophosphatidylcholine (LPC)",
                "Lysophosphatidylethanolamine (LPE)",
                "Ceramide",
                "Sphingosine",
                "Glycophospholipid",
                "Lipopolysaccharide (LPS)",
                "Cardiolipin",
                "Phosphatidylglycerol (PG)",
                "Lipid A",
                "Sphingosine-1-phosphate (S1P)"
            ],
            "mismatches": [
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Lipoteichoic acid (LTA)",
                "Phosphatidylglycerophosphate (PGP)",
                "Sphingomyelinase",
                "Phospholipase A2",
                "Glycosphingolipid-anchored protein"
            ],
            "true_referents": [
                "alpha-D-galactosyl-(1->3)-lipopolysaccharide",
                "beta-D-galactosyl-(1->4)-beta-D-glucosyl-(1<->1)-ceramide",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "glucosyllipopolysaccharide",
                "glycoglycerolipid",
                "glycophospholipid",
                "glycosphingolipid",
                "lipid A",
                "lipoic acid",
                "lipopolysaccharide",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "lysophosphatidylethanolamine",
                "lysophosphatidylethanolamine (0:0/18:2)",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phosphoglycosphingolipid",
                "prostaglandin A2",
                "sphinganine",
                "sphingolipid",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "sphingosine",
                "sphingosine 1-phosphate",
                "triacylglycerol 16:0_16:0_16:0",
                "triglyceride"
            ],
            "TP": 15,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            "Triglyceride (TG)",
            "Phosphatidylcholine (PC)",
            "Sphingomyelin (SM)",
            "Cholesterol",
            "Ganglioside (GM1)",
            "Ceramide (Cer)",
            "Sphingosine (Sph)",
            "Fatty acid (FA)",
            "Phosphatidylinositol (PI)",
            "Cardiolipin (CL)",
            "Lecithin",
            "Lipoxin (LX)",
            "Prostaglandin (PG)",
            "Leukotriene (LT)",
            "Thromboxane (TX)",
            "Eicosapentaenoic acid (EPA)",
            "Docosahexaenoic acid (DHA)",
            "Omega-3 fatty acid",
            "Omega-6 fatty acid",
            "Saturated fatty acid",
            "Monounsaturated fatty acid",
            "Polyunsaturated fatty acid",
            "Glycosphingolipid",
            "Phosphoglyceride",
            "Diacylglycerol (DAG)",
            "Monoglyceride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholesterol",
                "Ceramide (Cer)",
                "Sphingosine (Sph)",
                "Fatty acid (FA)",
                "Phosphatidylinositol (PI)",
                "Cardiolipin (CL)",
                "Lipoxin (LX)",
                "Prostaglandin (PG)",
                "Leukotriene (LT)",
                "Thromboxane (TX)",
                "Docosahexaenoic acid (DHA)",
                "Omega-3 fatty acid",
                "Omega-6 fatty acid",
                "Saturated fatty acid",
                "Monounsaturated fatty acid",
                "Polyunsaturated fatty acid",
                "Glycosphingolipid"
            ],
            "mismatches": [
                "Triglyceride (TG)",
                "Phosphatidylcholine (PC)",
                "Sphingomyelin (SM)",
                "Ganglioside (GM1)",
                "Lecithin",
                "Eicosapentaenoic acid (EPA)",
                "Phosphoglyceride",
                "Diacylglycerol (DAG)",
                "Monoglyceride"
            ],
            "true_referents": [
                "2,3,4-saturated fatty acid",
                "2,3,4-saturated fatty acid(1-)",
                "C20 ceramide",
                "cardiolipin",
                "ceramide",
                "cholesterol",
                "docosahexaenoic acid",
                "fatty acid",
                "ganglioside GM1",
                "glyceride",
                "glycerophosphoglycerol",
                "glycosphingolipid",
                "leukotriene",
                "leukotriene E4",
                "lipoxin",
                "monounsaturated fatty acid",
                "octacosapentaenoic acid",
                "octadecanoic acid",
                "omega-3 fatty acid",
                "omega-6 fatty acid",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "phosphatidylinositol phosphate",
                "phosphoglycosphingolipid",
                "phospholipid",
                "polyunsaturated fatty acid",
                "polyunsaturated fatty ester",
                "prostaglandin",
                "saturated fatty acid",
                "sphingomyelin",
                "sphingomyelin 35:0",
                "sphingosine",
                "sphingosine(1+)",
                "thromboxane",
                "thromboxane anion",
                "triglyceride",
                "unsaturated fatty acid"
            ],
            "TP": 17,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "lipid",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "lipid",
                "Canonical Name": "lipid"
            },
            {
                "Referent": "phospholipid",
                "Canonical Name": "phospholipid"
            },
            {
                "Referent": "glycerolipid",
                "Canonical Name": "glycerolipid"
            },
            {
                "Referent": "glycerophospholipid",
                "Canonical Name": "glycerophospholipid"
            },
            {
                "Referent": "phosphatide",
                "Canonical Name": "phosphatide"
            },
            {
                "Referent": "fat",
                "Canonical Name": "fat"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            },
            {
                "Referent": "lipide",
                "Canonical Name": "lipide"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "phospholipid"
            ],
            "mismatches": [
                "lipid",
                "glycerolipid",
                "glycerophospholipid",
                "phosphatide",
                "fat",
                "lipide"
            ],
            "true_referents": [
                "cis-9,10-epoxyoctadecanoic acid",
                "diacylglycerol (18:0/18:1/0:0)",
                "lysophosphatidylcholine(0:0/16:0)",
                "lysophosphatidylcholine(0:0/18:0)",
                "phosphatidylcholine O-44:0",
                "phosphatidylglycerol",
                "phospholipid",
                "triacylglycerol 16:0_16:0_16:0",
                "triacylglycerol 16:0_16:0_18:0"
            ],
            "TP": 1,
            "FP": 6,
            "FN": 0
        }
    }
]