[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "sodium lauryl sulfate (SLS)",
            "sodium dodecyl sulfate (SDS)",
            "dodecyl dimethyl benzyl ammonium chloride (DDAC)",
            "ethanol",
            "propylene glycol",
            "glycerol",
            "sorbitol",
            "polyethylene glycol (PEG)",
            "dodecyltrimethylammonium bromide (DTAB)",
            "cetyltrimethylammonium bromide (CTAB)",
            "decyltrimethylammonium bromide (DTAB-10)",
            "tetradecyltrimethylammonium bromide (DTAB-14)",
            "hexadecyltrimethylammonium bromide (DTAB-16)",
            "octadecyltrimethylammonium bromide (DTAB-18)",
            "sodium cholate",
            "sodium deoxycholate",
            "sodium taurocholate",
            "sodium taurodeoxycholate",
            "Tween 20",
            "Tween 80",
            "Brij 35",
            "Pluronic F127",
            "Cremophor EL",
            "SDS-PAGE buffer"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sodium dodecyl sulfate (SDS)",
                "dodecyltrimethylammonium bromide (DTAB)",
                "cetyltrimethylammonium bromide (CTAB)",
                "glycerol"
            ],
            "mismatches": [
                "sodium lauryl sulfate (SLS)",
                "dodecyl dimethyl benzyl ammonium chloride (DDAC)",
                "ethanol",
                "propylene glycol",
                "sorbitol",
                "polyethylene glycol (PEG)",
                "decyltrimethylammonium bromide (DTAB-10)",
                "tetradecyltrimethylammonium bromide (DTAB-14)",
                "hexadecyltrimethylammonium bromide (DTAB-16)",
                "octadecyltrimethylammonium bromide (DTAB-18)",
                "sodium cholate",
                "sodium deoxycholate",
                "sodium taurocholate",
                "sodium taurodeoxycholate",
                "Tween 20",
                "Tween 80",
                "Brij 35",
                "Pluronic F127",
                "Cremophor EL",
                "SDS-PAGE buffer"
            ],
            "true_referents": [
                "(R)-edelfosine",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "2,3-Diacetoxypropyl stearate",
                "4-dodecylbenzenesulfonic acid",
                "D-alanyl-L-alanyl poly(glycerol phosphate)",
                "Glycerol 1-propanoate",
                "LPE O-16:1",
                "LPE O-18:2",
                "PG(18:0/20:3)",
                "PG(35:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "SDZ 35-682",
                "Triton X-100",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "choline alfoscerate",
                "decyltrimethylammonium bromide",
                "diglycerol",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glyceride",
                "glycerol",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "oleyl acetate",
                "phosphatidylcholine 27:1",
                "phosphatidylinositol 35:1",
                "pluronic P-123",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Triton X-100",
            "Tween 20",
            "Tween 80",
            "Brij 35",
            "Sodium lauryl ether sulfate (SLES)",
            "Lecithin",
            "Sorbitan monostearate",
            "Pluronic F-68",
            "Chloroform",
            "Carbon tetrachloride",
            "Detergent (generic)",
            "Surfactin",
            "Biosurfactant (generic)",
            "Polysorbate 20",
            "Polysorbate 80",
            "Sodium lauryl sulfate (SLS)",
            "Sodium dodecylbenzenesulfonate (SDBS)",
            "Benzalkonium chloride",
            "Cetylpyridinium chloride",
            "Octylphenol ethoxylate",
            "Alkyl polyglucoside",
            "Lauryl glucoside"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "Detergent (generic)",
                "Surfactin",
                "Polysorbate 20",
                "Polysorbate 80",
                "Benzalkonium chloride",
                "Cetylpyridinium chloride"
            ],
            "mismatches": [
                "Sodium dodecyl sulfate (SDS)",
                "Cetyltrimethylammonium bromide (CTAB)",
                "Tween 20",
                "Tween 80",
                "Brij 35",
                "Sodium lauryl ether sulfate (SLES)",
                "Lecithin",
                "Sorbitan monostearate",
                "Pluronic F-68",
                "Chloroform",
                "Carbon tetrachloride",
                "Biosurfactant (generic)",
                "Sodium lauryl sulfate (SLS)",
                "Sodium dodecylbenzenesulfonate (SDBS)",
                "Octylphenol ethoxylate",
                "Alkyl polyglucoside",
                "Lauryl glucoside"
            ],
            "true_referents": [
                "1,2,3-Tris(chloromethoxy)propane",
                "1-alkylglycerol",
                "1-monostearoylglycerol",
                "2-(perfluorohexyl)ethyl dimorpholinophosphinate",
                "2-(perfluorooctyl)ethyl dimorpholinophosphinate",
                "2-ethylhexyl sulfate",
                "2-lauroylglycerol",
                "3-dodecylbenzenesulfonic acid",
                "4-dodecylbenzenesulfonic acid",
                "4-octylphenol",
                "PG(18:0/20:3)",
                "PG(35:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "SDZ 35-682",
                "Triton X-100",
                "alkylglycerol",
                "benzalkonium chloride",
                "cetylpyridinium bromide",
                "cetylpyridinium chloride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "detergent",
                "dibutyrin",
                "dodecylbenzenesulfonic acid",
                "glycerolipid",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol 35:1",
                "pluronic P-123",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "triethanolamine",
                "triethanolamine hydrochloride"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Soap (Sodium Lauryl Sulfate)",
            "Detergent (Sodium Dodecyl Sulfate)",
            "Shampoo",
            "Dishwashing Liquid",
            "Body Wash",
            "Hand Soap",
            "Laundry Detergent",
            "Bubble Bath",
            "Toothpaste",
            "Mouthwash",
            "Hand Sanitizer",
            "Shaving Cream",
            "Washing Powder",
            "Liquid Hand Soap",
            "Bath Bomb",
            "Car Wash Soap",
            "Floor Cleaner",
            "Window Cleaner",
            "Dish Soap",
            "Bath Soap",
            "Hand Dishwashing Liquid",
            "Liquid Laundry Soap",
            "Liquid Hand Soap with Antibacterial",
            "Bubble Solution"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Detergent (Sodium Dodecyl Sulfate)"
            ],
            "mismatches": [
                "Soap (Sodium Lauryl Sulfate)",
                "Shampoo",
                "Dishwashing Liquid",
                "Body Wash",
                "Hand Soap",
                "Laundry Detergent",
                "Bubble Bath",
                "Toothpaste",
                "Mouthwash",
                "Hand Sanitizer",
                "Shaving Cream",
                "Washing Powder",
                "Liquid Hand Soap",
                "Bath Bomb",
                "Car Wash Soap",
                "Floor Cleaner",
                "Window Cleaner",
                "Dish Soap",
                "Bath Soap",
                "Hand Dishwashing Liquid",
                "Liquid Laundry Soap",
                "Liquid Hand Soap with Antibacterial",
                "Bubble Solution"
            ],
            "true_referents": [
                "CL(10:0/10:0/10:0/11:0)",
                "PC(20:0/24:0)",
                "PHOOA-PE",
                "PON-PE",
                "Triton X-100",
                "benzalkonium chloride",
                "detergent",
                "nonionic surfactant",
                "sodium dodecyl sulfate",
                "surfactin"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium Dodecyl Sulfate (SDS)",
            "Detergent",
            "Soap",
            "Surfactant",
            "Bile Salts",
            "Pulmonary Surfactant (PS)",
            "Docosahexaenoic Acid (DHA)",
            "Polyoxyethylene Glycol Octylphenol Ether (Triton X-100)",
            "Polyethylene Glycol (PEG)",
            "Alkyl Polyglucoside (APG)",
            "Cocamidopropyl Betaine (CAPB)",
            "Sodium Lauryl Ether Sulfate (SLES)",
            "Lecithin",
            "Lysophosphatidylcholine (LPC)",
            "Fluorosurfactant",
            "Silicone Surfactant",
            "Saponin",
            "Glycolipids",
            "Fatty Acid",
            "Emulsifier",
            "Wetting Agent",
            "Dispersant",
            "Foaming Agent",
            "Protein Denaturant (in some cases)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium Dodecyl Sulfate (SDS)",
                "Detergent",
                "Polyoxyethylene Glycol Octylphenol Ether (Triton X-100)",
                "Cocamidopropyl Betaine (CAPB)",
                "Lysophosphatidylcholine (LPC)"
            ],
            "mismatches": [
                "Soap",
                "Surfactant",
                "Bile Salts",
                "Pulmonary Surfactant (PS)",
                "Docosahexaenoic Acid (DHA)",
                "Polyethylene Glycol (PEG)",
                "Alkyl Polyglucoside (APG)",
                "Sodium Lauryl Ether Sulfate (SLES)",
                "Lecithin",
                "Fluorosurfactant",
                "Silicone Surfactant",
                "Saponin",
                "Glycolipids",
                "Fatty Acid",
                "Emulsifier",
                "Wetting Agent",
                "Dispersant",
                "Foaming Agent",
                "Protein Denaturant (in some cases)"
            ],
            "true_referents": [
                "1-linolenoyl-3-oleoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2-ethylhexyl sulfate",
                "Capsoside A",
                "D-alanyl-L-alanyl poly(glycerol phosphate)",
                "Glycolipid G2",
                "Glycolipid G3",
                "Glycolipid G4",
                "PS-PA",
                "Triton X-100",
                "alpha-D-glucuronosyl diglyceride",
                "amphiphile",
                "beta-D-galactopyranosyl diglyceride",
                "cocamidopropyl betaine",
                "detergent",
                "digitonin",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "glyceride",
                "glycerol phenylbutyrate",
                "glycerolipid",
                "lauramidopropyl betaine",
                "lysophosphatidylcholine",
                "lysophosphatidylcholine (0:0/18:3)",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "omega-3-arachidonoyl-containing glycerolipid",
                "perfluorobutanesulfonic acid",
                "perfluorononanoic acid",
                "perfluorooctanoic acid",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A",
                "triglyceride"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium Lauryl Sulfate (SLS)",
            "Sodium Laureth Sulfate (SLES)",
            "Cocamidopropyl Betaine (CAPB)",
            "Lauryl Glucoside",
            "Decyl Glucoside",
            "Polysorbate 20",
            "Polysorbate 80",
            "Cetyl Alcohol",
            "Stearyl Alcohol",
            "Sorbitan Monostearate",
            "Sorbitan Monolaurate",
            "Sorbitan Monooleate",
            "Glyceryl Stearate",
            "Lecithin",
            "Benzalkonium Chloride",
            "Sodium Cocoyl Isethionate",
            "Cocamidopropyl Hydroxysultaine",
            "Disodium Laureth Sulfosuccinate",
            "Ammonium Lauryl Sulfate",
            "Ammonium Laureth Sulfate",
            "Lauramine Oxide",
            "Myristamine Oxide",
            "Cocamide MEA",
            "Cocamide DEA"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Polysorbate 20",
                "Polysorbate 80",
                "Benzalkonium Chloride"
            ],
            "mismatches": [
                "Sodium Lauryl Sulfate (SLS)",
                "Sodium Laureth Sulfate (SLES)",
                "Cocamidopropyl Betaine (CAPB)",
                "Lauryl Glucoside",
                "Decyl Glucoside",
                "Cetyl Alcohol",
                "Stearyl Alcohol",
                "Sorbitan Monostearate",
                "Sorbitan Monolaurate",
                "Sorbitan Monooleate",
                "Glyceryl Stearate",
                "Lecithin",
                "Sodium Cocoyl Isethionate",
                "Cocamidopropyl Hydroxysultaine",
                "Disodium Laureth Sulfosuccinate",
                "Ammonium Lauryl Sulfate",
                "Ammonium Laureth Sulfate",
                "Lauramine Oxide",
                "Myristamine Oxide",
                "Cocamide MEA",
                "Cocamide DEA"
            ],
            "true_referents": [
                "(R)-edelfosine",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-monostearoylglycerol",
                "1-myristoyl-3-oleoylglycerol",
                "1-stearoyl-2-oleoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-butyloctyl hydrogen sulfate",
                "2-ethylhexyl sulfate",
                "2-lauroylglycerol",
                "4-dodecylbenzenesulfonic acid",
                "Phosphatidylethanolamine lyso alkenyl 18",
                "alkylglycerol",
                "benzalkonium chloride",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "dodecylbenzenesulfonic acid",
                "dodecyldimethylamine N-oxide",
                "dodecyltrimethylammonium bromide",
                "glyceride",
                "glycerol",
                "glycerol phenylbutyrate",
                "glycerolipid",
                "lauramidopropyl betaine",
                "lauryl sulfobetaine",
                "monoacyl-3-O-(beta-D-galactosyl)-sn-glycerol",
                "monoacylglycerol",
                "monooctanoylglycerol",
                "monooleoylglycerol",
                "nonionic surfactant",
                "oleyl acetate",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "triethanolamine",
                "tristearoylglycerol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium Lauryl Sulfate (SLS)",
            "Cocamidopropyl Betaine (CAPB)",
            "Triton X-100",
            "Tween 20",
            "Sodium Dodecyl Sulfate (SDS)",
            "Polysorbate 80",
            "Octylphenol Ethoxylate",
            "Cetyl Trimethyl Ammonium Bromide (CTAB)",
            "Dodecylbenzenesulfonic Acid",
            "Nonylphenol Ethoxylate",
            "Sodium Oleate",
            "Sorbitan Monostearate (Span 60)",
            "Lauryl Glucoside",
            "Stearyl Alcohol",
            "Polyethylene Glycol (PEG) 400",
            "Alkyl Polyglycosides",
            "Cocamidopropyl Hydroxysultaine",
            "Glycerol Monolaurate",
            "Sodium Stearoyl Lactylate",
            "Lecithin",
            "Sodium Caprate",
            "Phenonip",
            "Silicone Surfactants",
            "Benzalkonium Chloride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cocamidopropyl Betaine (CAPB)",
                "Triton X-100",
                "Sodium Dodecyl Sulfate (SDS)",
                "Polysorbate 80",
                "Cetyl Trimethyl Ammonium Bromide (CTAB)",
                "Dodecylbenzenesulfonic Acid",
                "Benzalkonium Chloride"
            ],
            "mismatches": [
                "Sodium Lauryl Sulfate (SLS)",
                "Tween 20",
                "Octylphenol Ethoxylate",
                "Nonylphenol Ethoxylate",
                "Sodium Oleate",
                "Sorbitan Monostearate (Span 60)",
                "Lauryl Glucoside",
                "Stearyl Alcohol",
                "Polyethylene Glycol (PEG) 400",
                "Alkyl Polyglycosides",
                "Cocamidopropyl Hydroxysultaine",
                "Glycerol Monolaurate",
                "Sodium Stearoyl Lactylate",
                "Lecithin",
                "Sodium Caprate",
                "Phenonip",
                "Silicone Surfactants"
            ],
            "true_referents": [
                "1-alkylglycerol",
                "1-monostearoylglycerol",
                "1-stearoyl-2-oleoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2-butyloctyl hydrogen sulfate",
                "2-dodecylbenzenesulfonic acid",
                "2-ethylhexyl sulfate",
                "2-lauroylglycerol",
                "3-dodecylbenzenesulfonic acid",
                "4-octylphenol",
                "PG(18:0/20:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PHHdiA-PI",
                "PHODA-PI",
                "PHOOA-PI",
                "Triton X-100",
                "alkylglycerol",
                "benzalkonium chloride",
                "bisphenol A (3-chloro-2-hydroxypropyl) (2,3-dihydroxypropyl) ether",
                "cetyltrimethylammonium bromide",
                "cocamidopropyl betaine",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerol phenylbutyrate",
                "glycerolipid",
                "lauramidopropyl betaine",
                "monoacylglycerol",
                "monoalkylglycerol",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "oleyl oleate",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate",
                "surfactin",
                "surfactin A"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium Lauryl Sulfate (SLS)",
            "Dioctyl Sodium Sulfosuccinate (DSS)",
            "Sodium Laureth Sulfate (SLES)",
            "Cocamidopropyl Betaine (CAPB)",
            "Ammonium Lauryl Sulfate (ALS)",
            "Decyl Glucoside",
            "Lauryl Glucoside",
            "Caprylic/Capric Glucoside",
            "Sodium Cocoyl Isethionate (SCI)",
            "Sodium Lauroyl Isethionate (SLI)",
            "Sodium Lauroyl Methyl Isethionate (SLMI)",
            "Sodium Lauroyl Sarcosinate",
            "Sodium Cocoamphoacetate",
            "Sodium Methyl Cocoyl Taurate",
            "Sodium Lauroyl Glutamate",
            "Sodium Cocoyl Glutamate",
            "Sodium Cocoyl Glycinate",
            "Sodium Lauroyl Lactylate",
            "Sodium Caproyl/Lauroyl Lactylate",
            "Sodium Cocoyl Apple Amino Acids",
            "Sodium Cocoyl Hydrolyzed Soy Protein",
            "Sodium Cocoyl Hydrolyzed Wheat Protein",
            "Sodium Cocoyl Hydrolyzed Collagen",
            "Sodium Cocoyl Hydrolyzed Keratin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cocamidopropyl betaine"
            ],
            "mismatches": [
                "Sodium Lauryl Sulfate (SLS)",
                "Dioctyl Sodium Sulfosuccinate (DSS)",
                "Sodium Laureth Sulfate (SLES)",
                "Ammonium Lauryl Sulfate (ALS)",
                "Decyl Glucoside",
                "Lauryl Glucoside",
                "Caprylic/Capric Glucoside",
                "Sodium Cocoyl Isethionate (SCI)",
                "Sodium Lauroyl Isethionate (SLI)",
                "Sodium Lauroyl Methyl Isethionate (SLMI)",
                "Sodium Lauroyl Sarcosinate",
                "Sodium Cocoamphoacetate",
                "Sodium Methyl Cocoyl Taurate",
                "Sodium Lauroyl Glutamate",
                "Sodium Cocoyl Glutamate",
                "Sodium Cocoyl Glycinate",
                "Sodium Lauroyl Lactylate",
                "Sodium Caproyl/Lauroyl Lactylate",
                "Sodium Cocoyl Apple Amino Acids",
                "Sodium Cocoyl Hydrolyzed Soy Protein",
                "Sodium Cocoyl Hydrolyzed Wheat Protein",
                "Sodium Cocoyl Hydrolyzed Collagen",
                "Sodium Cocoyl Hydrolyzed Keratin"
            ],
            "true_referents": [
                "1,2-Distearoyl-sn-glycero-3-phosphate (sodium salt)",
                "1,2-caproyl-3-alpha-linolenoylglycerol",
                "1,2-dioleoyl-3-lauroyl-sn-glycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-O-(phenylacetyl)glycerol",
                "1-Palmitoyl-2-hydroxy-sn-glycero-3-PE",
                "1-capryloyl-3-oleoylglycerol",
                "1-lauroyl-sn-glycerol",
                "1-oleoyl-3-palmitoylglycerol",
                "1-palmitoyl-2-glutaryl phosphatidylcholine",
                "1-palmityl-2-acetyl-3-lauroyl-sn-glycerol",
                "2,3-Diacetoxypropyl stearate",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-lauroylglycerol",
                "3-(Acetyloxy)-2-hydroxypropyl icosanoate",
                "4-dodecylbenzenesulfonic acid",
                "alpha-D-glucosyl-(1->6)-alpha-D-glucosyl-(1->6)-alpha-D-glucosyl-(1->3')-1-alkyl-2-acylglycerol",
                "cocamidopropyl betaine",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerol phenylbutyrate",
                "lauramidopropyl betaine",
                "lauryl sulfobetaine",
                "linoleoyl containing 1,2,3-triacyl-sn-glycerol",
                "nonionic surfactant",
                "oleyl acetate",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Surfactant",
            "Soap",
            "Detergent",
            "Shampoo",
            "Bubble bath",
            "Hand sanitizer",
            "Emulsifier",
            "Wetting agent",
            "Foaming agent",
            "Fabric softener",
            "Laundry detergent",
            "Toothpaste",
            "Mouthwash",
            "Cosmetic cream",
            "Body wash",
            "Floor cleaner",
            "Shaving cream",
            "Paint additive",
            "Insecticide",
            "Firefighting foam",
            "Industrial cleaner",
            "Disinfectant",
            "Lubricant",
            "Textile dye"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Detergent"
            ],
            "mismatches": [
                "Surfactant",
                "Soap",
                "Shampoo",
                "Bubble bath",
                "Hand sanitizer",
                "Emulsifier",
                "Wetting agent",
                "Foaming agent",
                "Fabric softener",
                "Laundry detergent",
                "Toothpaste",
                "Mouthwash",
                "Cosmetic cream",
                "Body wash",
                "Floor cleaner",
                "Shaving cream",
                "Paint additive",
                "Insecticide",
                "Firefighting foam",
                "Industrial cleaner",
                "Disinfectant",
                "Lubricant",
                "Textile dye"
            ],
            "true_referents": [
                "CL(10:0/10:0/10:0/11:0)",
                "PHOOA-PE",
                "PON-PE",
                "Triton X-100",
                "amphiphile",
                "benzalkonium chloride",
                "detergent",
                "glycerol",
                "nonionic surfactant",
                "perfluorohexyloctane",
                "perfluorooctanoic acid",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Sodium lauryl sulfate (SLS)",
            "Triton X-100",
            "Tween 20 (Polysorbate 20)",
            "Tween 80 (Polysorbate 80)",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Benzalkonium chloride",
            "Cocamidopropyl betaine",
            "Nonidet P-40",
            "Brij 35",
            "Span 20 (Sorbitan monolaurate)",
            "Span 80 (Sorbitan monooleate)",
            "Decyl glucoside",
            "Lauryl glucoside",
            "Hexadecyltrimethylammonium bromide",
            "Poloxamer 407",
            "Steareth-20",
            "Propylene glycol monostearate",
            "Alkyl polyglucoside",
            "Lauramine oxide",
            "Oleth-20",
            "Capryl glucoside",
            "Lauryl ether sulfate",
            "Dimethyldioctadecylammonium bromide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "polysorbate 20",
                "polysorbate 80",
                "cetyltrimethylammonium bromide",
                "benzalkonium chloride",
                "cocamidopropyl betaine",
                "Nonidet P-40"
            ],
            "mismatches": [
                "Sodium dodecyl sulfate (SDS)",
                "Sodium lauryl sulfate (SLS)",
                "Brij 35",
                "Span 20 (Sorbitan monolaurate)",
                "Span 80 (Sorbitan monooleate)",
                "Decyl glucoside",
                "Lauryl glucoside",
                "Hexadecyltrimethylammonium bromide",
                "Poloxamer 407",
                "Steareth-20",
                "Propylene glycol monostearate",
                "Alkyl polyglucoside",
                "Lauramine oxide",
                "Oleth-20",
                "Capryl glucoside",
                "Lauryl ether sulfate",
                "Dimethyldioctadecylammonium bromide"
            ],
            "true_referents": [
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-alkylglycerol",
                "1-capryl-2-oleoyl-sn-glycerol",
                "1-monostearoylglycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-ethylhexyl sulfate",
                "2-lauroylglycerol",
                "20:0-18:1-PS",
                "20:0-18:2-PS",
                "20:0-18:3-PS",
                "Nonidet P-40",
                "PC O-20:4",
                "PG(35:3)",
                "Phosphatidylethanolamine lyso alkenyl 18",
                "SDZ 35-682",
                "Triton X-100",
                "alkylglycerol",
                "benzalkonium chloride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "decyltrimethylammonium bromide",
                "dodecylbenzenesulfonic acid",
                "dodecyldimethylamine N-oxide",
                "dodecyltrimethylammonium bromide",
                "lauramidopropyl betaine",
                "monoacylglycerol 20:2",
                "monoacylglycerol 20:4",
                "nonionic surfactant",
                "phosphatidylinositol 35:1",
                "phosphatidylinositol 40:6",
                "pluronic P-123",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "sodium octadecanoate"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Triton X-100",
            "Tween 20",
            "Cetrimonium bromide (CTAB)",
            "Sodium laureth sulfate (SLES)",
            "Cocamidopropyl betaine",
            "Polysorbate 80",
            "Octyl glucoside",
            "Lauryl glucoside",
            "Sodium lauryl sarcosinate",
            "Alkyl polyglucoside",
            "Sodium lauroyl sarcosinate",
            "Cocamide MEA",
            "Decyl glucoside",
            "Sodium cocoyl isethionate",
            "Ammonium lauryl sulfate",
            "Sodium stearate",
            "Lecithin",
            "Saponin",
            "Bile salts",
            "Pluronic F-127",
            "Span 80",
            "Benzalkonium chloride",
            "Dodecyltrimethylammonium bromide (DTAB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "Cocamidopropyl betaine",
                "Polysorbate 80",
                "Benzalkonium chloride",
                "Dodecyltrimethylammonium bromide (DTAB)"
            ],
            "mismatches": [
                "Sodium dodecyl sulfate (SDS)",
                "Tween 20",
                "Cetrimonium bromide (CTAB)",
                "Sodium laureth sulfate (SLES)",
                "Octyl glucoside",
                "Lauryl glucoside",
                "Sodium lauryl sarcosinate",
                "Alkyl polyglucoside",
                "Sodium lauroyl sarcosinate",
                "Cocamide MEA",
                "Decyl glucoside",
                "Sodium cocoyl isethionate",
                "Ammonium lauryl sulfate",
                "Sodium stearate",
                "Lecithin",
                "Saponin",
                "Bile salts",
                "Pluronic F-127",
                "Span 80"
            ],
            "true_referents": [
                "(2R)-3-(Octadecyloxy)-2-(pentadecanoyloxy)propyl tetracosanoate",
                "1,2-dioleoyl-3-lauroyl-sn-glycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-Octylglycerol",
                "1-alkylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2-(perfluorohexyl)ethyl dimorpholinophosphinate",
                "2-(perfluorooctyl)ethyl dimorpholinophosphinate",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-lauroylglycerol",
                "4-dodecylbenzenesulfonic acid",
                "Capsoside A",
                "PG(18:0/20:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "Triton X-100",
                "alkylglycerol",
                "benzalkonium chloride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "decyltrimethylammonium bromide",
                "digitonin",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerolipid",
                "lauramidopropyl betaine",
                "nonionic surfactant",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "pluronic P-123",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "triethanolamine",
                "triglyceride"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Cetrimonium bromide (CTAB)",
            "Benzalkonium chloride (BAC)",
            "Sodium laureth sulfate (SLES)",
            "Cocamidopropyl betaine (CAPB)",
            "Polysorbate 20 (Tween 20)",
            "Polysorbate 80 (Tween 80)",
            "Sodium stearate",
            "Sodium laurate",
            "Decyl glucoside",
            "Lauryl glucoside",
            "Octyl sulfosuccinate",
            "Lecithin",
            "Saponin",
            "Bile salts",
            "Sodium cholate",
            "Sodium deoxycholate",
            "Dimethyldodecylamine oxide (DDAO)",
            "Hexadecyltrimethylammonium bromide (CTAB)",
            "Polyoxyethylene (10) oleyl ether (Brij 97)",
            "Polyoxyethylene (20) cetyl ether (Brij 58)",
            "Polyoxyethylene (20) stearyl ether (Brij 78)",
            "Polyoxyethylene (100) stearyl ether (Brij 700)",
            "Polyethylene glycol tert-octylphenyl ether (Triton X-100)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium dodecyl sulfate (SDS)",
                "Benzalkonium chloride (BAC)",
                "Cocamidopropyl betaine (CAPB)",
                "Polysorbate 20 (Tween 20)",
                "Polysorbate 80 (Tween 80)",
                "Polyethylene glycol tert-octylphenyl ether (Triton X-100)"
            ],
            "mismatches": [
                "Cetrimonium bromide (CTAB)",
                "Sodium laureth sulfate (SLES)",
                "Sodium stearate",
                "Sodium laurate",
                "Decyl glucoside",
                "Lauryl glucoside",
                "Octyl sulfosuccinate",
                "Lecithin",
                "Saponin",
                "Bile salts",
                "Sodium cholate",
                "Sodium deoxycholate",
                "Dimethyldodecylamine oxide (DDAO)",
                "Hexadecyltrimethylammonium bromide (CTAB)",
                "Polyoxyethylene (10) oleyl ether (Brij 97)",
                "Polyoxyethylene (20) cetyl ether (Brij 58)",
                "Polyoxyethylene (20) stearyl ether (Brij 78)",
                "Polyoxyethylene (100) stearyl ether (Brij 700)"
            ],
            "true_referents": [
                "1,2,3-Tris(1-ethoxyethoxy)propane",
                "1,2-ditetradecanoyl-3-(6-sulfoquinovopyranosyl)glycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-lauroylglycerol",
                "4-dodecylbenzenesulfonic acid",
                "Capsoside A",
                "Diglyceryl monooleate",
                "Triton X-100",
                "benzalkonium chloride",
                "cetyltrimethylammonium bromide",
                "choline alfoscerate",
                "cocamidopropyl betaine",
                "digitonin",
                "dodecylbenzenesulfonic acid",
                "dodecyldimethylamine N-oxide",
                "dodecyltrimethylammonium bromide",
                "glycerol ether",
                "glycerol phenylbutyrate",
                "glycerolipid",
                "lauramidopropyl betaine",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "oleyl oleate",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate",
                "triethanolamine",
                "triglyceride"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Soap (C16H35NaO2)",
            "Detergent",
            "Surfactant",
            "Emulsifier",
            "Wetting agent",
            "Foaming agent",
            "Sodium lauryl sulfate (SLS)",
            "Sodium dodecyl sulfate (SDS)",
            "Ammonium lauryl sulfate",
            "Alkyl benzene sulfonate",
            "Cocamidopropyl betaine",
            "Sodium stearate",
            "Lecithin",
            "Saponin",
            "Bile salt",
            "Polysorbate 20 (Tween 20)",
            "Polysorbate 80 (Tween 80)",
            "Span 20",
            "Span 80",
            "Triton X-100",
            "Sodium cholate",
            "Sodium deoxycholate",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Aerosol OT"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Detergent",
                "Cocamidopropyl betaine",
                "Polysorbate 20 (Tween 20)",
                "Polysorbate 80 (Tween 80)",
                "Triton X-100",
                "Sodium dodecyl sulfate (SDS)",
                "Cetyltrimethylammonium bromide (CTAB)"
            ],
            "mismatches": [
                "Soap (C16H35NaO2)",
                "Surfactant",
                "Emulsifier",
                "Wetting agent",
                "Foaming agent",
                "Sodium lauryl sulfate (SLS)",
                "Ammonium lauryl sulfate",
                "Alkyl benzene sulfonate",
                "Sodium stearate",
                "Lecithin",
                "Saponin",
                "Bile salt",
                "Span 20",
                "Span 80",
                "Sodium cholate",
                "Sodium deoxycholate",
                "Aerosol OT"
            ],
            "true_referents": [
                "(2R)-2-(Palmitoyloxy)-3-(phosphonooxy)propyl stearate",
                "(2S)-3-Hydroxy-2-(octanoyloxy)propyl decanoate",
                "1-stearoyl-3-oleoylglycerol",
                "20:2-18:3-PS",
                "3-dodecylbenzenesulfonic acid",
                "4-dodecylbenzenesulfonic acid",
                "AOPE",
                "Capsoside A",
                "OA-PS",
                "PG(18:0/20:3)",
                "PG(20:4/20:4)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "Triton X-100",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "choline alfoscerate",
                "cocamidopropyl betaine",
                "detergent",
                "digitonin",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerolipid",
                "lauramidopropyl betaine",
                "nonionic surfactant",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate",
                "surfactin",
                "surfactin A",
                "tristearoylglycerol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Soap (SOAP)",
            "Detergent (DET)",
            "Surfactant (SURF)",
            "Wetting agent (WET)",
            "Emulsifier (EMU)",
            "Dispersant (DIS)",
            "Foaming agent (FOA)",
            "Penetrant (PEN)",
            "Solubilizer (SOL)",
            "Degreaser (DEG)",
            "Shampoo (SHA)",
            "Dishwashing liquid (DIS)",
            "Laundry detergent (LAU)",
            "Household cleaner (HOU)",
            "Industrial cleaner (IND)",
            "Cosmetic ingredient (COS)",
            "Pharmaceutical excipient (PHA)",
            "Agricultural adjuvant (AGR)",
            "Firefighting foam (FIR)",
            "Oil spill dispersant (OIL)",
            "Textile processing aid (TEX)",
            "Concrete admixture (CON)",
            "Paints and coatings additive (PAI)",
            "Printing ink additive (INK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "detergent"
            ],
            "mismatches": [
                "Soap (SOAP)",
                "Surfactant (SURF)",
                "Wetting agent (WET)",
                "Emulsifier (EMU)",
                "Dispersant (DIS)",
                "Foaming agent (FOA)",
                "Penetrant (PEN)",
                "Solubilizer (SOL)",
                "Degreaser (DEG)",
                "Shampoo (SHA)",
                "Dishwashing liquid (DIS)",
                "Laundry detergent (LAU)",
                "Household cleaner (HOU)",
                "Industrial cleaner (IND)",
                "Cosmetic ingredient (COS)",
                "Pharmaceutical excipient (PHA)",
                "Agricultural adjuvant (AGR)",
                "Firefighting foam (FIR)",
                "Oil spill dispersant (OIL)",
                "Textile processing aid (TEX)",
                "Concrete admixture (CON)",
                "Paints and coatings additive (PAI)",
                "Printing ink additive (INK)"
            ],
            "true_referents": [
                "DG(37:2)",
                "OHOHA-PC",
                "OKODA-PS",
                "PHOOA-PE",
                "PIP(16:1(9Z)/TXB2)",
                "PIP(TXB2/22:2(13Z,16Z))",
                "PS-PA",
                "Triton X-100",
                "acyl-GPI",
                "amphiphile",
                "benzalkonium chloride",
                "cocamidopropyl betaine",
                "detergent",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerol phenylbutyrate",
                "nonionic surfactant",
                "oleyl acetate",
                "perfluorobutanesulfonic acid",
                "perfluorohexyloctane",
                "perfluorononanoic acid",
                "perfluorooctanoic acid",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "quaternium-52",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A",
                "triethanolamine"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Surfactant (Surfactant)",
            "Detergent (Detergent)",
            "Soap (Soap)",
            "Shampoo (Shampoo)",
            "Toothpaste (Toothpaste)",
            "Milk (Milk)",
            "Blood plasma (Blood plasma)",
            "Lipid (Lipid)",
            "Phospholipid (Phospholipid)",
            "Cholesterol (Cholesterol)",
            "Bile acid (Bile acid)",
            "Emulsifier (Emulsifier)",
            "Tween (Tween)",
            "Brij (Brij)",
            "Span (Span)",
            "Tween 20 (Tween 20)",
            "Brij 35 (Brij 35)",
            "Span 80 (Span 80)",
            "Polysorbate 20 (Polysorbate 20)",
            "Polysorbate 80 (Polysorbate 80)",
            "Sodium lauryl sulfate (SLS)",
            "Sodium laureth sulfate (SLES)",
            "Cetrimonium bromide (Cetrimonium bromide)",
            "Cetylpyridinium chloride (Cetylpyridinium chloride)",
            "Docusate sodium (Docusate sodium)",
            "Sorbitan monolaurate (Sorbitan monolaurate)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Polysorbate 20",
                "Polysorbate 80",
                "Cetylpyridinium chloride"
            ],
            "mismatches": [
                "Surfactant",
                "Detergent",
                "Soap",
                "Shampoo",
                "Toothpaste",
                "Milk",
                "Blood plasma",
                "Lipid",
                "Phospholipid",
                "Cholesterol",
                "Bile acid",
                "Emulsifier",
                "Tween",
                "Brij",
                "Span",
                "Tween 20",
                "Brij 35",
                "Span 80",
                "Sodium lauryl sulfate",
                "Sodium laureth sulfate",
                "Cetrimonium bromide",
                "Docusate sodium",
                "Sorbitan monolaurate"
            ],
            "true_referents": [
                "1-linolenoyl-3-oleoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "4-dodecylbenzenesulfonic acid",
                "MG(0:0/15:0/0:0)",
                "PA(A-21:0/I-22:0)",
                "PA(A-25:0/I-17:0)",
                "PG(14:0/20:0)",
                "PG(17:0/18:0)",
                "PG(18:0/20:3)",
                "PG(35:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "SDZ 35-682",
                "amphiphile",
                "cetylpyridinium bromide",
                "cetylpyridinium chloride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "detergent",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glyceride",
                "glycerol",
                "glycerolipid",
                "lysophosphatidylcholine(0:0/20:5)",
                "nonionic surfactant",
                "phosphatidylcholine",
                "phosphatidylcholine (18:0/22:5)",
                "phosphatidylcholine (18:1/22:5)",
                "phosphatidylcholine (P-16:0/18:3)",
                "phosphatidylglycerol",
                "phosphatidylinositol 35:1",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A",
                "triglyceride"
            ],
            "TP": 3,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Soap (S)",
            "Detergent (D)",
            "Sodium dodecyl sulfate (SDS)",
            "Cetylpyridinium chloride (CPC)",
            "Triton X-100 (TX-100)",
            "Brij 35 (B35)",
            "Tween 20 (T20)",
            "Tween 80 (T80)",
            "Glycerol (G)",
            "Bile salts (BS)",
            "Lecithin (L)",
            "Saponin (Sap)",
            "Cholic acid (CA)",
            "Deoxycholic acid (DCA)",
            "Chenodeoxycholic acid (CDCA)",
            "Ursodeoxycholic acid (UDCA)",
            "Cycloheximide (CHX)",
            "Digitonin (Dgt)",
            "Tyloxapol (Tlxp)",
            "Heptylphyside (Hp)",
            "Octoxynol (Oxynol)",
            "Polysorbate 20 (P20)",
            "Polysorbate 80 (P80)",
            "Sodium lauryl sulfate (SLS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Detergent",
                "Sodium dodecyl sulfate",
                "Cetylpyridinium chloride",
                "Triton X-100",
                "Glycerol",
                "Digitonin",
                "Tyloxapol",
                "Polysorbate 20",
                "Polysorbate 80"
            ],
            "mismatches": [
                "Soap (S)",
                "Brij 35 (B35)",
                "Tween 20 (T20)",
                "Tween 80 (T80)",
                "Bile salts (BS)",
                "Lecithin (L)",
                "Saponin (Sap)",
                "Cholic acid (CA)",
                "Deoxycholic acid (DCA)",
                "Chenodeoxycholic acid (CDCA)",
                "Ursodeoxycholic acid (UDCA)",
                "Cycloheximide (CHX)",
                "Heptylphyside (Hp)",
                "Octoxynol (Oxynol)",
                "Sodium lauryl sulfate (SLS)"
            ],
            "true_referents": [
                "(9Z)-octadecen-1-ol",
                "1,2-Dioleoyl-3-stearoyl-rac-glycerol",
                "1-heneicosanoyl-glycero-3-phosphate",
                "1-octanoyl-2-oleoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "18:0-t16:1-PG",
                "CDP-DG(a-21:0/18:1(12Z)-2OH(9,10))",
                "Capsoside A",
                "GMGT-0",
                "Glycerol triundecanoate",
                "L-alpha-Phosphatidylcholine",
                "PG(14:0/20:0)",
                "PG(16:0/19:0)",
                "PG(18:0/20:3)",
                "SDZ 35-682",
                "TG(15:0/20:0/o-18:0)",
                "Triton X-100",
                "batilol",
                "cetylpyridinium bromide",
                "cetylpyridinium chloride",
                "cetyltrimethylammonium chloride",
                "detergent",
                "digalactosyldiacylglycerol 34:0",
                "digitonin",
                "dioleoyl phosphatidic acid",
                "dioleoylglycerol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glucosylglycerol",
                "glyceride",
                "glycerol",
                "lysophosphatidylcholine",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "phosphatidylcholine 44:1-2OH",
                "phosphatidylcholine 44:2-2OH",
                "phosphatidylinositol 35:1",
                "phosphatidylinositol 35:2",
                "polysorbate 20",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecyl sulfate",
                "surfactin A",
                "surfactin D",
                "triethanolamine",
                "tyloxapol"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]