[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Lung Surfactant (LS)",
            "Detergent Surfactant",
            "Foam Surfactant",
            "Emulsifier Surfactant",
            "Surface Active Agent",
            "Wetting Agent",
            "Sodium Lauryl Sulfate (SLS)",
            "Cetyl Alcohol",
            "Polysorbate 80 (TWEEN 80)",
            "Lecithin",
            "Pluronic F-68",
            "Tween 20",
            "Brij 35",
            "Span 80",
            "Sodium Dodecyl Sulfate (SDS)",
            "Triton X-100",
            "Ethanol",
            "Glycerol Monostearate",
            "Soybean Oil",
            "Poloxamer 188",
            "Tween 80",
            "Pluronic P-123",
            "Sodium Cholate",
            "Brij 58"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "Pluronic P-123",
                "Sodium Dodecyl Sulfate (SDS)",
                "Polysorbate 80 (TWEEN 80)"
            ],
            "mismatches": [
                "Lung Surfactant (LS)",
                "Detergent Surfactant",
                "Foam Surfactant",
                "Emulsifier Surfactant",
                "Surface Active Agent",
                "Wetting Agent",
                "Sodium Lauryl Sulfate (SLS)",
                "Cetyl Alcohol",
                "Lecithin",
                "Pluronic F-68",
                "Tween 20",
                "Brij 35",
                "Span 80",
                "Ethanol",
                "Glycerol Monostearate",
                "Soybean Oil",
                "Poloxamer 188",
                "Tween 80",
                "Sodium Cholate",
                "Brij 58"
            ],
            "true_referents": [
                "1-linolenoyl-3-oleoylglycerol",
                "1-monostearoylglycerol",
                "2-(perfluorohexyl)ethyl dimorpholinophosphinate",
                "2-(perfluorooctyl)ethyl dimorpholinophosphinate",
                "PG(18:0/20:3)",
                "PG(35:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PG-PI",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "SDZ 35-682",
                "TG(59:1)",
                "TG(59:8)",
                "Triton X-100",
                "alkylglycerol",
                "choline alfoscerate",
                "detergent",
                "dodecylbenzenesulfonic acid",
                "glyceride",
                "glycerol",
                "glycerolipid",
                "nonionic surfactant",
                "oleyl acetate",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol 35:1",
                "pluronic P-123",
                "polidocanol",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "tristearoylglycerol"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Pulmonary surfactant (PS)",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Surfactant protein A (SP-A)",
            "Surfactant protein B (SP-B)",
            "Surfactant protein C (SP-C)",
            "Surfactant protein D (SP-D)",
            "Surfactant protein E (SP-E)",
            "Bovine lung surfactant extract (BLSE)",
            "Curosurf (Beractant)",
            "Infasurf (Calfactant)",
            "Survanta (Poractant alfa)",
            "Alveofact (Beractant)",
            "Surfaxin (Lipoid acid protein complex)",
            "Liposomal surfactant",
            "Synthetic surfactant",
            "Surfactant replacement therapy",
            "Surfactant-associated protein (SAP)",
            "Surfactant metabolism",
            "Surfactant synthesis",
            "Surfactant dysfunction",
            "Reticular basement membrane (RBM) surfactant",
            "Surfactant-associated protein C (SP-C)",
            "Surfactant-associated protein D (SP-D)",
            "Surfactant-associated protein E (SP-E)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Pulmonary surfactant (PS)",
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Surfactant protein A (SP-A)",
                "Surfactant protein B (SP-B)",
                "Surfactant protein C (SP-C)",
                "Surfactant protein D (SP-D)",
                "Surfactant protein E (SP-E)",
                "Bovine lung surfactant extract (BLSE)",
                "Curosurf (Beractant)",
                "Infasurf (Calfactant)",
                "Survanta (Poractant alfa)",
                "Alveofact (Beractant)",
                "Surfaxin (Lipoid acid protein complex)",
                "Liposomal surfactant",
                "Synthetic surfactant",
                "Surfactant replacement therapy",
                "Surfactant-associated protein (SAP)",
                "Surfactant metabolism",
                "Surfactant synthesis",
                "Surfactant dysfunction",
                "Reticular basement membrane (RBM) surfactant",
                "Surfactant-associated protein C (SP-C)",
                "Surfactant-associated protein D (SP-D)",
                "Surfactant-associated protein E (SP-E)"
            ],
            "true_referents": [
                "POV-PA",
                "PS-PA",
                "Triton X-100",
                "detergent",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "enantio-PAF C-16",
                "nonionic surfactant",
                "phosphatidylcholine",
                "pluronic P-123",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "surfactin C",
                "surfactin D",
                "tricaproin"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Soap (Sodium stearate)",
            "Detergent (Sodium dodecyl sulfate)",
            "Lipid bilayers",
            "Phospholipids",
            "Bile salts",
            "Polysorbate 80",
            "Span 80",
            "Tween 20",
            "Cetyltrimethylammonium bromide",
            "Sodium lauryl ether sulfate",
            "Glyceryl monostearate",
            "Sorbitan monolaurate",
            "Polyethylene glycol",
            "Lecithin",
            "Sucrose monolaurate",
            "Polyoxyethylene sorbitan monooleate",
            "Docusate sodium",
            "Octoxynol 9",
            "Sodium cholate",
            "Sodium deoxycholate",
            "Sodium taurocholate",
            "Lauromacrogol",
            "Polyoxyethylene 20 sorbitan monolaurate",
            "Nonoxynol 9"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Detergent (Sodium dodecyl sulfate)",
                "Polysorbate 80",
                "Cetyltrimethylammonium bromide"
            ],
            "mismatches": [
                "Soap (Sodium stearate)",
                "Lipid bilayers",
                "Phospholipids",
                "Bile salts",
                "Span 80",
                "Tween 20",
                "Sodium lauryl ether sulfate",
                "Glyceryl monostearate",
                "Sorbitan monolaurate",
                "Polyethylene glycol",
                "Lecithin",
                "Sucrose monolaurate",
                "Polyoxyethylene sorbitan monooleate",
                "Docusate sodium",
                "Octoxynol 9",
                "Sodium cholate",
                "Sodium deoxycholate",
                "Sodium taurocholate",
                "Lauromacrogol",
                "Polyoxyethylene 20 sorbitan monolaurate",
                "Nonoxynol 9"
            ],
            "true_referents": [
                "(9Z)-octadecen-1-ol",
                "1,3-dihydroxypropan-2-yl nonadec-9-enoate",
                "1-lauroyl-2-oleoylglycerol",
                "1-lauroyl-3-oleoylglycerol",
                "1-monolauroylglycerol",
                "1-monostearoylglycerol",
                "1-octanoyl-2-oleoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "4-octylphenol",
                "PG(18:0/20:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "choline alfoscerate",
                "detergent",
                "diphosphatidyl propylene glycol",
                "glycerol",
                "glycerolipid",
                "monoacyl-3-O-(beta-D-galactosyl)-sn-glycerol",
                "monoacylglycerol",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "phosphatidylcholine",
                "phosphatidylcholine 32:0",
                "phosphatidylglycerol",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate",
                "triglyceride"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Pulmonary Surfactant (PS)",
            "Docusate Sodium (DSS)",
            "Sodium Lauryl Sulfate (SLS)",
            "Polyoxyethylene Sorbitan Monolaurate (Tween 20)",
            "Bile Acids (BA)",
            "Alveolar Surfactant Protein A (SP-A)",
            "Alveolar Surfactant Protein C (SP-C)",
            "Alveolar Surfactant Protein D (SP-D)",
            "Phosphatidylglycerol (PG)",
            "Sphingomyelin (SM)",
            "Cationic Surfactants (CS)",
            "Anionic Surfactants (AS)",
            "Nonionic Surfactants (NS)",
            "Zwitterionic Surfactants (ZS)",
            "Fluorosurfactants (FS)",
            "Silicone Surfactants (SS)",
            "Sophorolipids (SL)",
            "Rhamnolipids (RL)",
            "Mannosylerythritol Ceterate (MEC)",
            "Polysorbate 80 (P80)",
            "Cetylpyridinium Chloride (CPC)",
            "Sodium Caproate (SC)",
            "Decyl Glucoside (DG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cetylpyridinium Chloride (CPC)",
                "Phosphatidylglycerol (PG)",
                "Polysorbate 80 (P80)",
                "Nonionic Surfactants (NS)"
            ],
            "mismatches": [
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Pulmonary Surfactant (PS)",
                "Docusate Sodium (DSS)",
                "Sodium Lauryl Sulfate (SLS)",
                "Polyoxyethylene Sorbitan Monolaurate (Tween 20)",
                "Bile Acids (BA)",
                "Alveolar Surfactant Protein A (SP-A)",
                "Alveolar Surfactant Protein C (SP-C)",
                "Alveolar Surfactant Protein D (SP-D)",
                "Sphingomyelin (SM)",
                "Cationic Surfactants (CS)",
                "Anionic Surfactants (AS)",
                "Zwitterionic Surfactants (ZS)",
                "Fluorosurfactants (FS)",
                "Silicone Surfactants (SS)",
                "Sophorolipids (SL)",
                "Rhamnolipids (RL)",
                "Mannosylerythritol Ceterate (MEC)",
                "Sodium Caproate (SC)",
                "Decyl Glucoside (DG)"
            ],
            "true_referents": [
                "1-O-(D-glucosyl)glycerol",
                "1-Palmitoyl-2-(5-keto-6-octendioyl)-sn-glycero-3-phosphatidylcholine",
                "1-monomyristoylglycerol",
                "2,3-Diacetoxypropyl stearate",
                "2-decanoylglycerol",
                "3-dodecylbenzenesulfonic acid",
                "4-dodecylbenzenesulfonic acid",
                "L-alpha-Phosphatidylcholine",
                "L-alpha-phosphatidylglycerol",
                "L-rhamnosyl-3-hydroxydecanoyl-3-hydroxydecanoic acid",
                "N-retinylidene-N-retinylphosphatidylethanolamine",
                "PS-PA",
                "cardiolipin (20:2/16:1/18:1/18:3)",
                "cardiolipin 34:2_34:2",
                "cetylpyridinium bromide",
                "cetylpyridinium chloride",
                "cetyltrimethylammonium chloride",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "glycerol mono(keto-meromycolate)",
                "nonionic surfactant",
                "perfluorobutanesulfonic acid",
                "perfluorononanoic acid",
                "perfluorooctanoic acid",
                "phosphatidyl-N-methylethanolamine",
                "phosphatidylcholine",
                "phosphatidylcholine (22:4/22:6)",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "phosphatidylserine amidated glycine zwitterion",
                "polysorbate 20",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "surfactin C",
                "surfactin D"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Triton X-100",
            "Tween 20",
            "Tween 80",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Cocamidopropyl betaine",
            "Sodium lauryl sulfate (SLS)",
            "Octylphenol ethoxylate",
            "Lauryl glucoside",
            "Decyl glucoside",
            "Polysorbate 60",
            "Polysorbate 40",
            "N-alkyl dimethyl benzyl ammonium chloride",
            "Sodium stearate",
            "Sodium oleate",
            "Sodium palmitate",
            "Sodium myristate",
            "Sodium laurate",
            "Cholesterol",
            "Lecithin",
            "Glyceryl monostearate",
            "Sorbitan monostearate",
            "Sorbitan tristearate",
            "Span 80"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "Polysorbate 60",
                "Polysorbate 40",
                "Cetyltrimethylammonium bromide",
                "Cocamidopropyl betaine"
            ],
            "mismatches": [
                "Sodium dodecyl sulfate (SDS)",
                "Tween 20",
                "Tween 80",
                "Sodium lauryl sulfate (SLS)",
                "Octylphenol ethoxylate",
                "Lauryl glucoside",
                "Decyl glucoside",
                "N-alkyl dimethyl benzyl ammonium chloride",
                "Sodium stearate",
                "Sodium oleate",
                "Sodium palmitate",
                "Sodium myristate",
                "Sodium laurate",
                "Cholesterol",
                "Lecithin",
                "Glyceryl monostearate",
                "Sorbitan monostearate",
                "Sorbitan tristearate",
                "Span 80"
            ],
            "true_referents": [
                "1,2-Distearoyl-sn-glycero-3-phosphate (sodium salt)",
                "1,3-distearoyl-2-palmitoylglycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-monostearoylglycerol",
                "1-myristoyl-2-oleoylglycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-ethylhexyl sulfate",
                "2-lauroylglycerol",
                "4-octylphenol",
                "PG(18:0/20:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "Triton X-100",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "decyltrimethylammonium bromide",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glyceride",
                "glycerolipid",
                "lauramidopropyl betaine",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "oleyl oleate",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "triglyceride",
                "tristearoylglycerol"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Lecithin (PC)",
            "Sodium dodecyl sulfate (SDS)",
            "Triton X-100 (TX-100)",
            "Polysorbate 20 (Tween 20)",
            "Polysorbate 80 (Tween 80)",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Sorbitan monolaurate (Span 20)",
            "Sodium lauryl sulfate (SLS)",
            "Bile salts (e.g., sodium taurocholate)",
            "Dodecylbenzenesulfonic acid (DBSA)",
            "Octylphenol ethoxylate (OPE)",
            "Cocamidopropyl betaine (CAPB)",
            "Polyvinyl alcohol (PVA)",
            "Silicone surfactants (e.g., polydimethylsiloxane)",
            "Fluorinated surfactants (e.g., perfluorooctanoic acid)",
            "Amphiphilic peptides (e.g., surfactin)",
            "Sodium oleate (SO)",
            "Alkyl polyglucosides (APG)",
            "Dodecyltrimethylammonium chloride (DTAC)",
            "Glyceryl monostearate (GMS)",
            "Ethylene oxide-propylene oxide block copolymers (Pluronic)",
            "Sodium stearoyl lactylate (SSL)",
            "Polyethylene glycol (PEG) derivatives",
            "Sodium caseinate (SC)",
            "Cholesterol (CH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "polysorbate 20",
                "polysorbate 80",
                "cetyltrimethylammonium bromide",
                "dodecylbenzenesulfonic acid",
                "cocamidopropyl betaine",
                "perfluorooctanoic acid",
                "surfactin"
            ],
            "mismatches": [
                "Lecithin (PC)",
                "Sodium dodecyl sulfate (SDS)",
                "Sorbitan monolaurate (Span 20)",
                "Sodium lauryl sulfate (SLS)",
                "Bile salts (e.g., sodium taurocholate)",
                "Octylphenol ethoxylate (OPE)",
                "Polyvinyl alcohol (PVA)",
                "Silicone surfactants (e.g., polydimethylsiloxane)",
                "Amphiphilic peptides (e.g., surfactin)",
                "Sodium oleate (SO)",
                "Alkyl polyglucosides (APG)",
                "Dodecyltrimethylammonium chloride (DTAC)",
                "Glyceryl monostearate (GMS)",
                "Ethylene oxide-propylene oxide block copolymers (Pluronic)",
                "Sodium stearoyl lactylate (SSL)",
                "Polyethylene glycol (PEG) derivatives",
                "Sodium caseinate (SC)",
                "Cholesterol (CH)"
            ],
            "true_referents": [
                "1,2-distearoyl-3-alpha-D-galactosyl-sn-glycerol",
                "1-monostearoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2-ethylhexyl sulfate",
                "3-dodecylbenzenesulfonic acid",
                "4-dodecylbenzenesulfonic acid",
                "4-octylphenol",
                "D-alanyl-L-alanyl poly(glycerol phosphate)",
                "Triton X-100",
                "alpha-D-glucuronosyl diglyceride",
                "amphiphile",
                "beta-D-galactopyranosyl diglyceride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "decyltrimethylammonium bromide",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerol phenylbutyrate",
                "glycosylglycerol derivative",
                "lauramidopropyl betaine",
                "medium-chain 1,2-diacyl-3-beta-D-galactosyl-sn-glycerol",
                "monoacylglycerol 20:2",
                "monoacylglycerol 20:4",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "oleyl oleate",
                "perfluorobutanesulfonic acid",
                "perfluorononanoic acid",
                "perfluorooctanoic acid",
                "phosphatidylcholine",
                "phosphatidylcholine (18:0/22:4)",
                "phosphatidylcholine (P-18:0/22:6)",
                "pluronic P-123",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "surfactin",
                "surfactin A",
                "triethanolamine"
            ],
            "TP": 8,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Pulmonary Surfactant (PS)",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Sodium Dodecyl Sulfate (SDS)",
            "Cetyl Trimethylammonium Bromide (CTAB)",
            "Polyoxyethylene Sorbitan Monolaurate (Tween 20)",
            "Bile Salt (BS)",
            "Phosphatidylglycerol (PG)",
            "Lecithin",
            "Sorbitan Monostearate (Span 60)",
            "Polyoxyethylene Sorbitan Monostearate (Tween 60)",
            "Lung Surfactant Protein B (SP-B)",
            "Lung Surfactant Protein C (SP-C)",
            "Lung Surfactant Protein A (SP-A)",
            "Lung Surfactant Protein D (SP-D)",
            "Perfluorocarbon-based Surfactant (PFC)",
            "Poloxamer 188 (P188)",
            "Sodium Lauryl Ether Sulfate (SLES)",
            "Sodium Lauroyl Sarcosinate (SLSa)",
            "Decyl Glucoside",
            "Cocamidopropyl Betaine (CAPB)",
            "Sodium Cocoyl Isethionate (SCI)",
            "Sodium Lauroyl Methyl Isethionate (SLMI)",
            "Glycolipid Biosurfactant",
            "Rhamnolipid Biosurfactant"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium Dodecyl Sulfate (SDS)",
                "Cetyl Trimethylammonium Bromide (CTAB)",
                "Phosphatidylglycerol (PG)",
                "Cocamidopropyl Betaine (CAPB)"
            ],
            "mismatches": [
                "Pulmonary Surfactant (PS)",
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Polyoxyethylene Sorbitan Monolaurate (Tween 20)",
                "Bile Salt (BS)",
                "Lecithin",
                "Sorbitan Monostearate (Span 60)",
                "Polyoxyethylene Sorbitan Monostearate (Tween 60)",
                "Lung Surfactant Protein B (SP-B)",
                "Lung Surfactant Protein C (SP-C)",
                "Lung Surfactant Protein A (SP-A)",
                "Lung Surfactant Protein D (SP-D)",
                "Perfluorocarbon-based Surfactant (PFC)",
                "Poloxamer 188 (P188)",
                "Sodium Lauryl Ether Sulfate (SLES)",
                "Sodium Lauroyl Sarcosinate (SLSa)",
                "Decyl Glucoside",
                "Sodium Cocoyl Isethionate (SCI)",
                "Sodium Lauroyl Methyl Isethionate (SLMI)",
                "Glycolipid Biosurfactant",
                "Rhamnolipid Biosurfactant"
            ],
            "true_referents": [
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-monostearoylglycerol",
                "1-palmityl-2-acetyl-3-lauroyl-sn-glycerol",
                "1-stearoyl-3-oleoylglycerol",
                "2,3-Diacetoxypropyl stearate",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-ethylhexyl sulfate",
                "Glycolipid G3",
                "Glycolipid G4",
                "L-alpha-phosphatidylglycerol",
                "L-rhamnosyl-3-hydroxydecanoyl-3-hydroxydecanoic acid",
                "LPE O-18:2",
                "PS-PA",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "digalactosylglycerol derivative",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "glycerol phenylbutyrate",
                "glycerolipid",
                "lauramidopropyl betaine",
                "lauryl sulfobetaine",
                "nonionic surfactant",
                "perfluorohexyloctane",
                "perfluorononanoic acid",
                "perfluorooctanoic acid",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "pluronic P-123",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "surfactin C",
                "surfactin D"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Pulmonary surfactant (PS)",
            "Artificial lung surfactant",
            "Alveolar surfactant",
            "Surfactant protein A (SP-A)",
            "Surfactant protein B (SP-B)",
            "Surfactant protein C (SP-C)",
            "Surfactant protein D (SP-D)",
            "Natural lung surfactant",
            "Exogenous surfactant",
            "Endogenous surfactant",
            "Surfactant replacement therapy",
            "Surfactant deficiency",
            "Lung compliance",
            "Surface tension",
            "Pulmonary function",
            "Respiratory distress syndrome (RDS)",
            "Neonatal respiratory distress syndrome (NRDS)",
            "Bronchopulmonary dysplasia (BPD)",
            "Lung development",
            "Alveolar stability",
            "Lung surfactant production",
            "Lung surfactant secretion",
            "Pulmonary alveoli",
            "Alveolar collapse"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Pulmonary surfactant (PS)",
                "Artificial lung surfactant",
                "Alveolar surfactant",
                "Surfactant protein A (SP-A)",
                "Surfactant protein B (SP-B)",
                "Surfactant protein C (SP-C)",
                "Surfactant protein D (SP-D)",
                "Natural lung surfactant",
                "Exogenous surfactant",
                "Endogenous surfactant",
                "Surfactant replacement therapy",
                "Surfactant deficiency",
                "Lung compliance",
                "Surface tension",
                "Pulmonary function",
                "Respiratory distress syndrome (RDS)",
                "Neonatal respiratory distress syndrome (NRDS)",
                "Bronchopulmonary dysplasia (BPD)",
                "Lung development",
                "Alveolar stability",
                "Lung surfactant production",
                "Lung surfactant secretion",
                "Pulmonary alveoli",
                "Alveolar collapse"
            ],
            "true_referents": [
                "(R)-edelfosine",
                "LPC(24:5)",
                "Lyso-PAF C-16-d4",
                "LysoPC P-18:0/0:0",
                "PA-PG",
                "PA-PS",
                "PAP",
                "PE-NMe2(16:0/15:0)",
                "PE-NMe2(18:0/15:0)",
                "PG(20:4/20:4)",
                "PG(P-20:0/22:0)",
                "PIP(18:0/PGF1alpha)",
                "PIP(22:2(13Z,16Z)/PGF1alpha)",
                "PIP(PGF1alpha/18:0)",
                "PS-PA",
                "Triton X-100",
                "amphiphile",
                "cardiolipin 34:2_34:2",
                "diradylglycerol",
                "lysophosphatidylcholine 24:1",
                "nonionic surfactant",
                "phosphatidylcholine",
                "phosphatidylcholine (18:0/22:4)",
                "phosphatidylmethanol 34:1",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "surfactin C",
                "surfactin D",
                "texas red DHPE(1-)"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Triton X-100",
            "Polysorbate 80",
            "Tween 20",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Lecithin",
            "Sodium laureth sulfate (SLES)",
            "Span 80",
            "Lauryl glucoside",
            "Ammonium lauryl sulfate",
            "Brij 35",
            "Nonidet P-40",
            "Pluronic F68",
            "Dodecyl \u03b2-D-maltoside",
            "Ceteareth-20",
            "Decyl glucoside",
            "Polyoxyethylene sorbitan monolaurate",
            "N-Octyl-\u03b2-D-glucopyranoside",
            "Sorbitan monostearate",
            "CHAPS (3-[(3-Cholamidopropyl) dimethylammonio]-1-propanesulfonate)",
            "Caprylic acid",
            "Stearic acid",
            "Cetyl alcohol",
            "Hexadecyltrimethylammonium bromide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "Nonidet P-40",
                "cetyltrimethylammonium bromide",
                "dodecyl beta-D-maltoside",
                "sodium dodecyl sulfate"
            ],
            "mismatches": [
                "Sodium dodecyl sulfate (SDS)",
                "Polysorbate 80",
                "Tween 20",
                "Cetyltrimethylammonium bromide (CTAB)",
                "Lecithin",
                "Sodium laureth sulfate (SLES)",
                "Span 80",
                "Lauryl glucoside",
                "Ammonium lauryl sulfate",
                "Brij 35",
                "Pluronic F68",
                "Ceteareth-20",
                "Decyl glucoside",
                "Polyoxyethylene sorbitan monolaurate",
                "N-Octyl-\u03b2-D-glucopyranoside",
                "Sorbitan monostearate",
                "CHAPS (3-[(3-Cholamidopropyl) dimethylammonio]-1-propanesulfonate)",
                "Caprylic acid",
                "Stearic acid",
                "Cetyl alcohol",
                "Hexadecyltrimethylammonium bromide"
            ],
            "true_referents": [
                "1,2-diacyl-sn-glycero-3-phosphosulfocholine",
                "1-(18-mercaptooctadecanoyl)-sn-glycerol 3-phosphate",
                "1-O-(2-O-alpha-D-galactopyranosyl-alpha-D-glucopyranosyl)-glycerol",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-capryloyl-3-oleoylglycerol",
                "1-monostearoylglycerol",
                "1-stearoyl-3-oleoylglycerol",
                "1-tetradecanoyl-2-hexadecanoyl-sn-glycero-3-phosphosulfocholine",
                "11-(perfluorohexyl)undecyl dimorpholinophosphinate",
                "2-(perfluorohexyl)ethyl dimorpholinophosphinate",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-lauroylglycerol",
                "4-dodecylbenzenesulfonic acid",
                "Nonidet P-40",
                "PG(18:0/20:3)",
                "PG(35:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "SDZ 35-682",
                "Triton X-100",
                "alkylglycerol",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "dodecyl beta-D-maltoside",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerol",
                "glycerolipid",
                "mono-beta-D-galactosyl diacylglycerol",
                "monoacylglycerol 20:2",
                "monoacylglycerol 20:5",
                "nonionic surfactant",
                "oleyl acetate",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylinositol 35:1",
                "phosphatidylinositol 40:6",
                "pluronic P-123",
                "polyoxyl 40 stearate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "tristearoylglycerol"
            ],
            "TP": 5,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Polysorbate 20 (Tween 20)",
            "Polysorbate 80 (Tween 80)",
            "Cetrimonium bromide (CTAB)",
            "Triton X-100",
            "Cocamidopropyl betaine",
            "Sodium laureth sulfate (SLES)",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Benzalkonium chloride",
            "Lecithin",
            "Sodium stearate",
            "Octoxynol-9",
            "Ammonium lauryl sulfate",
            "Sodium lauroyl sarcosinate",
            "Cocamide MEA",
            "Span 80",
            "Sodium lauryl sulfoacetate",
            "Lauryl glucoside",
            "Decyl glucoside",
            "Coco glucoside",
            "Alkyl polyglucoside",
            "Sodium cocoyl isethionate",
            "Disodium cocoamphodiacetate",
            "Sodium cocoamphoacetate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium dodecyl sulfate (SDS)",
                "Polysorbate 20 (Tween 20)",
                "Polysorbate 80 (Tween 80)",
                "Triton X-100",
                "Cocamidopropyl betaine",
                "Benzalkonium chloride"
            ],
            "mismatches": [
                "Cetrimonium bromide (CTAB)",
                "Sodium laureth sulfate (SLES)",
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Lecithin",
                "Sodium stearate",
                "Octoxynol-9",
                "Ammonium lauryl sulfate",
                "Sodium lauroyl sarcosinate",
                "Cocamide MEA",
                "Span 80",
                "Sodium lauryl sulfoacetate",
                "Lauryl glucoside",
                "Decyl glucoside",
                "Coco glucoside",
                "Alkyl polyglucoside",
                "Sodium cocoyl isethionate",
                "Disodium cocoamphodiacetate",
                "Sodium cocoamphoacetate"
            ],
            "true_referents": [
                "(2R)-2,3-Dihydroxypropyl nonadecanoate",
                "(9Z)-1-O-octadec-9-enyl glycerol",
                "(9Z)-octadecen-1-ol",
                "1,2-dioleoyl-3-lauroyl-sn-glycerol",
                "1-(D-glucopyranosyloxy)-3-hydroxypropan-2-yl D-galactopyranoside",
                "1-O-(D-glucosyl)glycerol",
                "1-O-(beta-D-glucosyl)glycerol",
                "1-alkylglycerol",
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "2-lauroylglycerol",
                "4-dodecylbenzenesulfonic acid",
                "4-octylphenol",
                "Glycerol 1-propanoate diacetate",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "Triton X-100",
                "alkylglycerol",
                "benzalkonium chloride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "detergent",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerolipid",
                "lauramidopropyl betaine",
                "nonionic surfactant",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "triethanolamine"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Sodium dodecyl sulfate (SDS)",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Triton X-100",
            "Tween 20",
            "Tween 80",
            "Cocamidopropyl betaine (CAPB)",
            "Sodium lauryl ether sulfate (SLES)",
            "Sodium lauroyl sarcosinate",
            "Dioctyl sodium sulfosuccinate (DSS)",
            "Benzalkonium chloride (BAC)",
            "Polysorbate 20",
            "Polysorbate 60",
            "Polysorbate 80",
            "Lecithin",
            "Pulmonary surfactant",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Sphingomyelin",
            "Phosphatidylglycerol",
            "Surfactin",
            "Rhamnolipids",
            "Sophorolipids",
            "Linear alkylbenzene sulfonates (LAS)",
            "Alcohol ethoxylates (AE)",
            "Alkyl polyglucoside (APG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium dodecyl sulfate (SDS)",
                "Cetyltrimethylammonium bromide (CTAB)",
                "Triton X-100",
                "Cocamidopropyl betaine (CAPB)",
                "Benzalkonium chloride (BAC)",
                "Polysorbate 20",
                "Polysorbate 60",
                "Polysorbate 80",
                "Phosphatidylglycerol",
                "Surfactin"
            ],
            "mismatches": [
                "Tween 20",
                "Tween 80",
                "Sodium lauryl ether sulfate (SLES)",
                "Sodium lauroyl sarcosinate",
                "Dioctyl sodium sulfosuccinate (DSS)",
                "Lecithin",
                "Pulmonary surfactant",
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Sphingomyelin",
                "Rhamnolipids",
                "Sophorolipids",
                "Linear alkylbenzene sulfonates (LAS)",
                "Alcohol ethoxylates (AE)",
                "Alkyl polyglucoside (APG)"
            ],
            "true_referents": [
                "1,2,3-Tris(1-ethoxyethoxy)propane",
                "1,2-dioleoyl-3-lauroyl-sn-glycerol",
                "2-ethylhexyl sulfate",
                "3-dodecylbenzenesulfonic acid",
                "PG(18:0/20:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "Triton X-100",
                "alpha-D-glucuronosyl diglyceride",
                "benzalkonium chloride",
                "beta-D-galactopyranosyl diglyceride",
                "cardiolipin",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerol phenylbutyrate",
                "glycerolipid",
                "lauramidopropyl betaine",
                "lauryl sulfobetaine",
                "nonionic surfactant",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium tetradecyl sulfate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "triethanolamine"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Lecithin (PC)",
            "Phosphatidylglycerol (PG)",
            "Phosphatidylinositol (PI)",
            "Phosphatidylserine (PS)",
            "Phosphatidylethanolamine (PE)",
            "Sphingomyelin (SM)",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Poractant alfa (Curosurf)",
            "Beractant (Survanta)",
            "Calfactant (Infasurf)",
            "Lucinactant (Surfaxin)",
            "Sinapultide (Venticute)",
            "Sodium dodecyl sulfate (SDS)",
            "Cetrimonium bromide (CTAB)",
            "Tween 20 (Polysorbate 20)",
            "Tween 80 (Polysorbate 80)",
            "Triton X-100",
            "Span 20 (Sorbitan monolaurate)",
            "Span 80 (Sorbitan monooleate)",
            "Sodium cholate",
            "Sodium deoxycholate",
            "Pluronic F-68",
            "Aerosol-OT (Dioctyl sodium sulfosuccinate)",
            "Perfluorooctanoic acid (PFOA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "Sodium dodecyl sulfate",
                "cetyltrimethylammonium bromide",
                "polysorbate 20",
                "polysorbate 80",
                "perfluorooctanoic acid"
            ],
            "mismatches": [
                "Lecithin (PC)",
                "Phosphatidylglycerol (PG)",
                "Phosphatidylinositol (PI)",
                "Phosphatidylserine (PS)",
                "Phosphatidylethanolamine (PE)",
                "Sphingomyelin (SM)",
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Poractant alfa (Curosurf)",
                "Beractant (Survanta)",
                "Calfactant (Infasurf)",
                "Lucinactant (Surfaxin)",
                "Sinapultide (Venticute)",
                "Span 20 (Sorbitan monolaurate)",
                "Span 80 (Sorbitan monooleate)",
                "Sodium cholate",
                "Sodium deoxycholate",
                "Pluronic F-68",
                "Aerosol-OT (Dioctyl sodium sulfosuccinate)"
            ],
            "true_referents": [
                "(S)-edelfosine",
                "1-Palmitoyl-2-(5-keto-6-octendioyl)-sn-glycero-3-phosphatidylcholine",
                "2-(perfluorohexyl)ethyl dimorpholinophosphinate",
                "2-(perfluorooctyl)ethyl dimorpholinophosphinate",
                "2-butyloctyl hydrogen sulfate",
                "L-alpha-phosphatidylglycerol",
                "POV-PA",
                "Triton X-100",
                "cetyltrimethylammonium bromide",
                "choline alfoscerate",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glycerophosphatidylethanolamine",
                "laureth-5",
                "levobupivacaine",
                "monoacylglycerol 20:2",
                "monoacylglycerol 20:4",
                "nonionic surfactant",
                "perfluorohexyloctane",
                "perfluorononanoic acid",
                "perfluorooctanoic acid",
                "phosphatidyl-N-methylethanolamine",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylglycerol",
                "phosphatidylglycerol phosphate",
                "phosphatidylinositol",
                "phosphatidylinositol monophosphate",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phosphatidylserine (18:1/22:6)",
                "pluronic P-123",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium 2-butyloctyl sulfate",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "sodium tetradecyl sulfate",
                "surfactin",
                "surfactin A",
                "surfactin C"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Phosphatidylcholine (PC)",
            "Phosphatidylethanolamine (PE)",
            "Phosphatidylserine (PS)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin (SM)",
            "Dipalmitoylphosphatidylcholine (DPPC)",
            "Poractant alfa",
            "Beractant",
            "Calfactant",
            "Lucinactant",
            "Pulmonary surfactant protein A (SP-A)",
            "Pulmonary surfactant protein B (SP-B)",
            "Pulmonary surfactant protein C (SP-C)",
            "Pulmonary surfactant protein D (SP-D)",
            "Sodium dodecyl sulfate (SDS)",
            "Cetyltrimethylammonium bromide (CTAB)",
            "Polysorbate 20 (Tween 20)",
            "Polysorbate 80 (Tween 80)",
            "Triton X-100",
            "Saponin",
            "Digitonin",
            "Sodium lauryl sulfate (SLS)",
            "Cocamidopropyl betaine",
            "Laureth-9"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Phosphatidylcholine (PC)",
                "Phosphatidylethanolamine (PE)",
                "Sodium dodecyl sulfate (SDS)",
                "Cetyltrimethylammonium bromide (CTAB)",
                "Polysorbate 20 (Tween 20)",
                "Polysorbate 80 (Tween 80)",
                "Triton X-100",
                "Digitonin",
                "Cocamidopropyl betaine"
            ],
            "mismatches": [
                "Phosphatidylserine (PS)",
                "Phosphatidylinositol (PI)",
                "Sphingomyelin (SM)",
                "Dipalmitoylphosphatidylcholine (DPPC)",
                "Poractant alfa",
                "Beractant",
                "Calfactant",
                "Lucinactant",
                "Pulmonary surfactant protein A (SP-A)",
                "Pulmonary surfactant protein B (SP-B)",
                "Pulmonary surfactant protein C (SP-C)",
                "Pulmonary surfactant protein D (SP-D)",
                "Saponin",
                "Sodium lauryl sulfate (SLS)",
                "Laureth-9"
            ],
            "true_referents": [
                "1-Palmitoyl-2-(5-keto-6-octendioyl)-sn-glycero-3-phosphatidylcholine",
                "Capsoside A",
                "L-alpha-Phosphatidylcholine",
                "L-alpha-phosphatidylglycerol",
                "LBPA(16:1(9Z)/18:1(9Z))",
                "LPC 8:0",
                "Triton X-100",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "cocamidopropyl betaine",
                "detergent",
                "digitonin",
                "dipalmitoyl phosphatidylglycerol",
                "diphosphatidyl propylene glycol",
                "dipropionin",
                "dodecylbenzenesulfonic acid",
                "glycerophosphatidylethanolamine",
                "lauramidopropyl betaine",
                "laureth-5",
                "nonionic surfactant",
                "phosphatidyl-N-methylethanolamine",
                "phosphatidylcholine",
                "phosphatidylcholine (P-18:0/22:6)",
                "phosphatidylethanolamine",
                "phosphatidylethanolamine (P-18:0/20:4)",
                "phosphatidylinositol",
                "phosphatidylinositol monophosphate",
                "phosphatidylinositol phosphate",
                "phosphatidylserine (18:0/22:6)",
                "phosphatidylserine (18:1/22:6)",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 60",
                "polysorbate 80",
                "sodium dodecyl sulfate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "surfactin C",
                "surfactin D",
                "trilaurin"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "Surfactant protein A (SP-A) in lung surfactant (1)",
            "Bile salts as surfactants in the gut (2)",
            "Detergents as synthetic surfactants in biochemistry (3)",
            "Phospholipids as natural surfactants in cell membranes (4)",
            "Ceramides as surfactants in skin and hair (5)",
            "Sodium lauryl sulfate (SLS) as a surfactant in personal care products (6)",
            "Triton X-100 as a non-ionic surfactant in molecular biology (7)",
            "Brij 35 as a non-ionic surfactant in protein purification (8)",
            "Tween 80 as a non-ionic surfactant in food processing (9)",
            "Cetrimide as a cationic surfactant in antiseptic creams (10)",
            "Quaternary ammonium compounds as cationic surfactants in disinfectants (11)",
            "Alkyl sulfates as anionic surfactants in laundry detergents (12)",
            "Sodium dodecyl sulfate (SDS) as an anionic surfactant in protein denaturation (13)",
            "Coco-glucoside as a natural surfactant in cosmetics (14)",
            "Decyl glucoside as a natural surfactant in personal care products (15)",
            "Gluconate as a surfactant in pharmaceutical formulations (16)",
            "Poloxamer as a non-ionic surfactant in ophthalmic solutions (17)",
            "Cremophor EL as a non-ionic surfactant in injectable formulations (18)",
            "Sorbitan esters as non-ionic surfactants in food emulsions (19)",
            "Polyoxyethylene as a non-ionic surfactant in cleaning products (20)",
            "Glycols as surfactants in pharmaceutical formulations (21)",
            "Cyclodextrins as surfactants in pharmaceutical formulations (22)",
            "Surfactin as a natural surfactant produced by Bacillus subtilis (23)",
            "Rhamnolipid as a natural surfactant produced by Pseudomonas aeruginosa (24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Triton X-100",
                "sodium dodecyl sulfate",
                "surfactin"
            ],
            "mismatches": [
                "Surfactant protein A (SP-A) in lung surfactant (1)",
                "Bile salts as surfactants in the gut (2)",
                "Detergents as synthetic surfactants in biochemistry (3)",
                "Phospholipids as natural surfactants in cell membranes (4)",
                "Ceramides as surfactants in skin and hair (5)",
                "Sodium lauryl sulfate (SLS) as a surfactant in personal care products (6)",
                "Brij 35 as a non-ionic surfactant in protein purification (8)",
                "Tween 80 as a non-ionic surfactant in food processing (9)",
                "Cetrimide as a cationic surfactant in antiseptic creams (10)",
                "Quaternary ammonium compounds as cationic surfactants in disinfectants (11)",
                "Alkyl sulfates as anionic surfactants in laundry detergents (12)",
                "Coco-glucoside as a natural surfactant in cosmetics (14)",
                "Decyl glucoside as a natural surfactant in personal care products (15)",
                "Gluconate as a surfactant in pharmaceutical formulations (16)",
                "Poloxamer as a non-ionic surfactant in ophthalmic solutions (17)",
                "Cremophor EL as a non-ionic surfactant in injectable formulations (18)",
                "Sorbitan esters as non-ionic surfactants in food emulsions (19)",
                "Polyoxyethylene as a non-ionic surfactant in cleaning products (20)",
                "Glycols as surfactants in pharmaceutical formulations (21)",
                "Cyclodextrins as surfactants in pharmaceutical formulations (22)",
                "Rhamnolipid as a natural surfactant produced by Pseudomonas aeruginosa (24)"
            ],
            "true_referents": [
                "2-O-(alpha-D-glucopyranosyl)glycerol",
                "4-dodecylbenzenesulfonic acid",
                "Glycerol 1-propanoate diacetate",
                "Triton X-100",
                "amphiphile",
                "benzalkonium chloride",
                "cetyltrimethylammonium bromide",
                "cetyltrimethylammonium chloride",
                "decyltrimethylammonium bromide",
                "detergent",
                "diphosphatidyl propylene glycol",
                "dodecyl beta-D-maltoside",
                "dodecylbenzenesulfonic acid",
                "dodecyltrimethylammonium bromide",
                "glyceride",
                "glycerol",
                "glycosylglycerol derivative",
                "mannosyl diphosphorylinositol ceramide",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "phosphatidylcholine 32:4",
                "phosphatidylcholine 35:4",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "surfactin",
                "surfactin A",
                "surfactin B",
                "surfactin C",
                "surfactin D"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": [
            "soap (CMC)",
            "detergent",
            "Triton X-100",
            "Sodium lauryl sulfate (SLS)",
            "Cetylpyridinium chloride (CPC)",
            "Polysorbate 80 (Tween 80)",
            "Span 80",
            "Tween 20",
            "Glycerol ester",
            "Lecithin",
            "Tyloxapol",
            "Pluronic F-68",
            "Cremophor EL",
            "Sodium cholate",
            "Cholic acid",
            "Bile salts",
            "Digitonin",
            "Octoxynol-9",
            "Nonoxynol-9",
            "Cholesterol",
            "Amphipathic peptides",
            "Lipids",
            "Phospholipids",
            "Emulsan"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "detergent",
                "Triton X-100",
                "Cetylpyridinium chloride (CPC)",
                "Polysorbate 80 (Tween 80)",
                "Tyloxapol",
                "Digitonin"
            ],
            "mismatches": [
                "soap (CMC)",
                "Sodium lauryl sulfate (SLS)",
                "Span 80",
                "Tween 20",
                "Glycerol ester",
                "Lecithin",
                "Pluronic F-68",
                "Cremophor EL",
                "Sodium cholate",
                "Cholic acid",
                "Bile salts",
                "Octoxynol-9",
                "Nonoxynol-9",
                "Cholesterol",
                "Amphipathic peptides",
                "Lipids",
                "Phospholipids",
                "Emulsan"
            ],
            "true_referents": [
                "(9Z)-1-O-octadec-9-enyl glycerol",
                "(9Z)-octadecen-1-ol",
                "(R)-edelfosine",
                "1,3-dihydroxypropan-2-yl nonadec-9-enoate",
                "1-stearoyl-3-oleoylglycerol",
                "2-(perfluorohexyl)ethyl dimorpholinophosphinate",
                "2-(perfluorooctyl)ethyl dimorpholinophosphinate",
                "4-octylphenol",
                "L-alpha-Phosphatidylcholine",
                "LPE O-16:1",
                "LPE O-18:2",
                "PG(18:0/20:3)",
                "PG(P-16:0/18:0)",
                "PG(P-18:0/19:0)",
                "PS(18:0/20:0)",
                "PS(18:2_20:0)",
                "Triton X-100",
                "amphiphile",
                "batilol",
                "benzalkonium chloride",
                "cetylpyridinium bromide",
                "cetylpyridinium chloride",
                "cetyltrimethylammonium chloride",
                "choline alfoscerate",
                "detergent",
                "digitonin",
                "dipropionin",
                "dodecylbenzenesulfonic acid",
                "glyceride",
                "glycerol",
                "glycerol phosphate",
                "glycerolipid",
                "nonionic surfactant",
                "nonyl phenoxypolyethoxylethanol",
                "phosphatidic acid",
                "phosphatidylcholine",
                "phosphatidylglycerol",
                "pluronic P-123",
                "polysorbate 20",
                "polysorbate 40",
                "polysorbate 80",
                "sodium dodecanoate",
                "sodium dodecyl sulfate",
                "sodium octadecanoate",
                "surfactin C",
                "tergitol",
                "triglyceride",
                "tyloxapol"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "surfactant",
        "domain": "chemistry",
        "response": "Sorry - this model is unable to respond to this request.",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]