[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1n-9)",
            "Linoleic acid (C18:2n-6)",
            "Linolenic acid (C18:3n-3)",
            "Arachidic acid (C20:0)",
            "Eicosanoic acid (C20:1n-9)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Erucic acid (C22:1n-9)",
            "Docosanoic acid (C22:0)",
            "Docosenoic acid (C24:1n-9)",
            "Tetracosanoic acid (C24:0)",
            "Hexacosanoic acid (C26:0)",
            "Octacosanoic acid (C28:0)",
            "Tricosanoic acid (C23:0)",
            "Pentacosanoic acid (C25:0)",
            "Heptacosanoic acid (C27:0)",
            "Nonacosanoic acid (C29:0)",
            "Heneicosanoic acid (C21:0)",
            "Tricosanoic acid (C23:0)",
            "Pentacosanoic acid (C25:0)",
            "Docosapentaenoic acid (C22:5n-3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "docosanoic acid",
                "docosenoic acid",
                "erucic acid",
                "linoleic acid",
                "linolenic acid",
                "nonacosanoic acid",
                "oleic acid",
                "stearic acid(d3)"
            ],
            "mismatches": [
                "palmitic acid (C16:0)",
                "arachidic acid (C20:0)",
                "eicosanoic acid (C20:1n-9)",
                "behenic acid (C22:0)",
                "lignoceric acid (C24:0)",
                "tetracosanoic acid (C24:0)",
                "hexacosanoic acid (C26:0)",
                "octacosanoic acid (C28:0)",
                "tricosanoic acid (C23:0)",
                "pentacosanoic acid (C25:0)",
                "heptacosanoic acid (C27:0)",
                "heneicosanoic acid (C21:0)",
                "docosapentaenoic acid (C22:5n-3)"
            ],
            "true_referents": [
                "(10E)-octadecenoic acid",
                "(20R)-20-hydroxyhenicosanoic acid",
                "(2E)-2-heptadecenoic acid",
                "(3E)-3-hexadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(3S)-3-hydroxydocosanoyl-CoA",
                "(6Z,9Z,12Z,15Z,18Z,21Z)-tetracosahexaenoic acid",
                "(9E)-tetradecenoic acid",
                "(9E,11E)-octadecadienoic acid",
                "10-nonadecenoic acid",
                "2-hexadecynoic acid",
                "2-hydroxybehenic acid",
                "2-nonadecenoic acid",
                "2-oxo-heneicosanoic acid",
                "2-oxo-pentadecanoic acid",
                "3-hydroxydocosanoic acid",
                "3-methyl-heneicosanoic acid",
                "3-oxo-heneicosanoic acid",
                "3-oxo-tridecanoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "6,9-Hexadecadienoic acid",
                "7-heptadecenoic acid",
                "7-heptadecynoic acid",
                "7-hexadecynoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "9-Eicosenoic acid",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "all-cis-docosa-4,7,10,13,16,19-hexaenoic acid",
                "arachidonic acid",
                "docosadienoic acid",
                "docosahexaenoic acid",
                "docosanoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "docosenoic acid",
                "erucic acid",
                "ethyl (11Z)-docosenoate",
                "ethyl arachidate",
                "linoleic acid",
                "linolenic acid",
                "nonacosanoic acid",
                "octadecanoic acid",
                "octadecenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "pentadecanoic acid",
                "pentadecenoic acid",
                "tetracosahexaenoic acid"
            ],
            "TP": 8,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1, n-9)",
            "Linoleic acid (C18:2, n-6)",
            "Alpha-linolenic acid (C18:3, n-3)",
            "Arachidonic acid (C20:4, n-6)",
            "Eicosapentaenoic acid (EPA, C20:5, n-3)",
            "Docosahexaenoic acid (DHA, C22:6, n-3)",
            "Myristic acid (C14:0)",
            "Palmitoleic acid (C16:1, n-7)",
            "Gadoleic acid (C20:1, n-9)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Erucic acid (C22:1, n-9)",
            "Lauric acid (C12:0)",
            "Capric acid (C10:0)",
            "Caprylic acid (C8:0)",
            "Vaccenic acid (C18:1, t11)",
            "Nervonic acid (C24:1, n-9)",
            "Heneicosanoic acid (C21:0)",
            "Tricosanoic acid (C23:0)",
            "Tetracosanoic acid (C24:0)",
            "Docosanoic acid (C22:0)",
            "Tetracosanoic acid (C24:0)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "alpha-linolenic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "gadoleic acid",
                "palmitoleic acid",
                "vaccenic acid",
                "docosanoic acid"
            ],
            "mismatches": [
                "Palmitic acid (C16:0)",
                "Stearic acid (C18:0)",
                "Oleic acid (C18:1, n-9)",
                "Linoleic acid (C18:2, n-6)",
                "Eicosapentaenoic acid (EPA, C20:5, n-3)",
                "Myristic acid (C14:0)",
                "Behenic acid (C22:0)",
                "Lignoceric acid (C24:0)",
                "Lauric acid (C12:0)",
                "Capric acid (C10:0)",
                "Caprylic acid (C8:0)",
                "Nervonic acid (C24:1, n-9)",
                "Heneicosanoic acid (C21:0)",
                "Tricosanoic acid (C23:0)",
                "Tetracosanoic acid (C24:0)"
            ],
            "true_referents": [
                "(10E)-octadecenoic acid",
                "(2E)-2-heptadecenoic acid",
                "(3E)-3-hexadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(3S)-3-hydroxydocosanoyl-CoA",
                "(6Z,9Z,12Z,15Z,18Z,21Z)-tetracosahexaenoic acid",
                "(7Z,10Z)-hexadecadienoic acid",
                "(9E)-tetradecenoic acid",
                "(9E,11E)-octadecadienoic acid",
                "(E)-hexadec-2-enoic acid",
                "(E)-octadeca-15-en-9,11,13-triynoic acid",
                "1-alpha-linolenoylglycerol",
                "2,6-dimethyl-hexadecanoic acid",
                "2-hydroxybehenic acid",
                "2-oxo-heneicosanoic acid",
                "3-hydroxydocosanoic acid",
                "3-methyl-heneicosanoic acid",
                "3-oxo-heneicosanoic acid",
                "3-oxo-tridecanoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "7-Palmitoleic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Glycerol 1-hexadecanoate",
                "Margaric acid(d3)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "all-cis-docosa-4,7,10,13,16,19-hexaenoic acid",
                "alpha-linolenic acid",
                "arachidonic acid",
                "cis-vaccenic acid",
                "docosadienoic acid",
                "docosahexaenoic acid",
                "docosanoic acid",
                "docosatrienoic acid",
                "eicosa-5,8,11,14,17-pentaenoic acid",
                "epoxydocosapentaenoic acid",
                "erucic acid",
                "ethyl arachidonate",
                "gadoleic acid",
                "hexadecanoic acid",
                "linoleic acid",
                "linolenic acid",
                "myristic acid-13C3",
                "myristoleic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "tetracosahexaenoic acid",
                "trans-vaccenic acid",
                "vaccenic acid"
            ],
            "TP": 7,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Arachidic acid (C20:0)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Cerotic acid (C26:0)",
            "Montanic acid (C28:0)",
            "Melissic acid (C30:0)",
            "Palmitoleic acid (C16:1)",
            "Oleic acid (C18:1)",
            "Gadoleic acid (C20:1)",
            "Erucic acid (C22:1)",
            "Nervonic acid (C24:1)",
            "Linoleic acid (C18:2)",
            "Linolenic acid (C18:3)",
            "Arachidonic acid (C20:4)",
            "Eicosapentaenoic acid (EPA, C20:5)",
            "Docosahexaenoic acid (DHA, C22:6)",
            "Erucic acid (C22:1)",
            "Docosatetraenoic acid (C22:4)",
            "Docosapentaenoic acid (C22:5)",
            "Tetracosapentaenoic acid (C24:5)",
            "Tetracosahexaenoic acid (C24:6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitoleic acid",
                "Oleic acid",
                "Gadoleic acid",
                "Erucic acid",
                "Linoleic acid",
                "Linolenic acid",
                "Arachidonic acid",
                "Docosahexaenoic acid",
                "Docosatetraenoic acid",
                "Docosapentaenoic acid",
                "Tetracosahexaenoic acid"
            ],
            "mismatches": [
                "Palmitic acid (C16:0)",
                "Stearic acid (C18:0)",
                "Arachidic acid (C20:0)",
                "Behenic acid (C22:0)",
                "Lignoceric acid (C24:0)",
                "Cerotic acid (C26:0)",
                "Montanic acid (C28:0)",
                "Melissic acid (C30:0)",
                "Nervonic acid (C24:1)",
                "Eicosapentaenoic acid (EPA, C20:5)",
                "Erucic acid (C22:1)",
                "Tetracosapentaenoic acid (C24:5)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(10E)-octadecenoic acid",
                "(17R)-hydroxydocosahexaenoic acid",
                "(2E,4E,6E,8E,10E)-octadecapentaenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(4E,7E,10E,13E)-Hexadeca-4,7,10,13-tetraenoic acid",
                "(6Z,9Z,12Z,15Z,18Z,21Z)-tetracosahexaenoic acid",
                "(E)-hexadec-2-enoic acid",
                "(R)-lamenallenic acid",
                "(S)-laballenic acid",
                "(S)-lamenallenic acid",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "2-hydroxybehenic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "5,7,9,11,13-tetradecapentaenoic acid",
                "7,10,13,16-docosatetraenoic acid",
                "7-Palmitoleic acid",
                "8,11,14-Octadecatriynoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Paleic acid",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "all-cis-docosa-7,10,13,16-tetraenoic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatetraenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "ethyl arachidate",
                "gadoleic acid",
                "linoleic acid",
                "linolenic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "tetracosahexaenoic acid"
            ],
            "TP": 11,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1)",
            "Linoleic acid (C18:2)",
            "Alpha-linolenic acid (ALA, C18:3)",
            "Palmitic acid (C16:0)",
            "Myristic acid (C14:0)",
            "Palmitoleic acid (C16:1)",
            "Arachidic acid (C20:0)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Docosahexaenoic acid (DHA, C22:6)",
            "Eicosapentaenoic acid (EPA, C20:5)",
            "Gamma-linolenic acid (GLA, C18:3)",
            "Arachidonic acid (AA, C20:4)",
            "Capric acid (C10:0)",
            "Lauric acid (C12:0)",
            "Caprylic acid (C8:0)",
            "Undecylenic acid (C11:1)",
            "Erucic acid (C22:1)",
            "Nervonic acid (C24:1)",
            "Petroselinic acid (C18:1)",
            "Gondoic acid (C20:1)",
            "Montanic acid (C24:0)",
            "Cetoleic acid (C22:1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "docosahexaenoic acid",
                "gamma-linolenic acid",
                "arachidonic acid",
                "erucic acid",
                "petroselinic acid",
                "cetoleic acid"
            ],
            "mismatches": [
                "stearic acid (C18:0)",
                "oleic acid (C18:1)",
                "linoleic acid (C18:2)",
                "alpha-linolenic acid (ALA, C18:3)",
                "palmitic acid (C16:0)",
                "myristic acid (C14:0)",
                "palmitoleic acid (C16:1)",
                "arachidic acid (C20:0)",
                "behenic acid (C22:0)",
                "lignoceric acid (C24:0)",
                "eicosapentaenoic acid (EPA, C20:5)",
                "capric acid (C10:0)",
                "lauric acid (C12:0)",
                "caprylic acid (C8:0)",
                "undecylenic acid (C11:1)",
                "nervonic acid (C24:1)",
                "gondoic acid (C20:1)",
                "montanic acid (C24:0)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(3E)-3-hexadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(7Z,10Z)-hexadecadienoic acid",
                "(E)-hexadec-2-enoic acid",
                "(R)-lamenallenic acid",
                "(S)-lamenallenic acid",
                "1-alpha-linolenoylglycerol",
                "1-erucoylglycerol",
                "11(E)-(3,4-dimethyl-5-(pent-1-en-1-yl)furan-2-yl)-undecanoic acid",
                "11-phenyl-7E-undecenoic acid",
                "2,6-dimethyl-hexadecanoic acid",
                "2-hydroxybehenic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "7-Palmitoleic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Avenoleic acid",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Mycolipanolic acid (C24)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-linolenic acid",
                "arachidonic acid",
                "cetoleic acid",
                "cholesteryl gamma-linolenate",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "ethyl arachidate",
                "gamma-linolenic acid",
                "gorlic acid",
                "hexadecanoic acid",
                "linoleic acid",
                "methyl arachidonate",
                "methyl gamma-linolenate",
                "myristic acid-13C3",
                "myristoleic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "petroselaidic acid",
                "petroselinamide",
                "petroselinic acid",
                "trans-gondoic acid"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Arachidic Acid (C20:0)",
            "Behenic Acid (C22:0)",
            "Lignoceric Acid (C24:0)",
            "Cerotic Acid (C26:0)",
            "Montanic Acid (C28:0)",
            "Melissic Acid (C30:0)",
            "Palmitic Acid (C16:0)",
            "Stearic Acid (C18:0)",
            "Oleic Acid (C18:1)",
            "Linoleic Acid (C18:2)",
            "Linolenic Acid (C18:3)",
            "Arachidonic Acid (C20:4)",
            "Eicosapentaenoic Acid (C20:5)",
            "Docosahexaenoic Acid (C22:6)",
            "Erucic Acid (C22:1)",
            "Nervonic Acid (C24:1)",
            "Lauric Acid (C12:0)",
            "Myristic Acid (C14:0)",
            "Pentadecanoic Acid (C15:0)",
            "Heptadecanoic Acid (C17:0)",
            "Tricosanoic Acid (C23:0)",
            "Pentacosanoic Acid (C25:0)",
            "Heptacosanoic Acid (C27:0)",
            "Nonacosanoic Acid (C29:0)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "palmitic acid",
                "stearic acid",
                "oleic acid",
                "linoleic acid",
                "linolenic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "erucic acid",
                "heptadecanoic acid",
                "nonacosanoic acid",
                "pentadecanoic acid"
            ],
            "mismatches": [
                "arachidic acid (C20:0)",
                "behenic acid (C22:0)",
                "lignoceric acid (C24:0)",
                "cerotic acid (C26:0)",
                "montanic acid (C28:0)",
                "melissic acid (C30:0)",
                "eicosapentaenoic acid (C20:5)",
                "nervonic acid (C24:1)",
                "lauric acid (C12:0)",
                "myristic acid (C14:0)",
                "tricosanoic acid (C23:0)",
                "pentacosanoic acid (C25:0)",
                "heptacosanoic acid (C27:0)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(3S)-3-hydroxydocosanoyl-CoA",
                "(9E)-pentadecenoic acid",
                "(E)-hexadec-2-enoic acid",
                "(R)-lamenallenic acid",
                "(S)-laballenic acid",
                "(S)-lamenallenic acid",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "10-nonadecenoic acid",
                "2,6-dimethyl-hexadecanoic acid",
                "2-hydroxybehenic acid",
                "2-nonadecenoic acid",
                "2-oxo-pentadecanoic acid",
                "3-hydroxydocosanoic acid",
                "3-oxo-tridecanoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "7-heptadecenoic acid",
                "7-heptadecynoic acid",
                "7-hexadecynoic acid",
                "7-methyl-hexadecanoic acid",
                "8,11,14-Octadecatriynoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Paleic acid",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "arachidonic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "ethyl arachidate",
                "heptadecanoic acid",
                "hexadecanoic acid",
                "linoleic acid",
                "linolenic acid",
                "myristic acid-13C3",
                "myristoleic acid",
                "nonacosanoic acid",
                "octadecanoic acid",
                "octadecatetraenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "pentadecanoic acid",
                "pentadecenoic acid"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Arachidic acid (C20:0)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Oleic acid (C18:1)",
            "Linoleic acid (C18:2)",
            "Alpha-linolenic acid (C18:3)",
            "Arachidonic acid (C20:4)",
            "Eicosapentaenoic acid (C20:5, EPA)",
            "Docosahexaenoic acid (C22:6, DHA)",
            "Myristic acid (C14:0)",
            "Capric acid (C10:0)",
            "Caprylic acid (C8:0)",
            "Palmitoleic acid (C16:1)",
            "Gadoleic acid (C20:1)",
            "Nervonic acid (C24:1)",
            "Pentacosanoic acid (C25:0)",
            "Hexacosanoic acid (C26:0)",
            "Heptacosanoic acid (C27:0)",
            "Nonacosanoic acid (C29:0)",
            "Triacontanoic acid (C30:0)",
            "Heneicosanoic acid (C21:0)",
            "Docosapentaenoic acid (C22:5, DPA)",
            "Tetracosanoic acid (C24:0)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitic acid",
                "Stearic acid",
                "Oleic acid",
                "Linoleic acid",
                "alpha-linolenic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "myristic acid",
                "palmitoleic acid",
                "gadoleic acid",
                "nonacosanoic acid",
                "docosapentaenoic acid"
            ],
            "mismatches": [
                "Arachidic acid (C20:0)",
                "Behenic acid (C22:0)",
                "Lignoceric acid (C24:0)",
                "Eicosapentaenoic acid (C20:5, EPA)",
                "Capric acid (C10:0)",
                "Caprylic acid (C8:0)",
                "Nervonic acid (C24:1)",
                "Pentacosanoic acid (C25:0)",
                "Hexacosanoic acid (C26:0)",
                "Heptacosanoic acid (C27:0)",
                "Triacontanoic acid (C30:0)",
                "Heneicosanoic acid (C21:0)",
                "Tetracosanoic acid (C24:0)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(10E)-octadecenoic acid",
                "(3E)-3-hexadecenoic acid",
                "(3E,5E)-tridecadienoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(7Z,10Z)-hexadecadienoic acid",
                "1-alpha-linolenoylglycerol",
                "1-arachidonoylglycerol",
                "10-nonadecenoic acid",
                "2-hexadecynoic acid",
                "2-hydroxybehenic acid",
                "2-nonadecenoic acid",
                "2-oxo-heneicosanoic acid",
                "2-oxo-pentadecanoic acid",
                "3-methyl-heneicosanoic acid",
                "3-octadecynoic acid",
                "3-oxo-heneicosanoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "6,9-Hexadecadienoic acid",
                "7-Palmitoleic acid",
                "7-heptadecenoic acid",
                "7-heptadecynoic acid",
                "7-hexadecynoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-linolenic acid",
                "arachidonic acid",
                "docosadienoic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "ethyl arachidate",
                "gadoleic acid",
                "linoleic acid",
                "myristic acid-13C3",
                "myristoleic acid",
                "nonacosanoic acid",
                "octadecanoic acid",
                "octadecatetraenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "pentadecanoic acid",
                "pentadecenoic acid",
                "tridecadienoic acid"
            ],
            "TP": 12,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Arachidic Acid (AA)",
            "Behenic Acid (BA)",
            "Lignoceric Acid (LA)",
            "Cerotic Acid (CA)",
            "Montanic Acid (MA)",
            "Melissic Acid (MeA)",
            "Myristic Acid (MyA)",
            "Palmitic Acid (PA)",
            "Stearic Acid (SA)",
            "Arachidonic Acid (AA)",
            "Eicosapentaenoic Acid (EPA)",
            "Docosahexaenoic Acid (DHA)",
            "Linoleic Acid (LA)",
            "Alpha-Linolenic Acid (ALA)",
            "Gamma-Linolenic Acid (GLA)",
            "Dihomo-Gamma-Linolenic Acid (DGLA)",
            "Oleic Acid (OA)",
            "Elaidic Acid (EA)",
            "Gondoic Acid (GA)",
            "Erucic Acid (ErA)",
            "Nervonic Acid (NA)",
            "Docosapentaenoic Acid (DPA)",
            "Docosatetraenoic Acid (DTA)",
            "Tetracosahexaenoic Acid (THA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Arachidonic Acid (AA)",
                "Docosahexaenoic Acid (DHA)",
                "Linoleic Acid (LA)",
                "Alpha-Linolenic Acid (ALA)",
                "Gamma-Linolenic Acid (GLA)",
                "Oleic Acid (OA)",
                "Elaidic Acid (EA)",
                "Erucic Acid (ErA)",
                "Docosapentaenoic Acid (DPA)",
                "Docosatetraenoic Acid (DTA)",
                "Tetracosahexaenoic Acid (THA)"
            ],
            "mismatches": [
                "Arachidic Acid (AA)",
                "Behenic Acid (BA)",
                "Lignoceric Acid (LA)",
                "Cerotic Acid (CA)",
                "Montanic Acid (MA)",
                "Melissic Acid (MeA)",
                "Myristic Acid (MyA)",
                "Palmitic Acid (PA)",
                "Stearic Acid (SA)",
                "Eicosapentaenoic Acid (EPA)",
                "Dihomo-Gamma-Linolenic Acid (DGLA)",
                "Gondoic Acid (GA)",
                "Nervonic Acid (NA)"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(S)-lamenallenic acid",
                "1-erucoylglycerol",
                "1-gamma-linolenoyl 2-acylglycerolipid",
                "12-oxo-octadecanoic acid",
                "2-hydroxybehenic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "5-DOXYL-stearic acid",
                "Anteisomyristic acid",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Dihomo-linoleate (20:2n6)",
                "Elaidolinolenic acid",
                "Himeic acid A",
                "Himeic acid B",
                "Lyngbic acid",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-licanic acid",
                "alpha-linolenic acid",
                "arachidonic acid",
                "arachidyl oleate",
                "beta-calendic acid",
                "docosadienoic acid",
                "docosahexaenoic acid",
                "docosanoic acid",
                "docosapentaenoic acid",
                "docosatetraenoic acid",
                "docosatrienoic acid",
                "elaidic acid",
                "erucic acid",
                "erucoyl-CoA",
                "gadelaidic acid",
                "gamma-linolenic acid",
                "gorlic acid",
                "hydroxydocosahexaenoic acid",
                "isomyristic acid",
                "linoleic acid",
                "linolenic acid",
                "methyl arachidonate",
                "myristoleic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "phytanic acid",
                "stearolic acid",
                "tetracosahexaenoic acid",
                "trans-12-elaidic acid",
                "trans-gondoic acid"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1)",
            "Linoleic acid (C18:2)",
            "Alpha-linolenic acid (C18:3)",
            "Arachidic acid (C20:0)",
            "Eicosapentaenoic acid (EPA)",
            "Docosahexaenoic acid (DHA)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Myristoleic acid (C14:1)",
            "Palmitoleic acid (C16:1)",
            "Margaric acid (C17:0)",
            "Eicosenoic acid (C20:1)",
            "Erucic acid (C22:1)",
            "Nervonic acid (C24:1)",
            "Lauric acid (C12:0)",
            "Myristic acid (C14:0)",
            "Arachidonic acid (C20:4)",
            "Dihomo-gamma-linolenic acid (C20:3)",
            "Gadoleic acid (C20:1)",
            "Heptadecanoic acid (C17:0)",
            "Tricosanoic acid (C23:0)",
            "Tetracosanoic acid (C24:0)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "myristoleic acid",
                "palmitoleic acid",
                "margaric acid",
                "erucic acid",
                "heptadecanoic acid",
                "gadoleic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "linoleic acid",
                "oleic acid",
                "stearic acid"
            ],
            "mismatches": [
                "palmitic acid (C16:0)",
                "alpha-linolenic acid (C18:3)",
                "arachidic acid (C20:0)",
                "eicosapentaenoic acid (EPA)",
                "behenic acid (C22:0)",
                "lignoceric acid (C24:0)",
                "nervonic acid (C24:1)",
                "lauric acid (C12:0)",
                "myristic acid (C14:0)",
                "dihomo-gamma-linolenic acid (C20:3)",
                "tricosanoic acid (C23:0)",
                "tetracosanoic acid (C24:0)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(10E)-octadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(3S)-3-hydroxydocosanoyl-CoA",
                "(6Z,9Z,12Z,15Z,18Z,21Z)-tetracosahexaenoic acid",
                "(E)-hexadec-2-enoic acid",
                "1-alpha-linolenoylglycerol",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "14(Z)-eicosenoic acid",
                "2,4-dimethyl-2-eicosenoic acid",
                "2,6-dimethyl-hexadecanoic acid",
                "2-hydroxybehenic acid",
                "3-hydroxydocosanoic acid",
                "3-oxo-tridecanoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "5E-eicosenoic acid",
                "7-Palmitoleic acid",
                "7-methyl-hexadecanoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Dihomo-linoleate (20:2n6)",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-linolenic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "ethyl arachidate",
                "gadoleic acid",
                "gamma-linolenic acid",
                "heptadecanoic acid",
                "hexadecanoic acid",
                "linoleic acid",
                "methyl gamma-linolenate",
                "myristic acid-13C3",
                "myristoleic acid",
                "myristyl palmitate",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "tetracosahexaenoic acid"
            ],
            "TP": 11,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Lauric acid (C12:0)",
            "Myristic acid (C14:0)",
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Arachidic acid (C20:0)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Oleic acid (C18:1)",
            "Palmitoleic acid (C16:1)",
            "Elaidic acid (C18:1 trans)",
            "Linoleic acid (C18:2)",
            "Alpha-Linolenic acid (ALA, C18:3)",
            "Eicosapentaenoic acid (EPA, C20:5)",
            "Docosahexaenoic acid (DHA, C22:6)",
            "Erucic acid (C22:1)",
            "Gadoleic acid (C20:1)",
            "Mead acid (C20:3)",
            "Nervonic acid (C24:1)",
            "Sapienic acid (C16:1\u03946)",
            "Vaccenic acid (C18:1\u039411)",
            "Gondoic acid (C20:1\u03949)",
            "Petroselinic acid (C18:1\u03947)",
            "Cerotic acid (C26:0)",
            "Eicosenoic acid (C20:1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitic acid (C16:0)",
                "Stearic acid (C18:0)",
                "Oleic acid (C18:1)",
                "Palmitoleic acid (C16:1)",
                "Elaidic acid (C18:1 trans)",
                "Linoleic acid (C18:2)",
                "Alpha-Linolenic acid (ALA, C18:3)",
                "Docosahexaenoic acid (DHA, C22:6)",
                "Erucic acid (C22:1)",
                "Gadoleic acid (C20:1)",
                "Sapienic acid (C16:1\u03946)",
                "Vaccenic acid (C18:1\u039411)",
                "Petroselinic acid (C18:1\u03947)"
            ],
            "mismatches": [
                "Lauric acid (C12:0)",
                "Myristic acid (C14:0)",
                "Arachidic acid (C20:0)",
                "Behenic acid (C22:0)",
                "Lignoceric acid (C24:0)",
                "Eicosapentaenoic acid (EPA, C20:5)",
                "Mead acid (C20:3)",
                "Nervonic acid (C24:1)",
                "Gondoic acid (C20:1\u03949)",
                "Cerotic acid (C26:0)",
                "Eicosenoic acid (C20:1)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(10E)-octadecenoic acid",
                "(2E)-2-heptadecenoic acid",
                "(3E)-3-hexadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(E)-hexadec-2-enoic acid",
                "1-alpha-linolenoylglycerol",
                "1-erucoylglycerol",
                "14(Z)-eicosenoic acid",
                "2,4-Dimethyl-tetradecanoic acid",
                "2,4-dimethyl-2-eicosenoic acid",
                "2,6-dimethyl-hexadecanoic acid",
                "2,6-dimethyl-tetradecanoic acid",
                "2-hydroxybehenic acid",
                "3,5-dimethyl-tetradecanoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "5E-eicosenoic acid",
                "7-Palmitoleic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-linolenic acid",
                "arachidonic acid",
                "cis-vaccenic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "elaidic acid",
                "erucic acid",
                "ethyl arachidate",
                "gadoleic acid",
                "gorlic acid",
                "hexadecanoic acid",
                "linoleic acid",
                "myristic acid-13C3",
                "myristoleic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "petroselaidic acid",
                "petroselinamide",
                "petroselinic acid",
                "sapienic acid",
                "trans-12-elaidic acid",
                "trans-8-elaidic acid",
                "trans-gondoic acid",
                "trans-vaccenic acid",
                "vaccenic acid"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1)",
            "Linoleic acid (C18:2)",
            "Alpha-linolenic acid (C18:3)",
            "Arachidonic acid (C20:4)",
            "Eicosapentaenoic acid (EPA, C20:5)",
            "Docosahexaenoic acid (DHA, C22:6)",
            "Erucic acid (C22:1)",
            "Nervonic acid (C24:1)",
            "Lignoceric acid (C24:0)",
            "Behenic acid (C22:0)",
            "Arachidic acid (C20:0)",
            "Gondoic acid (C20:1)",
            "Mead acid (C20:3)",
            "Docosapentaenoic acid (DPA, C22:5)",
            "Elaidic acid (C18:1 trans)",
            "Vaccenic acid (C18:1 trans-11)",
            "Palmitoleic acid (C16:1)",
            "Margaric acid (C17:0)",
            "Heptadecenoic acid (C17:1)",
            "Eicosatrienoic acid (C20:3)",
            "Tricosanoic acid (C23:0)",
            "Cerotic acid (C26:0)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "alpha-linolenic acid",
                "arachidonic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "elaidic acid",
                "erucic acid",
                "heptadecenoic acid",
                "linoleic acid",
                "oleic acid",
                "palmitoleic acid",
                "stearic acid",
                "vaccenic acid"
            ],
            "mismatches": [
                "Palmitic acid (C16:0)",
                "Eicosapentaenoic acid (EPA, C20:5)",
                "Nervonic acid (C24:1)",
                "Lignoceric acid (C24:0)",
                "Behenic acid (C22:0)",
                "Arachidic acid (C20:0)",
                "Gondoic acid (C20:1)",
                "Mead acid (C20:3)",
                "Eicosatrienoic acid (C20:3)",
                "Margaric acid (C17:0)",
                "Tricosanoic acid (C23:0)",
                "Cerotic acid (C26:0)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(2E)-2-heptadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(3S)-3-hydroxydocosanoyl-CoA",
                "(E)-hexadec-2-enoic acid",
                "1-alpha-linolenoylglycerol",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "11,12-Epoxyeicosatrienoic acid",
                "2,4-Dimethyl-tetradecanoic acid",
                "2,6-dimethyl-tetradecanoic acid",
                "2-hydroxybehenic acid",
                "3,5-dimethyl-tetradecanoic acid",
                "3-hydroxydocosanoic acid",
                "3-oxo-tridecanoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "5,8,11-eicosatrienoic acid",
                "7,11,14-Eicosatrienoic acid",
                "7-Palmitoleic acid",
                "7-heptadecenoic acid",
                "7-methyl-hexadecanoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-linolenic acid",
                "arachidonic acid",
                "cis-vaccenic acid",
                "docosadienoic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "elaidic acid",
                "erucic acid",
                "ethyl arachidate",
                "gorlic acid",
                "heptadecenoic acid",
                "linoleic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "trans-12-elaidic acid",
                "trans-8-elaidic acid",
                "trans-gondoic acid",
                "trans-vaccenic acid",
                "vaccenic acid"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1)",
            "Linoleic acid (C18:2)",
            "\u03b1-Linolenic acid (C18:3)",
            "\u03b3-Linolenic acid (C18:3)",
            "Arachidic acid (C20:0)",
            "Gondoic acid (C20:1)",
            "Arachidonic acid (C20:4)",
            "Eicosapentaenoic acid (C20:5)",
            "Behenic acid (C22:0)",
            "Erucic acid (C22:1)",
            "Docosahexaenoic acid (C22:6)",
            "Lignoceric acid (C24:0)",
            "Nervonic acid (C24:1)",
            "Cerotic acid (C26:0)",
            "Montanic acid (C28:0)",
            "Melissic acid (C30:0)",
            "Lacceroic acid (C32:0)",
            "Geddic acid (C34:0)",
            "Hexatriacontylic acid (C36:0)",
            "Octatriacontylic acid (C38:0)",
            "Tetracosapentaenoic acid (C24:5)",
            "Tetracosahexaenoic acid (C24:6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "arachidonic acid",
                "docosahexaenoic acid",
                "erucic acid",
                "gamma-linolenic acid",
                "linoleic acid",
                "oleic acid",
                "tetracosahexaenoic acid"
            ],
            "mismatches": [
                "Palmitic acid (C16:0)",
                "Stearic acid (C18:0)",
                "Arachidic acid (C20:0)",
                "Gondoic acid (C20:1)",
                "Eicosapentaenoic acid (C20:5)",
                "Behenic acid (C22:0)",
                "Lignoceric acid (C24:0)",
                "Nervonic acid (C24:1)",
                "Cerotic acid (C26:0)",
                "Montanic acid (C28:0)",
                "Melissic acid (C30:0)",
                "Lacceroic acid (C32:0)",
                "Geddic acid (C34:0)",
                "Hexatriacontylic acid (C36:0)",
                "Octatriacontylic acid (C38:0)",
                "Tetracosapentaenoic acid (C24:5)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(10E)-octadecenoic acid",
                "(17R)-hydroxydocosahexaenoic acid",
                "(2E,4E,6E,8E,10E)-octadecapentaenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(4E,7E,10E,13E)-Hexadeca-4,7,10,13-tetraenoic acid",
                "(6Z,9Z,12Z,15Z,18Z,21Z)-tetracosahexaenoic acid",
                "(E)-hexadec-2-enoic acid",
                "(R)-lamenallenic acid",
                "(S)-laballenic acid",
                "(S)-lamenallenic acid",
                "1-alpha-linolenoylglycerol",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "2-hydroxybehenic acid",
                "3,9-hexadecadiynoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "5,7,9,11,13-tetradecapentaenoic acid",
                "6,8,10-Pentadecatriynoic acid",
                "6,9,12-Octadecatriynoic acid",
                "6,9-Hexadecadienoic acid",
                "8,11,14-Octadecatriynoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Paleic acid",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "alpha-linolenic acid",
                "arachidonic acid",
                "cholesteryl gamma-linolenate",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "ethyl arachidate",
                "gadelaidic acid",
                "gamma-linolenic acid",
                "gorlic acid",
                "linoleic acid",
                "octadecanoic acid",
                "octadecatetraenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "tetracosahexaenoic acid",
                "trans-gondoic acid"
            ],
            "TP": 7,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Oleic acid (C18:1)",
            "Linoleic acid (C18:2)",
            "Alpha-linolenic acid (C18:3)",
            "Arachidonic acid (C20:4)",
            "Eicosapentaenoic acid (EPA, C20:5)",
            "Docosahexaenoic acid (DHA, C22:6)",
            "Erucic acid (C22:1)",
            "Lignoceric acid (C24:0)",
            "Nervonic acid (C24:1)",
            "Cerotic acid (C26:0)",
            "Montanic acid (C28:0)",
            "Melissic acid (C30:0)",
            "Geddic acid (C32:0)",
            "Hexatriacontanoic acid (C36:0)",
            "Tetracontanoic acid (C40:0)",
            "Tetracosapentaenoic acid (C24:5)",
            "Tetracosahexaenoic acid (C24:6)",
            "Clupadonic acid (C28:5)",
            "Nisinic acid (C24:6)",
            "Osbondic acid (C22:5)",
            "Selacholeic acid (C24:5)",
            "Ximenynic acid (C26:4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitic acid (C16:0)",
                "Stearic acid (C18:0)",
                "Oleic acid (C18:1)",
                "Linoleic acid (C18:2)",
                "Alpha-linolenic acid (C18:3)",
                "Arachidonic acid (C20:4)",
                "Docosahexaenoic acid (DHA, C22:6)",
                "Erucic acid (C22:1)",
                "Tetracosahexaenoic acid (C24:6)",
                "Ximenynic acid (C26:4)"
            ],
            "mismatches": [
                "Eicosapentaenoic acid (EPA, C20:5)",
                "Lignoceric acid (C24:0)",
                "Nervonic acid (C24:1)",
                "Cerotic acid (C26:0)",
                "Montanic acid (C28:0)",
                "Melissic acid (C30:0)",
                "Geddic acid (C32:0)",
                "Hexatriacontanoic acid (C36:0)",
                "Tetracontanoic acid (C40:0)",
                "Tetracosapentaenoic acid (C24:5)",
                "Clupadonic acid (C28:5)",
                "Nisinic acid (C24:6)",
                "Osbondic acid (C22:5)",
                "Selacholeic acid (C24:5)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(17R)-hydroxydocosahexaenoic acid",
                "(2E,4E,6E,8E,10E)-octadecapentaenoic acid",
                "(4E,7E,10E,13E)-Hexadeca-4,7,10,13-tetraenoic acid",
                "(6Z,9Z,12Z,15Z,18Z,21Z)-tetracosahexaenoic acid",
                "(E)-hexadec-2-enoic acid",
                "(R)-lamenallenic acid",
                "(S)-2-hydroxyoctadecanoic acid",
                "(S)-3-hydroxyoctadecanoic acid",
                "(S)-laballenic acid",
                "(S)-lamenallenic acid",
                "(Z)-hexadec-7-enoic acid",
                "1-alpha-linolenoylglycerol",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "11Z-Hexadecen-7,9-diynoic acid",
                "3,4-tetradecadienoic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "5,7,9,11,13-tetradecapentaenoic acid",
                "5,8-Tetradecadienoic acid",
                "6,9-Hexadecadienoic acid",
                "8,11,14-Octadecatriynoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "8Z-decen-4,6-diynoic acid",
                "9,12-Hexadecadienoic acid",
                "Avenoleic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Octadec-9-ene-1,18-dioic-acid",
                "Paleic acid",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "Ximenynic acid",
                "alpha-linolenic acid",
                "arachidonic acid",
                "cetoleic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "gadelaidic acid",
                "gorlic acid",
                "hexadecadienoic acid",
                "lactobacillic acid",
                "linoleic acid",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "tetracosahexaenoic acid",
                "tetradecanoic acid",
                "tetradecenoic acid",
                "trans-gondoic acid"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Palmitic Acid (PA)",
            "Stearic Acid (SA)",
            "Oleic Acid (OA)",
            "Linoleic Acid (LA)",
            "Arachidonic Acid (AA)",
            "Eicosapentaenoic Acid (EPA)",
            "Docosahexaenoic Acid (DHA)",
            "Lignoceric Acid (LGA)",
            "Behenic Acid (BA)",
            "Erucic Acid (EA)",
            "Nervonic Acid (NA)",
            "Arachidic Acid (ADA)",
            "Gondoic Acid (GA)",
            "Cetoleic Acid (CA)",
            "Myristoleic Acid (MA)",
            "Gadoleic Acid (GDA)",
            "Elaidic Acid (EA)",
            "Paullinic Acid (PA)",
            "Petroselinic Acid (PA)",
            "Gondoic Acid (GA)",
            "Cetoleic Acid (CA)",
            "Myristoleic Acid (MA)",
            "Gadoleic Acid (GDA)",
            "Elaidic Acid (EA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitic Acid (PA)",
                "Oleic Acid (OA)",
                "Linoleic Acid (LA)",
                "Arachidonic Acid (AA)",
                "Docosahexaenoic Acid (DHA)",
                "Erucic Acid (EA)",
                "Cetoleic Acid (CA)",
                "Myristoleic Acid (MA)",
                "Gadoleic Acid (GDA)",
                "Elaidic Acid (EA)",
                "Petroselinic Acid (PA)"
            ],
            "mismatches": [
                "Stearic Acid (SA)",
                "Eicosapentaenoic Acid (EPA)",
                "Lignoceric Acid (LGA)",
                "Behenic Acid (BA)",
                "Nervonic Acid (NA)",
                "Arachidic Acid (ADA)",
                "Gondoic Acid (GA)",
                "Paullinic Acid (PA)"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(9E)-tetradecenoic acid",
                "1-erucoylglycerol",
                "1-palmitoyl-2-propionyl-sn-glycero-3-phosphocholine",
                "12-oxo-octadecanoic acid",
                "2-hydroxybehenic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "5-DOXYL-stearic acid",
                "Avenoleic acid",
                "Elaidolinolenic acid",
                "Himeic acid B",
                "Lyngbic acid",
                "Palmitic acid(d3)",
                "Pentadecylic acid(d3)",
                "Stearic acid(d3)",
                "alpha-licanic acid",
                "arachidonic acid",
                "cetoleic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "elaidic acid",
                "erucic acid",
                "erucoyl-CoA",
                "ethyl arachidate",
                "gadelaidic acid",
                "gadoleic acid",
                "gorlic acid",
                "linoleic acid",
                "linolenic acid",
                "methyl arachidonate",
                "myristoleic acid",
                "myristyl palmitate",
                "octadecanoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "petroselaidic acid",
                "petroselinamide",
                "petroselinic acid",
                "scleropyric acid",
                "stearolic acid",
                "trans-12-elaidic acid",
                "trans-gondoic acid"
            ],
            "TP": 11,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": "[\n\"Palmitic acid (C16:0)\" ,\n\"Stearic acid (C18:0)\" ,\n\"Oleic acid (C18:1)\" ,\n\"Linoleic acid (C18:2)\" ,\n\"Linolenic acid (C18:3)\" ,\n\"Arachidonic acid (C20:4)\" ,\n\"Eicosapentaenoic acid (EPA, C20:5)\" ,\n\"Docosahexaenoic acid (DHA, C22:6)\" ,\n\"Gamma-linolenic acid (GLA, C18:3)\" ,\n\"Alpha-linolenic acid (ALA, C18:3)\" ,\n\"Behenic acid (C22:0)\" ,\n\"Lignoceric acid (C24:0)\" ,\n\"Sphingomyelin\" ,\n\"Phosphatidylcholine\" ,\n\"Phosphatidylethanolamine\" ,\n\"Phosphatidylinositol\" ,\n\"Triacylglycerol\" ,\n\"Dietary fat\" ,\n\"Body fat\" ,\n\"Adipose tissue\" ,\n\"Cholesterol ester\" ,\n\"Phospholipid\" ,\n\"Cell membrane\" ,\n\"Plasma lipoprotein\" ,\n\"VLDL\" ,\n\"HDL\" ,\n\"LDL\"",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": [
            "Myristic acid (C14:0)",
            "Palmitic acid (C16:0)",
            "Stearic acid (C18:0)",
            "Arachidic acid (C20:0)",
            "Behenic acid (C22:0)",
            "Lignoceric acid (C24:0)",
            "Cerotic acid (C26:0)",
            "Montanic acid (C28:0)",
            "Melissic acid (C30:0)",
            "Palmitoleic acid (C16:1)",
            "Oleic acid (C18:1)",
            "Vaccenic acid (C18:1)",
            "Gadoleic acid (C20:1)",
            "Erucic acid (C22:1)",
            "Nervonic acid (C24:1)",
            "Linoleic acid (C18:2)",
            "Gamma-linolenic acid (C18:3)",
            "Arachidonic acid (C20:4)",
            "Eicosapentaenoic acid (C20:5)",
            "Docosahexaenoic acid (C22:6)",
            "Cerulenin (C18:2)",
            "Ricinoleic acid (C18:1)",
            "Dihomo-gamma-linolenic acid (C20:3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitoleic acid",
                "Oleic acid",
                "Vaccenic acid",
                "Gadoleic acid",
                "Erucic acid",
                "Linoleic acid",
                "Gamma-linolenic acid",
                "Arachidonic acid",
                "Docosahexaenoic acid",
                "Ricinoleic acid"
            ],
            "mismatches": [
                "Myristic acid (C14:0)",
                "Palmitic acid (C16:0)",
                "Stearic acid (C18:0)",
                "Arachidic acid (C20:0)",
                "Behenic acid (C22:0)",
                "Lignoceric acid (C24:0)",
                "Cerotic acid (C26:0)",
                "Montanic acid (C28:0)",
                "Melissic acid (C30:0)",
                "Nervonic acid (C24:1)",
                "Eicosapentaenoic acid (C20:5)",
                "Cerulenin (C18:2)",
                "Dihomo-gamma-linolenic acid (C20:3)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(10E)-octadecenoic acid",
                "(3R)-3,22-dihydroxybehenic acid",
                "(E)-hexadec-2-enoic acid",
                "(R)-lamenallenic acid",
                "(S)-laballenic acid",
                "(S)-lamenallenic acid",
                "1-arachidonoylglycerol",
                "1-erucoylglycerol",
                "2-Hydroxylinolenic acid",
                "2-hydroxybehenic acid",
                "4,8,12,15,18-eicosapentaenoic acid",
                "4,8-dimethyl-hexadecanoic acid",
                "4,8-dimethyl-pentadecanoic acid",
                "7-Palmitoleic acid",
                "8,11,14-Octadecatriynoic acid",
                "8-Hydroxyhexadecanoic acid",
                "8-methyl-hexadecanoic acid",
                "8-methyl-octadecanoic acid",
                "8E-heptadecenoic acid",
                "Ceriporic acid A",
                "Ceriporic acid C",
                "Ceriporic acid D",
                "Dihomo-linoleate (20:2n6)",
                "Glycerol 1-hexadecanoate",
                "Linoleic acid(d4)",
                "Margaric acid(d3)",
                "Paleic acid",
                "Palmitic acid(d3)",
                "Stearic acid(d3)",
                "arachidonic acid",
                "cholesteryl gamma-linolenate",
                "cis-8-heptadecenoic acid",
                "cis-vaccenic acid",
                "docosahexaenoic acid",
                "docosapentaenoic acid",
                "docosatrienoic acid",
                "erucic acid",
                "ethyl arachidate",
                "gadoleic acid",
                "gamma-linolenic acid",
                "linoleic acid",
                "methyl gamma-linolenate",
                "myristic acid-13C3",
                "myristoleic acid",
                "octadecanoic acid",
                "octadecatetraenoic acid",
                "oleic acid",
                "palmitic acid-d31",
                "palmitoleic acid",
                "ricinoleic acid",
                "trans-vaccenic acid",
                "vaccenic acid"
            ],
            "TP": 10,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "long-chain fatty acid",
        "domain": "chemistry",
        "response": "Sorry - this model is unable to respond to this request.",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]