[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Cyclopropanecarboxylic acid (CPA)",
            "Cyclopropylpropanoic acid",
            "5-Methylcyclohex-1-ene-1-carboxylic acid",
            "Cyclopent-1-enecarboxylic acid",
            "Cyclohex-1-enecarboxylic acid",
            "Cyclohept-1-enecarboxylic acid",
            "Cyclooct-1-enecarboxylic acid",
            "Cyclonon-1-enecarboxylic acid",
            "Cyclodec-1-enecarboxylic acid",
            "Cyclopent-2-enecarboxylic acid",
            "Cyclohex-2-enecarboxylic acid",
            "Cyclohept-2-enecarboxylic acid",
            "Cyclooct-2-enecarboxylic acid",
            "Cyclonon-2-enecarboxylic acid",
            "Cyclodec-2-enecarboxylic acid",
            "Cyclopent-3-enecarboxylic acid",
            "Cyclohex-3-enecarboxylic acid",
            "Cyclohept-3-enecarboxylic acid",
            "Cyclooct-3-enecarboxylic acid",
            "Cyclonon-3-enecarboxylic acid",
            "Cyclodec-3-enecarboxylic acid",
            "Cyclopent-4-enecarboxylic acid",
            "Cyclohex-4-enecarboxylic acid",
            "Cyclohept-4-enecarboxylic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclopropanecarboxylic acid (CPA)",
                "Cyclopropylpropanoic acid",
                "5-Methylcyclohex-1-ene-1-carboxylic acid",
                "Cyclopent-1-enecarboxylic acid",
                "Cyclohex-1-enecarboxylic acid",
                "Cyclohept-1-enecarboxylic acid",
                "Cyclooct-1-enecarboxylic acid",
                "Cyclonon-1-enecarboxylic acid",
                "Cyclodec-1-enecarboxylic acid",
                "Cyclopent-2-enecarboxylic acid",
                "Cyclohex-2-enecarboxylic acid",
                "Cyclohept-2-enecarboxylic acid",
                "Cyclooct-2-enecarboxylic acid",
                "Cyclonon-2-enecarboxylic acid",
                "Cyclodec-2-enecarboxylic acid",
                "Cyclopent-3-enecarboxylic acid",
                "Cyclohex-3-enecarboxylic acid",
                "Cyclohept-3-enecarboxylic acid",
                "Cyclooct-3-enecarboxylic acid",
                "Cyclonon-3-enecarboxylic acid",
                "Cyclodec-3-enecarboxylic acid",
                "Cyclopent-4-enecarboxylic acid",
                "Cyclohex-4-enecarboxylic acid",
                "Cyclohept-4-enecarboxylic acid"
            ],
            "true_referents": [
                "(13S)-12,13-epoxyoctadeca-9,11-dienoic acid",
                "(2E,6E,10R,11S)-10,11-epoxy-3,7,11-trimethyltrideca-2,6-dienoic acid",
                "(4Z,9E,11E,13Z,15E,17S,19Z)-7,8-epoxy-17-hydroxydocosahexaenoic acid",
                "(7Z,13Z,16Z,19Z)-10,11-epoxydocosatetraenoic acid",
                "(9Z,13S,15Z)-12,13-epoxyoctadeca-9,11,15-trienoic acid",
                "11,12-epoxy-(5Z,8Z,14Z)-icosatrienoyl-CoA",
                "2-carboxyethyl-5-furanpentanoic acid",
                "3,4-dimethyl-5-carboxyethyl-2-furanpentanoic acid",
                "3,4-dimethyl-5-carboxyethyl-2-furanpropanoic acid",
                "3-carboxy-4-methyl-5-(4-oxopentyl)-2-furanpropanoic acid",
                "3-carboxy-4-methyl-5-propylene-2-furanpropanoic acid",
                "3-methyl-5-carboxypropyl-2-furanpropanoic acid",
                "4-methyl-5-carboxyethyl-2-furanacrylic acid",
                "4-methyl-5-carboxyethyl-2-furanpentanoic acid",
                "4S(5)-epoxy-17R-hydroxydocosahexaenoic acid",
                "5,6-Epoxyoctadeca-7,9-diynoic acid",
                "5,6-epoxy-(8Z,11Z,14Z)-icosatrienoyl-CoA",
                "5-((E)-hept-4-en-2-yne-1-one-1-yl)-2-furanacrylic acid",
                "8,9-epoxy-(5Z,11Z,14Z)-icosatrienoyl-CoA",
                "8-Hydroxy-9,10-epoxystearic acid",
                "9,10-epoxy-18-hydroxyoctadecanoic acid",
                "9,10-epoxyoctadecanoic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxyoctadecenoic acid"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Ergosterol (Ergosterol)",
            "Cholesterol (Cholesterol)",
            "Vitamin D2 (Ergocalciferol)",
            "Vitamin D3 (Cholecalciferol)",
            "Prostaglandin F2alpha (PGF2\u03b1)",
            "Prostaglandin E2 (PGE2)",
            "Thromboxane A2 (TXA2)",
            "Leukotriene B4 (LTB4)",
            "Vitamin K2 (Menaquinone)",
            "Anandamide (Anandamide)",
            "2-Arachidonoylglycerol (2-AG)",
            "Oleoylethanolamide (OEA)",
            "Palmitoylethanolamide (PEA)",
            "Docosahexaenoylethanolamide (DHEA)",
            "Eicosapentaenoylethanolamide (EPEA)",
            "Lipoxin A4 (LXA4)",
            "Resolvin D1 (RvD1)",
            "Protectin D1 (PD1)",
            "Maresin 1 (MaR1)",
            "Isoprostane F2alpha (IsoP F2\u03b1)",
            "Isoprostane E2 (IsoP E2)",
            "Isoxazoline (Isoxazoline)",
            "Thyroxine (T4)",
            "Triiodothyronine (T3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ergosterol (Ergosterol)",
                "Cholesterol (Cholesterol)",
                "Vitamin D2 (Ergocalciferol)",
                "Vitamin D3 (Cholecalciferol)",
                "Prostaglandin F2alpha (PGF2\u03b1)",
                "Prostaglandin E2 (PGE2)",
                "Thromboxane A2 (TXA2)",
                "Leukotriene B4 (LTB4)",
                "Vitamin K2 (Menaquinone)",
                "Anandamide (Anandamide)",
                "2-Arachidonoylglycerol (2-AG)",
                "Oleoylethanolamide (OEA)",
                "Palmitoylethanolamide (PEA)",
                "Docosahexaenoylethanolamide (DHEA)",
                "Eicosapentaenoylethanolamide (EPEA)",
                "Lipoxin A4 (LXA4)",
                "Resolvin D1 (RvD1)",
                "Protectin D1 (PD1)",
                "Maresin 1 (MaR1)",
                "Isoprostane F2alpha (IsoP F2\u03b1)",
                "Isoprostane E2 (IsoP E2)",
                "Isoxazoline (Isoxazoline)",
                "Thyroxine (T4)",
                "Triiodothyronine (T3)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(2E,11Z)-Wyerone acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(4Z,7Z,13Z,16Z,19Z)-10,11-epoxydocosapentaenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(8S)-hepoxilin A3",
                "(R)-lipoamide",
                "(S)-lipoic acid",
                "11(S)-hydroxy-14(S),15(S)-hepoxilin A3",
                "26-deoxymonensin A",
                "4'-oxomacrophorin D",
                "4,5-epoxy-7z,10z,13z,16z,19z-docosapentaenoic acid, methyl ester",
                "4,5-leukotriene A4",
                "4-(4-ethyl-1-piperazinyl)-4-oxo-2-butenoic acid",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "8-Hydroxy-9,10-epoxystearic acid",
                "Irpexlacte D",
                "Phellinulin D",
                "Pteridic acid D",
                "cis-9,10-epoxyoctadecanoic acid",
                "eoxin A4",
                "epoxydocosapentaenoic acid",
                "juvenile hormone III acid",
                "leukotriene A4",
                "lipoamide"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Cyclopropane fatty acid (CPA)",
            "Cyclopropaneoctanoic acid (CPO)",
            "Cyclopropaneheptanoic acid (CPA)",
            "Cyclopropanehexanoic acid (CPH)",
            "Cyclopentane fatty acid",
            "Cyclopentanoic acid",
            "Cyclohexane fatty acid",
            "Cyclohexanoic acid",
            "Cycloheptane fatty acid",
            "Cycloheptanoic acid",
            "Cyclooctane fatty acid",
            "Cyclooctanoic acid",
            "Cyclopentylacetic acid",
            "Cyclohexylacetic acid",
            "Cycloheptylacetic acid",
            "Cyclooctylacetic acid",
            "Cyclopentylpropionic acid",
            "Cyclohexylpropionic acid",
            "Cycloheptylpropionic acid",
            "Cyclooctylpropionic acid",
            "Cyclopentylbutyric acid",
            "Cyclohexylbutyric acid",
            "Cycloheptylbutyric acid",
            "Cyclooctylbutyric acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclopropane fatty acid (CPA)",
                "Cyclopropaneoctanoic acid (CPO)",
                "Cyclopropaneheptanoic acid (CPA)",
                "Cyclopropanehexanoic acid (CPH)",
                "Cyclopentane fatty acid",
                "Cyclopentanoic acid",
                "Cyclohexane fatty acid",
                "Cyclohexanoic acid",
                "Cycloheptane fatty acid",
                "Cycloheptanoic acid",
                "Cyclooctane fatty acid",
                "Cyclooctanoic acid",
                "Cyclopentylacetic acid",
                "Cyclohexylacetic acid",
                "Cycloheptylacetic acid",
                "Cyclooctylacetic acid",
                "Cyclopentylpropionic acid",
                "Cyclohexylpropionic acid",
                "Cycloheptylpropionic acid",
                "Cyclooctylpropionic acid",
                "Cyclopentylbutyric acid",
                "Cyclohexylbutyric acid",
                "Cycloheptylbutyric acid",
                "Cyclooctylbutyric acid"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(13S)-12,13-epoxyoctadeca-9,11-dienoic acid",
                "(9R,10S)-9,10-epoxyoctadecanoic acid",
                "(9S,10R)-9,10-epoxy-18-hydroxyoctadecanoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "11,12-epoxy-(5Z,8Z,14Z)-icosatrienoyl-CoA",
                "2-(5-hexadecylfuran-2-yl)-acetic acid",
                "2-carboxyethyl-5-furanpentanoic acid",
                "3,4-dimethyl-5-carboxybutyl-2-furanpentanoic acid",
                "3,4-dimethyl-5-carboxypropyl-2-furanpentanoic acid",
                "3-Carboxy-4-methyl-5-pentyl-2-furanpropanoic acid",
                "3-Methyl-5-propyl-2-furanheptanoic acid",
                "3-carboxy-4-methyl-5-(1-hydroxypropyl)-2-furanpropionic acid",
                "3-carboxy-4-methyl-5-(4-hydroxypentyl)-2-furanpropanoic acid",
                "3-carboxy-4-methyl-5-(4-oxopentyl)-2-furanpropanoic acid",
                "3-carboxy-4-methyl-5-propylene-2-furanpropanoic acid",
                "3-methyl-5-carboxypropyl-2-furanpropanoic acid",
                "4-methyl-5-carboxyethyl-2-furanacrylic acid",
                "5,6-Epoxyoctadeca-7,9-diynoic acid",
                "5,6-epoxy-(8Z,11Z,14Z)-icosatrienoyl-CoA",
                "5-((E)-hept-4-en-2-yne-1-one-1-yl)-2-furanacrylic acid",
                "5-Pentyl-2-furanheptanoic acid",
                "8-Hydroxy-9,10-epoxystearic acid",
                "9,10-epoxyoctadecanoic acid",
                "Ambuic acid",
                "Demethyl-harzianic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxy fatty acid",
                "epoxydocosatetraenoic acid",
                "lipoic acid"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Sphingosine (Sph)",
            "Prostaglandin E2 (PGE2)",
            "Arachidonic Acid (AA)",
            "Docosahexaenoic Acid-derived Neuroprotectin D1 (NPD1)",
            "Lysophosphatidic Acid (LPA)",
            "Ceramide (Cer)",
            "Phosphatidylinositol (PI)",
            "Sphingomyelin (SM)",
            "Dinoprostone",
            "Leukotriene B4 (LTB4)",
            "Prostaglandin F2\u03b1 (PGF2\u03b1)",
            "Eicosapentaenoic Acid-derived Resolvin E1 (RvE1)",
            "Cardiolipin",
            "Phosphatidylserine (PS)",
            "Phosphatidylethanolamine (PE)",
            "Ganglioside GM1",
            "Thromboxane A2 (TXA2)",
            "Lipopolysaccharide (LPS)",
            "Squalene epoxide",
            "Vitamin K1 (Phylloquinone)",
            "Biotin (Vitamin B7)",
            "Menatetrenone (Vitamin K2)",
            "Dolichol phosphate",
            "Plasmanylethanolamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Sphingosine (Sph)",
                "Prostaglandin E2 (PGE2)",
                "Arachidonic Acid (AA)",
                "Docosahexaenoic Acid-derived Neuroprotectin D1 (NPD1)",
                "Lysophosphatidic Acid (LPA)",
                "Ceramide (Cer)",
                "Phosphatidylinositol (PI)",
                "Sphingomyelin (SM)",
                "Dinoprostone",
                "Leukotriene B4 (LTB4)",
                "Prostaglandin F2\u03b1 (PGF2\u03b1)",
                "Eicosapentaenoic Acid-derived Resolvin E1 (RvE1)",
                "Cardiolipin",
                "Phosphatidylserine (PS)",
                "Phosphatidylethanolamine (PE)",
                "Ganglioside GM1",
                "Thromboxane A2 (TXA2)",
                "Lipopolysaccharide (LPS)",
                "Squalene epoxide",
                "Vitamin K1 (Phylloquinone)",
                "Biotin (Vitamin B7)",
                "Menatetrenone (Vitamin K2)",
                "Dolichol phosphate",
                "Plasmanylethanolamine"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(5Z,8R,9Z,11Z,14Z)-8,9-epoxyicosatetraenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(R)-lipoamide",
                "(R)-lipoyl-GMP",
                "(S)-lipoic acid",
                "1-hexadecanoyl-2-(9,10-epoxyoctadecanoyl)-sn-glycero-3-phosphocholine",
                "2-Demethylmonensin A",
                "26-deoxymonensin A",
                "4'-oxomacrophorin D",
                "4,5-epoxy-7z,10z,13z,16z,19z-docosapentaenoic acid, methyl ester",
                "4,5-leukotriene A4",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "8-Hydroxy-9,10-epoxystearic acid",
                "9,10-epoxyoctadecanoic acid",
                "Bisnorbiotin",
                "N-[(5Z,8Z,11Z)-14,15-epoxyicosatrienoyl]ethanolamine",
                "Neoenterocin A",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxy fatty acid",
                "epoxydocosapentaenoic acid",
                "epoxydocosatetraenoic acid",
                "epoxystearic acid",
                "juvenile hormone III acid",
                "leukotriene A4",
                "lipoamide",
                "lipoic acid",
                "lipoyl-AMP"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Prostaglandin E2 (PGE2)",
            "Prostaglandin D2 (PGD2)",
            "Prostaglandin F2\u03b1 (PGF2\u03b1)",
            "Leukotriene B4 (LTB4)",
            "Leukotriene C4 (LTC4)",
            "Leukotriene D4 (LTD4)",
            "Thromboxane A2 (TXA2)",
            "Thromboxane B2 (TXB2)",
            "Lipoxin A4 (LXA4)",
            "Lipoxin B4 (LXB4)",
            "Resolvin E1 (RvE1)",
            "Resolvin D1 (RvD1)",
            "Resolvin D2 (RvD2)",
            "Maresin 1 (MaR1)",
            "Protectin D1 (PD1)",
            "Isoprostane E2 (iPE2)",
            "Isoprostane F2\u03b1 (iPF2\u03b1)",
            "Epoxyeicosatrienoic acid (EET)",
            "Hepoxilin A3 (HxA3)",
            "Hepoxilin B3 (HxB3)",
            "Cyclopentenone prostaglandin A1 (PGA1)",
            "Cyclopentenone prostaglandin A2 (PGA2)",
            "Cyclopentenone prostaglandin J2 (PGJ2)",
            "Cyclopentenone prostaglandin D2 (\u039412-PGD2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepoxilin A3 (HxA3)",
                "Hepoxilin B3 (HxB3)"
            ],
            "mismatches": [
                "Prostaglandin E2 (PGE2)",
                "Prostaglandin D2 (PGD2)",
                "Prostaglandin F2\u03b1 (PGF2\u03b1)",
                "Leukotriene B4 (LTB4)",
                "Leukotriene C4 (LTC4)",
                "Leukotriene D4 (LTD4)",
                "Thromboxane A2 (TXA2)",
                "Thromboxane B2 (TXB2)",
                "Lipoxin A4 (LXA4)",
                "Lipoxin B4 (LXB4)",
                "Resolvin E1 (RvE1)",
                "Resolvin D1 (RvD1)",
                "Resolvin D2 (RvD2)",
                "Maresin 1 (MaR1)",
                "Protectin D1 (PD1)",
                "Isoprostane E2 (iPE2)",
                "Isoprostane F2\u03b1 (iPF2\u03b1)",
                "Epoxyeicosatrienoic acid (EET)",
                "Cyclopentenone prostaglandin A1 (PGA1)",
                "Cyclopentenone prostaglandin A2 (PGA2)",
                "Cyclopentenone prostaglandin J2 (PGJ2)",
                "Cyclopentenone prostaglandin D2 (\u039412-PGD2)"
            ],
            "true_referents": [
                "(8S)-hepoxilin A3",
                "(9Z,11Z,13S,15Z)-12,13-epoxyoctadecatrienoic acid",
                "(R)-lipoamide",
                "26-deoxymonensin A",
                "4'-oxomacrophorin D",
                "4,5-leukotriene A4",
                "8(9)-EET methyl ester",
                "Irpexlacte D",
                "Phellidene E",
                "Phellinulin D",
                "Pteridic acid D",
                "eoxin A4",
                "epoxydocosatetraenoic acid",
                "hepoxilin A3",
                "hepoxilin B3",
                "leukotriene A4"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Arachidonic acid (AA)",
            "Docosahexaenoic acid (DHA)",
            "Eicosapentaenoic acid (EPA)",
            "Linoleic acid (LA)",
            "Oleic acid (OA)",
            "Palmitoleic acid (POA)",
            "Stearidonic acid (SDA)",
            "Gamma-linolenic acid (GLA)",
            "Alpha-linolenic acid (ALA)",
            "Cerotic acid (C26:0)",
            "Myristoleic acid (14:1)",
            "Pentadecanoic acid (15:0)",
            "Lauric acid (C12:0)",
            "Capric acid (C10:0)",
            "Caprylic acid (C8:0)",
            "Cyclopropane fatty acid (CFA)",
            "Cyclopentane fatty acid (CPFA)",
            "Cyclohexane fatty acid (CHFA)",
            "Cycloheptane fatty acid (CH7FA)",
            "Cyclooctane fatty acid (COFA)",
            "Dodecylcyclopropane carboxylic acid (DCPCA)",
            "Octadecanoic acid (stearic acid)",
            "Tetracosanoic acid (lignoceric acid)",
            "Hexacosanoic acid (cerotic acid)",
            "Octadecatrienoic acid (OT)",
            "Eicosatrienoic acid (ETE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Arachidonic acid (AA)",
                "Docosahexaenoic acid (DHA)",
                "Eicosapentaenoic acid (EPA)",
                "Linoleic acid (LA)",
                "Oleic acid (OA)",
                "Palmitoleic acid (POA)",
                "Stearidonic acid (SDA)",
                "Gamma-linolenic acid (GLA)",
                "Alpha-linolenic acid (ALA)",
                "Cerotic acid (C26:0)",
                "Myristoleic acid (14:1)",
                "Pentadecanoic acid (15:0)",
                "Lauric acid (C12:0)",
                "Capric acid (C10:0)",
                "Caprylic acid (C8:0)",
                "Cyclopropane fatty acid (CFA)",
                "Cyclopentane fatty acid (CPFA)",
                "Cyclohexane fatty acid (CHFA)",
                "Cycloheptane fatty acid (CH7FA)",
                "Cyclooctane fatty acid (COFA)",
                "Dodecylcyclopropane carboxylic acid (DCPCA)",
                "Octadecanoic acid (stearic acid)",
                "Tetracosanoic acid (lignoceric acid)",
                "Hexacosanoic acid (cerotic acid)",
                "Octadecatrienoic acid (OT)",
                "Eicosatrienoic acid (ETE)"
            ],
            "true_referents": [
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(4Z,7Z,13Z,16Z,19Z)-10,11-epoxydocosapentaenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(9R,10S)-9,10-epoxyoctadecanoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(S)-lipoic acid",
                "3,4-dimethyl-5-carboxyethyl-2-furanacrylic acid",
                "3,4-dimethyl-5-propyl-2-furanoctanoic acid;",
                "3-Methyl-5-propyl-2-furanheptanoic acid",
                "4,5-epoxy-7z,10z,13z,16z,19z-docosapentaenoic acid, methyl ester",
                "9,10-epoxyoctadecanoic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid"
            ],
            "TP": 0,
            "FP": 26,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Ricinoleic Acid (RA)",
            "Coronaric Acid (CA)",
            "Conjugated Linoleic Acid (CLA)",
            "Pinolenic Acid (PA)",
            "Arachidonic Acid (AA)",
            "Eicosapentaenoic Acid (EPA)",
            "Docosahexaenoic Acid (DHA)",
            "Alpha-Linolenic Acid (ALA)",
            "Gamma-Linolenic Acid (GLA)",
            "Stearidonic Acid (SDA)",
            "Docosapentaenoic Acid (DPA)",
            "Linoleic Acid (LA)",
            "Oleic Acid (OA)",
            "Palmitic Acid (PALA)",
            "Myristic Acid (MA)",
            "Lauric Acid (LAU)",
            "Capric Acid (CA)",
            "Caprylic Acid (CAPA)",
            "Caproic Acid (CAP)",
            "Butyric Acid (BA)",
            "Propionic Acid (PA)",
            "Acetic Acid (AA)",
            "Valeric Acid (VA)",
            "Isovaleric Acid (IVA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ricinoleic Acid (RA)",
                "Coronaric Acid (CA)",
                "Conjugated Linoleic Acid (CLA)",
                "Pinolenic Acid (PA)",
                "Arachidonic Acid (AA)",
                "Eicosapentaenoic Acid (EPA)",
                "Docosahexaenoic Acid (DHA)",
                "Alpha-Linolenic Acid (ALA)",
                "Gamma-Linolenic Acid (GLA)",
                "Stearidonic Acid (SDA)",
                "Docosapentaenoic Acid (DPA)",
                "Linoleic Acid (LA)",
                "Oleic Acid (OA)",
                "Palmitic Acid (PALA)",
                "Myristic Acid (MA)",
                "Lauric Acid (LAU)",
                "Capric Acid (CA)",
                "Caprylic Acid (CAPA)",
                "Caproic Acid (CAP)",
                "Butyric Acid (BA)",
                "Propionic Acid (PA)",
                "Acetic Acid (AA)",
                "Valeric Acid (VA)",
                "Isovaleric Acid (IVA)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(4Z,7Z,13Z,16Z,19Z)-10,11-epoxydocosapentaenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(9R,10S)-9,10-epoxyoctadecanoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(S)-lipoic acid",
                "5-Butyl-2-furanoctanoic acid",
                "5-pentyl-2-furannonanoic acid",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "9,10-epoxyoctadecanoic acid",
                "Ambuic acid",
                "Monic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid",
                "lipoic acid"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Arachidonic acid",
            "Docosahexaenoic acid",
            "Eicosapentaenoic acid",
            "Linoleic acid",
            "Oleic acid",
            "Palmitic acid",
            "Stearic acid",
            "Alpha-linolenic acid",
            "Gamma-linolenic acid",
            "Dihomo-gamma-linolenic acid",
            "Eicosadienoic acid",
            "Erucic acid",
            "Lauric acid",
            "Myristic acid",
            "Pentadecanoic acid",
            "Heptadecanoic acid",
            "Nonadecanoic acid",
            "Behenic acid",
            "Lignoceric acid",
            "Cerotic acid",
            "Montanic acid",
            "Melissic acid",
            "Lacceroic acid",
            "Cerotic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Arachidonic acid",
                "Docosahexaenoic acid",
                "Eicosapentaenoic acid",
                "Linoleic acid",
                "Oleic acid",
                "Palmitic acid",
                "Stearic acid",
                "Alpha-linolenic acid",
                "Gamma-linolenic acid",
                "Dihomo-gamma-linolenic acid",
                "Eicosadienoic acid",
                "Erucic acid",
                "Lauric acid",
                "Myristic acid",
                "Pentadecanoic acid",
                "Heptadecanoic acid",
                "Nonadecanoic acid",
                "Behenic acid",
                "Lignoceric acid",
                "Cerotic acid",
                "Montanic acid",
                "Melissic acid",
                "Lacceroic acid"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(4Z,7Z,13Z,16Z,19Z)-10,11-epoxydocosapentaenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(9R,10S)-9,10-epoxyoctadecanoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(R)-lipoic acid",
                "(S)-lipoic acid",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "9,10-epoxyoctadecanoic acid",
                "Ambuic acid",
                "Harzianic acid",
                "Monic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid",
                "epoxystearic acid",
                "lipoic acid"
            ],
            "TP": 0,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Gamma-Decalactone (\u03b3-DecaL)",
            "Gamma-Undecalactone (\u03b3-UndecaL)",
            "Delta-Decalactone (\u03b4-DecaL)",
            "Delta-Undecalactone (\u03b4-UndecaL)",
            "Gamma-Dodecalactone (\u03b3-DodecaL)",
            "Delta-Dodecalactone (\u03b4-DodecaL)",
            "Gamma-Nonalactone (\u03b3-Nonalactone)",
            "Gamma-Pentadecalactone (\u03b3-PentadecaL)",
            "Gamma-Tetradecalactone (\u03b3-TetradecaL)",
            "Gamma-Tridecalactone (\u03b3-TridecaL)",
            "Delta-Heptadecalactone (\u03b4-HeptadecaL)",
            "Delta-Octadecalactone (\u03b4-OctadecaL)",
            "Gamma-Eicosalactone (\u03b3-EicosaL)",
            "Delta-Eicosalactone (\u03b4-EicosaL)",
            "Gamma-Pentadecalactone (\u03b3-PentadecaL)",
            "Gamma-Hexadecalactone (\u03b3-HexadecaL)",
            "Gamma-Heptadecalactone (\u03b3-HeptadecaL)",
            "Delta-Heptadecalactone (\u03b4-HeptadecaL)",
            "Gamma-Octadecalactone (\u03b3-OctadecaL)",
            "Delta-Octadecalactone (\u03b4-OctadecaL)",
            "Gamma-Nonadecalactone (\u03b3-NonadecaL)",
            "Delta-Nonadecalactone (\u03b4-NonadecaL)",
            "Gamma-Decadecalactone (\u03b3-DecadecaL)",
            "Delta-Decadecalactone (\u03b4-DecadecaL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Gamma-Decalactone (\u03b3-DecaL)",
                "Gamma-Undecalactone (\u03b3-UndecaL)",
                "Delta-Decalactone (\u03b4-DecaL)",
                "Delta-Undecalactone (\u03b4-UndecaL)",
                "Gamma-Dodecalactone (\u03b3-DodecaL)",
                "Delta-Dodecalactone (\u03b4-DodecaL)",
                "Gamma-Nonalactone (\u03b3-Nonalactone)",
                "Gamma-Pentadecalactone (\u03b3-PentadecaL)",
                "Gamma-Tetradecalactone (\u03b3-TetradecaL)",
                "Gamma-Tridecalactone (\u03b3-TridecaL)",
                "Delta-Heptadecalactone (\u03b4-HeptadecaL)",
                "Delta-Octadecalactone (\u03b4-OctadecaL)",
                "Gamma-Eicosalactone (\u03b3-EicosaL)",
                "Delta-Eicosalactone (\u03b4-EicosaL)",
                "Gamma-Hexadecalactone (\u03b3-HexadecaL)",
                "Gamma-Heptadecalactone (\u03b3-HeptadecaL)",
                "Gamma-Octadecalactone (\u03b3-OctadecaL)",
                "Gamma-Nonadecalactone (\u03b3-NonadecaL)",
                "Delta-Nonadecalactone (\u03b4-NonadecaL)",
                "Gamma-Decadecalactone (\u03b3-DecadecaL)",
                "Delta-Decadecalactone (\u03b4-DecadecaL)"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(2E,6E,10R,11S)-10,11-epoxy-3,7,11-trimethyltrideca-2,6-dienoic acid",
                "(5Z,11Z,14Z,17Z)-8,9-epoxyicosatetraenoic acid",
                "(9S),10-epoxy-(10,12Z)-octadecadienoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(R)-lipoamide",
                "11,12-epoxy-(5Z,8Z,14Z)-icosatrienoyl-CoA",
                "3,4-dimethyl-5-carboxyethyl-2-furanhexanoic acid",
                "3,4-dimethyl-5-propyl-2-furanoctanoic acid;",
                "3-Methyl-5-propyl-2-furannonanoic acid",
                "4'-oxomacrophorin D",
                "4,5-leukotriene A4",
                "5,6-epoxy-(8Z,11Z,14Z)-icosatrienoyl-CoA",
                "5-Hexyl-2-furanhexanoic acid",
                "8-Hydroxy-9,10-epoxystearic acid",
                "9,10-epoxyoctadecanoic acid",
                "cis-9,10-epoxyoctadecanoic acid"
            ],
            "TP": 0,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Prostaglandin E2 (PGE2)",
            "Thromboxane A2 (TXA2)",
            "Prostacyclin (PGI2)",
            "Leukotriene B4 (LTB4)",
            "Lipoxin A4 (LXA4)",
            "Resolvin D1 (RvD1)",
            "Maresin 1 (MaR1)",
            "Protectin D1 (PD1)",
            "Jasmonic acid",
            "Vernolic acid",
            "Furan fatty acids",
            "Cyclopentenone prostaglandins",
            "Isoprostanes",
            "Neuroprostanes",
            "Phytoprostanes",
            "Clavulonic acid",
            "Lactobacillic acid",
            "Mycolic acids",
            "Chaulmoogric acid",
            "Hydnocarpic acid",
            "Gorlic acid",
            "Sterculic acid",
            "Malvalic acid",
            "Coronaric acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Vernolic acid"
            ],
            "mismatches": [
                "Prostaglandin E2 (PGE2)",
                "Thromboxane A2 (TXA2)",
                "Prostacyclin (PGI2)",
                "Leukotriene B4 (LTB4)",
                "Lipoxin A4 (LXA4)",
                "Resolvin D1 (RvD1)",
                "Maresin 1 (MaR1)",
                "Protectin D1 (PD1)",
                "Jasmonic acid",
                "Furan fatty acids",
                "Cyclopentenone prostaglandins",
                "Isoprostanes",
                "Neuroprostanes",
                "Phytoprostanes",
                "Clavulonic acid",
                "Lactobacillic acid",
                "Mycolic acids",
                "Chaulmoogric acid",
                "Hydnocarpic acid",
                "Gorlic acid",
                "Sterculic acid",
                "Malvalic acid",
                "Coronaric acid"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(8S)-hepoxilin A3",
                "(S)-lipoic acid",
                "26-deoxymonensin A",
                "4'-oxomacrophorin D",
                "4,5-leukotriene A4",
                "5-Butyl-2-furanoctanoic acid",
                "5-Hexyl-2-furanhexanoic acid",
                "5-Pentyl-2-furanoctanoic acid",
                "Ambuic acid",
                "Demethyl-harzianic acid",
                "Harzianic acid",
                "Homoharzianic acid",
                "Irpexlacte D",
                "Monic acid",
                "Oxazoltriene acid",
                "Phellinulin D",
                "Pteridic acid D",
                "Wyeronic acid",
                "eoxin A4",
                "epoxydocosapentaenoic acid",
                "epoxydocosatetraenoic acid",
                "epoxyoctadecenoic acid",
                "epoxystearic acid",
                "leukotriene A4",
                "lipoic acid",
                "vernolic acid"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Chaulmoogric acid",
            "Hydnocarpic acid",
            "Gorlic acid",
            "Erucic acid",
            "Lactobacillic acid",
            "Mycolic acid",
            "Phytomonic acid",
            "Retinoic acid",
            "Ricinoleic acid",
            "Densipolic acid",
            "Ximenynic acid",
            "Lumepueic acid",
            "Crepenynic acid",
            "Ximenic acid",
            "Bolekic acid",
            "Cyclopropaneoctanoic acid",
            "Cycloartenolic acid",
            "Juniperonic acid",
            "Podocarpic acid",
            "Abietic acid",
            "Isopimaric acid",
            "Levopimaric acid",
            "Neoabietic acid",
            "Dehydroabietic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Chaulmoogric acid",
                "Hydnocarpic acid",
                "Gorlic acid",
                "Erucic acid",
                "Lactobacillic acid",
                "Mycolic acid",
                "Phytomonic acid",
                "Retinoic acid",
                "Ricinoleic acid",
                "Densipolic acid",
                "Ximenynic acid",
                "Lumepueic acid",
                "Crepenynic acid",
                "Ximenic acid",
                "Bolekic acid",
                "Cyclopropaneoctanoic acid",
                "Cycloartenolic acid",
                "Juniperonic acid",
                "Podocarpic acid",
                "Abietic acid",
                "Isopimaric acid",
                "Levopimaric acid",
                "Neoabietic acid",
                "Dehydroabietic acid"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(R)-lipoic acid",
                "(S)-lipoic acid",
                "11,12-epoxy-(5Z,8Z,14Z)-icosatrienoyl-CoA",
                "17R,(16)-epoxy-(4Z,7Z,10Z,13Z,19Z)-docosahexa-4,7,10,13,15,19-enoic acid",
                "5,6-Epoxyoctadeca-7,9-diynoic acid",
                "5,6-epoxy-(8Z,11Z,14Z)-icosatrienoyl-CoA",
                "5S,6S-epoxy-7-undecynoic acid",
                "8,9-epoxy-(5Z,11Z,14Z)-icosatrienoyl-CoA",
                "9,10-epoxyoctadecanoic acid",
                "Ambuic acid",
                "Demethyl-harzianic acid",
                "Dihydrowyerone acid",
                "Harzianic acid",
                "Homoharzianic acid",
                "Isoharzianic acid",
                "Monic acid",
                "Neotetrafibricin A",
                "Pestalic acid B",
                "Wyerone acid",
                "Wyeronic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid",
                "epoxyoctadecenoic acid",
                "lipoic acid",
                "vernolic acid"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Furan fatty acids (F-acids)",
            "Pyran fatty acids (P-acids)",
            "Thiophene fatty acids (T-acids)",
            "Pyrrole fatty acids (Pyr-acids)",
            "Oxazole fatty acids (Ox-acids)",
            "Isoxazole fatty acids (Isox-acids)",
            "Pyrazole fatty acids (Pyz-acids)",
            "Imidazole fatty acids (Im-acids)",
            "Triazole fatty acids (Tr-acids)",
            "Tetrazole fatty acids (Tetr-acids)",
            "Oxadiazole fatty acids (Oxd-acids)",
            "Thiadiazole fatty acids (Thd-acids)",
            "Pyridine fatty acids (Pyr-acids)",
            "Pyridazine fatty acids (Pydz-acids)",
            "Pyrimidine fatty acids (Pym-acids)",
            "Pyrazine fatty acids (Pyz-acids)",
            "Triazine fatty acids (Trz-acids)",
            "Oxazine fatty acids (Oxz-acids)",
            "Thiazine fatty acids (Thz-acids)",
            "Benzofuran fatty acids (Bf-acids)",
            "Indole fatty acids (Ind-acids)",
            "Benzothiophene fatty acids (Bt-acids)",
            "Benzoxazole fatty acids (Box-acids)",
            "Benzimidazole fatty acids (Bim-acids)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Furan fatty acids (F-acids)",
                "Pyran fatty acids (P-acids)",
                "Thiophene fatty acids (T-acids)",
                "Pyrrole fatty acids (Pyr-acids)",
                "Oxazole fatty acids (Ox-acids)",
                "Isoxazole fatty acids (Isox-acids)",
                "Pyrazole fatty acids (Pyz-acids)",
                "Imidazole fatty acids (Im-acids)",
                "Triazole fatty acids (Tr-acids)",
                "Tetrazole fatty acids (Tetr-acids)",
                "Oxadiazole fatty acids (Oxd-acids)",
                "Thiadiazole fatty acids (Thd-acids)",
                "Pyridine fatty acids (Pyr-acids)",
                "Pyridazine fatty acids (Pydz-acids)",
                "Pyrimidine fatty acids (Pym-acids)",
                "Pyrazine fatty acids (Pyz-acids)",
                "Triazine fatty acids (Trz-acids)",
                "Oxazine fatty acids (Oxz-acids)",
                "Thiazine fatty acids (Thz-acids)",
                "Benzofuran fatty acids (Bf-acids)",
                "Indole fatty acids (Ind-acids)",
                "Benzothiophene fatty acids (Bt-acids)",
                "Benzoxazole fatty acids (Box-acids)",
                "Benzimidazole fatty acids (Bim-acids)"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(2E,11Z)-Wyerone acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(9Z,13S,15Z)-12,13-epoxyoctadeca-9,11,15-trienoic acid",
                "(R)-lipoic acid",
                "(S)-lipoic acid",
                "13-hydroxy-14,15-epoxy-(5Z,8Z,11Z)-icosatrienoic acid",
                "3,4-dimethyl-5-propyl-2-furanoctanoic acid;",
                "4,5-epoxy-7z,10z,13z,16z,19z-docosapentaenoic acid, methyl ester",
                "4-(4-ethyl-1-piperazinyl)-4-oxo-2-butenoic acid",
                "5,6-Epoxyoctadeca-7,9-diynoic acid",
                "5-Butyl-2-furanoctanoic acid",
                "5-Pentyl-2-furanoctanoic acid",
                "5-pentyl-2-furannonanoic acid",
                "7-(3-methyl-5-pentylfuran-2-yl)-heptanoic acid",
                "8-(5-hexylfuran-2-yl)octanoic acid",
                "9,10-epoxyoctadecanoic acid",
                "9-(3,4-dimethyl-5-pentylfuran-2-yl)-nonanoic acid",
                "Harzianic acid",
                "Monic acid",
                "Oxazoltetraene acid",
                "Oxazoltriene acid",
                "Trihazone F",
                "Wyerone acid",
                "Wyeronic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxy fatty acid",
                "epoxy(hydroxy)icosatrienoic acid"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Arachidonic Acid (AA)",
            "Docosahexaenoic Acid (DHA)",
            "Eicosapentaenoic Acid (EPA)",
            "Gamma-Linolenic Acid (GLA)",
            "Indole-3-Acetic Acid (IAA)",
            "Linoleic Acid (LA)",
            "Oleic Acid (OA)",
            "Palmitic Acid (PA)",
            "Stearic Acid (SA)",
            "Cholic Acid (CA)",
            "Deoxycholic Acid (DCA)",
            "Lithocholic Acid (LCA)",
            "Ursodeoxycholic Acid (UDCA)",
            "Prostaglandin E2 (PGE2)",
            "Prostaglandin F2\u03b1 (PGF2\u03b1)",
            "Thromboxane A2 (TXA2)",
            "Leukotriene B4 (LTB4)",
            "Leukotriene C4 (LTC4)",
            "Leukotriene D4 (LTD4)",
            "Leukotriene E4 (LTE4)",
            "Retinol (Vitamin A)",
            "Cholecalciferol (Vitamin D3)",
            "Tocopherol (Vitamin E)",
            "Ascorbic Acid (Vitamin C)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Arachidonic Acid (AA)",
                "Docosahexaenoic Acid (DHA)",
                "Eicosapentaenoic Acid (EPA)",
                "Gamma-Linolenic Acid (GLA)",
                "Indole-3-Acetic Acid (IAA)",
                "Linoleic Acid (LA)",
                "Oleic Acid (OA)",
                "Palmitic Acid (PA)",
                "Stearic Acid (SA)",
                "Cholic Acid (CA)",
                "Deoxycholic Acid (DCA)",
                "Lithocholic Acid (LCA)",
                "Ursodeoxycholic Acid (UDCA)",
                "Prostaglandin E2 (PGE2)",
                "Prostaglandin F2\u03b1 (PGF2\u03b1)",
                "Thromboxane A2 (TXA2)",
                "Leukotriene B4 (LTB4)",
                "Leukotriene C4 (LTC4)",
                "Leukotriene D4 (LTD4)",
                "Leukotriene E4 (LTE4)",
                "Retinol (Vitamin A)",
                "Cholecalciferol (Vitamin D3)",
                "Tocopherol (Vitamin E)",
                "Ascorbic Acid (Vitamin C)"
            ],
            "true_referents": [
                "(+)-vernolic acid",
                "(-)-vernolic acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(4Z,7Z,13Z,16Z,19Z)-10,11-epoxydocosapentaenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(9R,10S)-9,10-epoxyoctadecanoic acid",
                "(9S,10R)-epoxyoctadecanoic acid",
                "(R)-lipoic acid",
                "(S)-lipoic acid",
                "4'-oxomacrophorin D",
                "4,5-leukotriene A4",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "9,10-epoxyoctadecanoic acid",
                "Demethyl-harzianic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid",
                "juvenile hormone III acid",
                "leukotriene A4",
                "lipoic acid"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": "[\n    \"Bile acid (BA)\", \n    \"Cholic acid\", \n    \"Chenodeoxycholic acid\", \n    \"Deoxycholic acid\", \n    \"Lithocholic acid\", \n    \"Ursodeoxycholic acid\", \n    \"Glycochenodeoxycholic acid\", \n    \"Glycocholic acid\", \n    \"Taurocholic acid\", \n    \"Taurochenodeoxycholic acid\", \n    \"Deoxyglycocholic acid\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxycholate\", \n    \"Cholate\", \n    \"Chenodeoxycholate\", \n    \"Lithocholate\", \n    \"Ursodeoxycholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglycocholate\", \n    \"Glycochenodeoxycholate\", \n    \"Glycocholate\", \n    \"Deoxyglyco",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            "Arachidonic acid (ARA)",
            "Prostacyclin (PGI2)",
            "Thromboxane A2 (TXA2)",
            "Cholesterol",
            "Ergosterol",
            "Lanosterol",
            "Cycloartenol",
            "24,25-Dihydrolanosterol",
            "4-Methylsterol",
            "Obtusifoliol",
            "Gramisterol",
            "4-Alpha-Methylsterol",
            "Sitosterol",
            "Stigmasterol",
            "Fucosterol",
            "Campesterol",
            "Brassicasterol",
            "Cholestanol",
            "Coprostanol",
            "Cholesterol sulfate",
            "Cholesteryl acetate",
            "Cholesteryl oleate",
            "Cholesteryl linoleate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Arachidonic acid (ARA)",
                "Prostacyclin (PGI2)",
                "Thromboxane A2 (TXA2)",
                "Cholesterol",
                "Ergosterol",
                "Lanosterol",
                "Cycloartenol",
                "24,25-Dihydrolanosterol",
                "4-Methylsterol",
                "Obtusifoliol",
                "Gramisterol",
                "4-Alpha-Methylsterol",
                "Sitosterol",
                "Stigmasterol",
                "Fucosterol",
                "Campesterol",
                "Brassicasterol",
                "Cholestanol",
                "Coprostanol",
                "Cholesterol sulfate",
                "Cholesteryl acetate",
                "Cholesteryl oleate",
                "Cholesteryl linoleate"
            ],
            "true_referents": [
                "(12S)-hydroperoxy-(14R,15S)-epoxy-(5Z,8Z,10E)-icosatrienoic acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(5S)-hydroperoxy-(14R,15S)-epoxy-(6E,8Z,11Z)-icosatrienoic acid",
                "(5Z,8R,9Z,11Z,14Z)-8,9-epoxyicosatetraenoic acid",
                "(5Z,8Z,11Z,17Z)-14,15-epoxyicosatetraenoic acid",
                "(5Z,8Z,14Z,17Z)-11,12-epoxyicosatetraenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(8S)-hydroperoxy-(14S,15R)-epoxy-(5Z,9E,11Z)-icosatrienoic acid",
                "11,12-epoxy-(5Z,8Z,14Z)-icosatrienoyl-CoA",
                "11,12-epoxy-20-hydroxy-(5Z,8Z,14Z)-icosatrienoic acid",
                "4'-oxomacrophorin D",
                "4,5-epoxy-7z,10z,13z,16z,19z-docosapentaenoic acid, methyl ester",
                "4,5-leukotriene A4",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "8(9)-EET methyl ester",
                "8-Hydroxy-9,10-epoxystearic acid",
                "9,10-epoxyoctadecanoic acid",
                "DG(13D5/11M5/0:0)",
                "Dihydrowyerol",
                "Ficifuranone A",
                "Flavodonfuran",
                "Ligerin",
                "Oxazoltriene acid",
                "Tricycloalternarene A",
                "Tricycloalternarene L",
                "Wyerol",
                "Zopfiellamide B",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid",
                "epoxydocosatetraenoic acid",
                "leukotriene A4"
            ],
            "TP": 0,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "heterocyclic fatty acid",
        "domain": "chemistry",
        "response": [
            [
                "Canonical name",
                "Docosahexaenoic acid"
            ],
            [
                "Canonical name",
                "Cholesterol"
            ],
            [
                "Canonical name",
                "Bilirubin"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Docosahexaenoic acid",
                "Cholesterol",
                "Bilirubin"
            ],
            "true_referents": [
                "(-)-vernolic acid",
                "(4Z,7Z,10Z,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "(7Z,9E,11E,16Z,19Z)-13,14-epoxydocosapentaenoic acid",
                "4'-oxomacrophorin D",
                "7,8-epoxy,17-hydroxy-(9E,11E,13Z,15E,19Z)-docosapentaenoic acid",
                "cis-9,10-epoxyoctadecanoic acid",
                "epoxydocosapentaenoic acid"
            ],
            "TP": 0,
            "FP": 3,
            "FN": 0
        }
    }
]