[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (Val)",
            "Monensin (Mon)",
            "Nigericin (Nig)",
            "Gramicidin D (G-D)",
            "Carbenicillin (Carb)",
            "Polymyxin B (PMB)",
            "Aureobasidin A (AurA)",
            "Cyclic Peptide Ionophore A (CPIA)",
            "Dipicolinic acid (DPA)",
            "Calicheamicin (Cal)",
            "Cyclosporin A (CyA)",
            "Lipopeptide (Lipopep)",
            "Phenylarsine oxide (PAO)",
            "Bis-(2-ethylhexyl) sodium sulfosuccinate (AOT)",
            "Dihexadecyl phosphate (DHDP)",
            "Bile salts (BileS)",
            "Dioctyl sodium sulfosuccinate (AOS)",
            "Sodium dodecyl sulfate (SDS)",
            "Pentamidine (Penta)",
            "Dibucaine (Dibu)",
            "Tridemorph (Trid)",
            "Meglumine (Megl)",
            "Sodium caprylate (NaCap)",
            "Sodium lauryl sulfate (SLS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Monensin A",
                "Nigericin"
            ],
            "mismatches": [
                "Gramicidin D (G-D)",
                "Carbenicillin (Carb)",
                "Polymyxin B (PMB)",
                "Aureobasidin A (AurA)",
                "Cyclic Peptide Ionophore A (CPIA)",
                "Dipicolinic acid (DPA)",
                "Calicheamicin (Cal)",
                "Cyclosporin A (CyA)",
                "Lipopeptide (Lipopep)",
                "Phenylarsine oxide (PAO)",
                "Bis-(2-ethylhexyl) sodium sulfosuccinate (AOT)",
                "Dihexadecyl phosphate (DHDP)",
                "Bile salts (BileS)",
                "Dioctyl sodium sulfosuccinate (AOS)",
                "Sodium dodecyl sulfate (SDS)",
                "Pentamidine (Penta)",
                "Dibucaine (Dibu)",
                "Tridemorph (Trid)",
                "Meglumine (Megl)",
                "Sodium caprylate (NaCap)",
                "Sodium lauryl sulfate (SLS)"
            ],
            "true_referents": [
                "(S,S,S)-avenic acid A",
                "3''-deamino-3''-oxonicotianamine",
                "3-epi-3-hydroxy-2'-deoxymugineic acid",
                "3-epi-3-hydroxymugineic acid",
                "Gramicidin A",
                "N(5)-[(S)-citryl]-D-ornithine(2-)",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "beauvericin",
                "bisucaberin B",
                "calcium ionophore",
                "carboxymycobactin",
                "chlortetracycline",
                "desferricoprogen B(3-)",
                "desferricoprogen(3-)",
                "enniatin",
                "griseochelin",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid sodium",
                "monensin A",
                "mugineic acid",
                "myxochelin B",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "pseudomonine",
                "pyrithione",
                "rhodotorulic acid",
                "staphyloferrin B",
                "tridodecylamine",
                "valinomycin",
                "vibriobactin"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "A23187 (A23187)",
            "Albendazole",
            "Bambermycins",
            "Bambermycin",
            "Chloride ionophore",
            "Carbonyl cyanide m-chlorophenylhydrazone (CCCP)",
            "Carbonyl cyanide p-trifluoromethoxyphenylhydrazone (FCCP)",
            "Cation ionophore",
            "Cerulenin",
            "Cerivastatin",
            "Cyclosporin A",
            "Dinactin",
            "Dioxyquin",
            "Dinitrophenol",
            "Erythromycin A",
            "Furea",
            "Halichondrin B",
            "Lasalocid A",
            "Monensin",
            "Nigericin",
            "Palytoxin",
            "Phenylarsine oxide",
            "Salinomycin",
            "Valinomycin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "Nigericin",
                "Salinomycin",
                "Valinomycin"
            ],
            "mismatches": [
                "A23187 (A23187)",
                "Albendazole",
                "Bambermycins",
                "Bambermycin",
                "Chloride ionophore",
                "Carbonyl cyanide m-chlorophenylhydrazone (CCCP)",
                "Cation ionophore",
                "Cerulenin",
                "Cerivastatin",
                "Cyclosporin A",
                "Dinactin",
                "Dioxyquin",
                "Dinitrophenol",
                "Erythromycin A",
                "Furea",
                "Halichondrin B",
                "Lasalocid A",
                "Monensin",
                "Palytoxin",
                "Phenylarsine oxide"
            ],
            "true_referents": [
                "2'-deoxymugineic acid",
                "3''-deamino-3''-oxonicotianamine",
                "3-epi-3-hydroxy-2'-deoxymugineic acid",
                "CCCP",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "alborixin",
                "bisucaberin B",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "cefiderocol",
                "chlortetracycline",
                "chrysobactin",
                "coelichelin",
                "coelichelin(3-)",
                "deferrichrome",
                "desferrialbomycin epsilon",
                "desferrialbomycins",
                "desferriexochelin 772MS",
                "desferrioxamine E",
                "dinophysistoxin 1",
                "dinophysistoxin 2",
                "enniatin",
                "enniatin A",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "myxochelin B",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "pyrithione",
                "quinolobactin",
                "staphyloferrin A",
                "staphyloferrin B",
                "valinomycin",
                "vanchrobactin"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (Val)",
            "Gramicidin A",
            "Nigericin",
            "Monensin",
            "A23187 (Calcimycin)",
            "Lasalocid",
            "Salinomycin",
            "Ionomycin",
            "Nonactin",
            "Antimycin A",
            "Alamethicin",
            "Beomycin",
            "Lactobacillin",
            "Enniatin B",
            "X-537A",
            "Lumichrome",
            "FCCP (Carbonyl cyanide-p-trifluoromethoxyphenylhydrazone)",
            "Dinitrophenol",
            "Nigericin",
            "A23187 (Calcimycin)",
            "Cyclosporine A",
            "Rotenone",
            "Oligomycin",
            "Nigericin",
            "Pentachlorophenol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gramicidin A",
                "Nigericin",
                "Lasalocid",
                "Salinomycin",
                "Ionomycin",
                "Enniatin B",
                "Carbonyl cyanide-p-trifluoromethoxyphenylhydrazone"
            ],
            "mismatches": [
                "Valinomycin (Val)",
                "Monensin",
                "A23187 (Calcimycin)",
                "Nonactin",
                "Antimycin A",
                "Alamethicin",
                "Beomycin",
                "Lactobacillin",
                "X-537A",
                "Lumichrome",
                "Dinitrophenol",
                "Cyclosporine A",
                "Rotenone",
                "Oligomycin",
                "Pentachlorophenol"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "(S,R,R)-nicotianamine",
                "3''-deamino-3''-oxonicotianamine",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "deferrichrome",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "enterobactin",
                "enterobactin(6-)",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "nigericin",
                "pyrithione",
                "siderophore",
                "staphyloferrin A",
                "staphyloferrin B",
                "valinomycin"
            ],
            "TP": 7,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (VAL)",
            "Monensin (MON)",
            "Nystatin (NYST)",
            "Nigericin (NIG)",
            "Lasalocid A (LAS)",
            "Salinomycin (SAL)",
            "Tunicamycin (TUN)",
            "A23187",
            "Gramicidin A (GRAM)",
            "Nonactin",
            "Futalosine",
            "X-537A",
            "BP3",
            "Ionomycin",
            "Calciumophore 1",
            "Crown ethers (e.g., 18-crown-6)",
            "Cryptands (e.g., Kryptofix 222)",
            "Polyether antibiotics",
            "Synthetic azacrown ethers",
            "Triphenylmethylphosphonium chloride",
            "Tetraethylammonium bromide",
            "Adamantane-based ionophores",
            "Calixarenes",
            "Cyclodextrins"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Nigericin",
                "Salinomycin",
                "Gramicidin A",
                "Ionomycin"
            ],
            "mismatches": [
                "Monensin (MON)",
                "Nystatin (NYST)",
                "Lasalocid A (LAS)",
                "Tunicamycin (TUN)",
                "A23187",
                "Nonactin",
                "Futalosine",
                "X-537A",
                "BP3",
                "Calciumophore 1",
                "Crown ethers (e.g., 18-crown-6)",
                "Cryptands (e.g., Kryptofix 222)",
                "Polyether antibiotics",
                "Synthetic azacrown ethers",
                "Triphenylmethylphosphonium chloride",
                "Tetraethylammonium bromide",
                "Adamantane-based ionophores",
                "Calixarenes",
                "Cyclodextrins"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "(S,S,S)-avenic acid A",
                "3''-deamino-3''-oxonicotianamine",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "Salinomycin",
                "beauvericin",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "deferrichrome",
                "desferrialbomycin delta1",
                "desferricoprogen B(3-)",
                "desferricoprogen(3-)",
                "desferriexochelin 772MS",
                "diglucosyl-enterobactin",
                "dinophysistoxin 1",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "enniatin B4",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "nigericin",
                "petrobactin(1+)",
                "phytosiderophore",
                "potassium ionophore",
                "pseudomonine",
                "quinolobactin",
                "tridodecylamine",
                "valinomycin"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin",
            "Nigericin",
            "Monensin",
            "Lasalocid",
            "Gramicidin",
            "A23187 (Calcimycin)",
            "Ionomycin",
            "Salinomycin",
            "Beauvericin",
            "Enniatin",
            "Nonactin",
            "Antimycin A",
            "X-537A (Lasalocid A)",
            "Maduramicin",
            "Narasin",
            "Semduramicin",
            "Tetronasin",
            "Dinitrophenol",
            "Carbonyl cyanide m-chlorophenyl hydrazone (CCCP)",
            "Protonophore",
            "Sodium ionophore III",
            "ETH 129",
            "ETH 2120",
            "ETH 5506"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Nigericin",
                "Salinomycin",
                "Beauvericin",
                "Enniatin",
                "Ionomycin",
                "Lasalocid",
                "Gramicidin",
                "Carbonyl cyanide m-chlorophenyl hydrazone (CCCP)"
            ],
            "mismatches": [
                "Monensin",
                "A23187 (Calcimycin)",
                "Nonactin",
                "Antimycin A",
                "X-537A (Lasalocid A)",
                "Maduramicin",
                "Narasin",
                "Semduramicin",
                "Tetronasin",
                "Dinitrophenol",
                "Protonophore",
                "Sodium ionophore III",
                "ETH 129",
                "ETH 2120",
                "ETH 5506"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "3''-deamino-3''-oxonicotianamine",
                "CCCP",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "alborixin",
                "bafilomycin A1",
                "beauvericin",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "enterobactin(6-)",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "siderophore",
                "valinomycin"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (Val)",
            "Gramicidin A (GrA)",
            "Monensin (Mon)",
            "Nigericin (Nig)",
            "Lasalocid (Las)",
            "A23187 (A23187)",
            "Calcimycin (Calc)",
            "CCCP (Carbonyl cyanide m-chlorophenyl hydrazone)",
            "Dinitrophenol (DNP)",
            "Ethyl 4-aminobenzoate (Ethyl PABA)",
            "Sodium ionophore X (Sodium ionophore X)",
            "Bacitracin (Bac)",
            "Ionomycin (Iono)",
            "Syringomycin E (Syr E)",
            "Benzyl alcohol (BzOH)",
            "Phorbol myristate acetate (PMA)",
            "Chloroquine (CQ)",
            "Amphotericin B (AmB)",
            "Pyrithione (Py)",
            "Thapsigargin (Thap)",
            "Aurovertin (Au)",
            "Oligomycin (Oligo)",
            "Ruthenium red (RuRed)",
            "Thioflavin T (ThT)",
            "Kainic acid (KA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Gramicidin A",
                "Nigericin",
                "Ionomycin",
                "Pyrithione"
            ],
            "mismatches": [
                "Monensin",
                "Lasalocid",
                "A23187",
                "Calcimycin",
                "CCCP",
                "Dinitrophenol",
                "Ethyl 4-aminobenzoate",
                "Sodium ionophore X",
                "Bacitracin",
                "Syringomycin E",
                "Benzyl alcohol",
                "Phorbol myristate acetate",
                "Chloroquine",
                "Amphotericin B",
                "Thapsigargin",
                "Aurovertin",
                "Oligomycin",
                "Ruthenium red",
                "Thioflavin T",
                "Kainic acid"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "(R,S,S)-nicotianamine",
                "(S,R,R)-nicotianamine",
                "(S,S,S)-nicotianamine",
                "2'-deoxymugineic acid",
                "3''-deamino-3''-oxonicotianamine",
                "CCCP",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "bafilomycin A1",
                "beauvericin",
                "bisucaberin B",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "desferrialbomycin epsilon",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin B",
                "griseochelin",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "myxochelin B",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "pseudomonine",
                "pyoverdine",
                "pyrithione",
                "quinolobactin",
                "rhodotorulic acid",
                "valinomycin",
                "vanchrobactin"
            ],
            "TP": 5,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (VAL)",
            "Monensin (MON)",
            "Calcimycin (CAL)",
            "Ionomycin (ION)",
            "Gramicidin (GRAM)",
            "Nonactin (NON)",
            "Salinomycin (SAL)",
            "Nigericin (NIG)",
            "A23187 (A23)",
            "Lasalocid (LAS)",
            "X537A (X53)",
            "Ethidium (ETH)",
            "Amphotericin B (AMP)",
            "Oligomycin (OLI)",
            "Dicyclohexylcarbodiimide (DCC)",
            "CCCP (CCCP)",
            "Gramicidin A (GRAMA)",
            "Gramicidin S (GRAMS)",
            "Gramicidin D (GRAMD)",
            "Nystatin (NYS)",
            "Trifluoperazine (TRI)",
            "Verapamil (VER)",
            "Diltiazem (DIL)",
            "Nifedipine (NIF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Salinomycin",
                "Nigericin",
                "CCCP",
                "Gramicidin A"
            ],
            "mismatches": [
                "Monensin (MON)",
                "Calcimycin (CAL)",
                "Ionomycin (ION)",
                "Gramicidin (GRAM)",
                "Nonactin (NON)",
                "A23187 (A23)",
                "Lasalocid (LAS)",
                "X537A (X53)",
                "Ethidium (ETH)",
                "Amphotericin B (AMP)",
                "Oligomycin (OLI)",
                "Dicyclohexylcarbodiimide (DCC)",
                "Gramicidin S (GRAMS)",
                "Gramicidin D (GRAMD)",
                "Nystatin (NYS)",
                "Trifluoperazine (TRI)",
                "Verapamil (VER)",
                "Diltiazem (DIL)",
                "Nifedipine (NIF)"
            ],
            "true_referents": [
                "(S,R,R)-nicotianamine",
                "(S,S,S)-avenic acid A",
                "3''-deamino-3''-oxonicotianamine",
                "3-epi-3-hydroxy-2'-deoxymugineic acid",
                "3-epi-3-hydroxymugineic acid",
                "CCCP",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "Salinomycin",
                "bafilomycin A1",
                "bisucaberin B",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "desferrialbomycin delta1",
                "desferrialbomycin delta2",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin A",
                "enterobactin(1-)",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin sodium salt",
                "nigericin",
                "petrobactin(1+)",
                "pseudomonine",
                "pyrithione",
                "sideramine",
                "tridodecylamine",
                "valinomycin",
                "vibrioferrin(3-)",
                "yersiniabactin"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin",
            "Gramicidin A",
            "A23187 (Calcimycin)",
            "Monensin",
            "Nigericin",
            "Lasalocid",
            "Salinomycin",
            "Ionomycin",
            "X-537A",
            "ETH2120",
            "Nonactin",
            "Pyrithione",
            "Amphotericin B",
            "Cerulenin",
            "Antimycin A",
            "FCCP (Carbonyl cyanide-p-trifluoromethoxyphenylhydrazone)",
            "Dodecylbenzenesulfonate",
            "Cyclosporin A",
            "Bambermycin",
            "Ferrioxamine E",
            "Ro 31-8220",
            "Geldanamycin",
            "Cephalosporin C",
            "Bacitracin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Gramicidin A",
                "Nigericin",
                "Lasalocid",
                "Salinomycin",
                "Ionomycin",
                "Pyrithione",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone"
            ],
            "mismatches": [
                "A23187 (Calcimycin)",
                "Monensin",
                "X-537A",
                "ETH2120",
                "Nonactin",
                "Amphotericin B",
                "Cerulenin",
                "Antimycin A",
                "Dodecylbenzenesulfonate",
                "Cyclosporin A",
                "Bambermycin",
                "Ferrioxamine E",
                "Ro 31-8220",
                "Geldanamycin",
                "Cephalosporin C",
                "Bacitracin"
            ],
            "true_referents": [
                "(S,S,S)-avenic acid A",
                "(S,S,S)-nicotianamine",
                "3''-deamino-3''-oxonicotianamine",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "bisucaberin B",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "cefiderocol",
                "chlortetracycline",
                "coelichelin",
                "coelichelin(3-)",
                "desferriexochelin 772MS",
                "desferrioxamine B(3-)",
                "desferrioxamine E",
                "desferrioxamine E(3-)",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "nigericin",
                "pseudomonine",
                "pyrithione",
                "staphyloferrin A",
                "staphyloferrin B",
                "valinomycin",
                "vanchrobactin"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (Val)",
            "Monensin (Mon)",
            "Nigericin",
            "Ionomycin",
            "A23187 (Calcimycin)",
            "Gramicidin D",
            "Salinomycin",
            "Lasalocid",
            "Carbonyl cyanide m-chlorophenyl hydrazone (CCCP)",
            "Carbonyl cyanide p-trifluoromethoxyphenylhydrazone (FCCP)",
            "Nonactin",
            "18-Crown-6",
            "Amphotericin B",
            "Sebifungicidin",
            "Lasalocid A",
            "Gramicidin A",
            "Cyclopiazonic acid",
            "Fragin",
            "Isonomycin",
            "Methyl valinomycin",
            "Ethyl ionophore",
            "X-537A",
            "Rhopo ionophore",
            "Saricolysin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Nigericin",
                "Ionomycin",
                "Salinomycin",
                "Lasalocid",
                "Gramicidin A"
            ],
            "mismatches": [
                "Monensin (Mon)",
                "A23187 (Calcimycin)",
                "Gramicidin D",
                "Carbonyl cyanide m-chlorophenyl hydrazone (CCCP)",
                "Carbonyl cyanide p-trifluoromethoxyphenylhydrazone (FCCP)",
                "Nonactin",
                "18-Crown-6",
                "Amphotericin B",
                "Sebifungicidin",
                "Lasalocid A",
                "Cyclopiazonic acid",
                "Fragin",
                "Isonomycin",
                "Methyl valinomycin",
                "Ethyl ionophore",
                "X-537A",
                "Rhopo ionophore",
                "Saricolysin"
            ],
            "true_referents": [
                "3''-deamino-3''-oxonicotianamine",
                "CCCP",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "Salinomycin",
                "bisucaberin B",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "desferricoprogen",
                "desferricoprogen B",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mugineic acid",
                "mutalomycin",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "pseudomonine",
                "pyrithione",
                "quinolobactin",
                "schizokinen",
                "sideramine",
                "staphyloferrin A",
                "valinomycin",
                "vanchrobactin"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (VAL)",
            "Gramicidin A (gA)",
            "Nigericin (NIG)",
            "Monensin (MON)",
            "Ionomycin (ION)",
            "A23187 (Calcimycin)",
            "Salinomycin (SAL)",
            "Lasalocid A (LAS)",
            "Beauvericin (BEA)",
            "Narasin (NAR)",
            "Enniatin B (ENN B)",
            "Nonactin",
            "Maduramicin",
            "Nystatin",
            "Amphotericin B (AmB)",
            "Carbonyl cyanide m-chlorophenyl hydrazone (CCCP)",
            "Carbonyl cyanide-p-trifluoromethoxyphenylhydrazone (FCCP)",
            "Quercetin",
            "Pyrithione",
            "Niguldipine",
            "ETH 129",
            "Tetranactin",
            "Cereulide",
            "Polyether antibiotics"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Gramicidin A",
                "Nigericin",
                "Ionomycin",
                "Salinomycin",
                "Beauvericin",
                "Enniatin B",
                "Pyrithione",
                "CCCP"
            ],
            "mismatches": [
                "Monensin",
                "A23187 (Calcimycin)",
                "Lasalocid A (LAS)",
                "Narasin",
                "Nonactin",
                "Maduramicin",
                "Nystatin",
                "Amphotericin B (AmB)",
                "Carbonyl cyanide-p-trifluoromethoxyphenylhydrazone (FCCP)",
                "Quercetin",
                "Niguldipine",
                "ETH 129",
                "Tetranactin",
                "Cereulide",
                "Polyether antibiotics"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "(S,S,S)-avenic acid A",
                "3''-deamino-3''-oxonicotianamine",
                "CCCP",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "Salinomycin",
                "alborixin",
                "bafilomycin A1",
                "beauvericin",
                "bisucaberin B",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "desferrioxamine E",
                "enniatin",
                "enniatin A",
                "enniatin A1",
                "enniatin B",
                "enniatin B4",
                "enterobactin(6-)",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "mutalomycin sodium salt",
                "nigericin",
                "petrobactin(1+)",
                "pseudomonine",
                "pyrithione",
                "quinolobactin",
                "sideramine",
                "staphyloferrin A",
                "valinomycin"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin",
            "Nigericin",
            "Monensin (MON)",
            "Salinomycin (SAL)",
            "Lasalocid (LAS)",
            "Ionomycin",
            "Gramicidin A",
            "Gramicidin B",
            "Gramicidin C",
            "Gramicidin D",
            "Gramicidin S",
            "Nonactin",
            "Monactin",
            "Dinactin",
            "Trinactin",
            "Tetranactin",
            "Calcimycin (A23187)",
            "4-Bromo-A23187",
            "Beauvericin",
            "Enniatin A",
            "Enniatin B",
            "Enniatin C",
            "Alamethicin",
            "Amphotericin B (AmB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Nigericin",
                "Salinomycin",
                "Ionomycin",
                "Gramicidin A",
                "Beauvericin",
                "Enniatin A",
                "Enniatin B"
            ],
            "mismatches": [
                "Monensin (MON)",
                "Lasalocid (LAS)",
                "Gramicidin B",
                "Gramicidin C",
                "Gramicidin D",
                "Gramicidin S",
                "Nonactin",
                "Monactin",
                "Dinactin",
                "Trinactin",
                "Tetranactin",
                "Calcimycin (A23187)",
                "4-Bromo-A23187",
                "Enniatin C",
                "Alamethicin",
                "Amphotericin B (AmB)"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "(R,S,S)-nicotianamine",
                "(S,R,R)-nicotianamine",
                "3''-deamino-3''-oxonicotianamine",
                "Gramicidin A",
                "Salinomycin",
                "aerobactin",
                "alborixin",
                "beauvericin",
                "bisucaberin B",
                "chrysobactin",
                "enniatin",
                "enniatin A",
                "enniatin A1",
                "enniatin B",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "nigericin",
                "petrobactin(1+)",
                "pseudomonine",
                "quinolobactin",
                "staphyloferrin B",
                "valinomycin",
                "vanchrobactin"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (Val)",
            "Monensin (Mon)",
            "Nigericin (Nig)",
            "Gramicidin A (GrA)",
            "Nonactin (Non)",
            "Ionomycin (Ion)",
            "Salinomycin (Sal)",
            "Lasalocid (Las)",
            "Calcimycin (Cal)",
            "Beauvericin (Beau)",
            "Enniatins (Enns)",
            "Amphotericin B (AmB)",
            "Nystatin (Nys)",
            "Natamycin (Nat)",
            "Mucidin (Muc)",
            "Trichomycin (Tri)",
            "Duramycin (Dur)",
            "Leptomycin B (LepB)",
            "Syringomycin (Syr)",
            "Filipin (Fil)",
            "Pseudomonic Acid (PsA)",
            "Milbemycin (Mil)",
            "Avermectin (Aver)",
            "Tetranactin (Tet)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Monensin A",
                "Nigericin",
                "Gramicidin A",
                "Ionomycin",
                "Salinomycin",
                "Lasalocid",
                "Beauvericin"
            ],
            "mismatches": [
                "Nonactin",
                "Calcimycin",
                "Enniatins",
                "Amphotericin B",
                "Nystatin",
                "Natamycin",
                "Mucidin",
                "Trichomycin",
                "Duramycin",
                "Leptomycin B",
                "Syringomycin",
                "Filipin",
                "Pseudomonic Acid",
                "Milbemycin",
                "Avermectin",
                "Tetranactin"
            ],
            "true_referents": [
                "(S,S,S)-avenic acid A",
                "3''-deamino-3''-oxonicotianamine",
                "3-hydroxymugineic acid",
                "Gramicidin A",
                "Salinomycin",
                "achromobactin",
                "alborixin",
                "beauvericin",
                "bisucaberin B",
                "calcium ionophore",
                "chlortetracycline",
                "coelichelin(3-)",
                "desferrialbomycin delta1",
                "desferrialbomycin epsilon",
                "desferrialbomycins",
                "enniatin",
                "enniatin A",
                "enniatin A1",
                "enniatin B",
                "enterobactin(1-)",
                "griseochelin",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "mutalomycin sodium salt",
                "nigericin",
                "okadaic acid",
                "petrobactin(1+)",
                "pseudomonine",
                "tridodecylamine",
                "valinomycin",
                "vanchrobactin",
                "yersiniabactin"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Monensin (MON)",
            "Nigericin (NIG)",
            "Valinomycin (VAL)",
            "Gramicidin (GRA)",
            "Ionomycin (ION)",
            "A23187 (A23187)",
            "Calcimycin (CAL)",
            "Lasalocid (LAS)",
            "Salinomycin (SAL)",
            "Narasin (NAR)",
            "Maduramicin (MAD)",
            "Laidlomycin (LAI)",
            "Lysocellin (LYS)",
            "Epimerized Monensin (E-MON)",
            "Dehydromonensin (D-MON)",
            "Dihydromonensin (DH-MON)",
            "Tetronasin (TET)",
            "Semduramicin (SEM)",
            "Halogenated Monensin Analogues (H-MON)",
            "Lonomycin (LON)",
            "Carriomycin (CAR)",
            "Dianemycin (DIA)",
            "Boromycin (BOR)",
            "Dinactin (DIN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nigericin",
                "Valinomycin",
                "Salinomycin"
            ],
            "mismatches": [
                "Monensin (MON)",
                "Gramicidin (GRA)",
                "Ionomycin (ION)",
                "A23187 (A23187)",
                "Calcimycin (CAL)",
                "Lasalocid (LAS)",
                "Narasin (NAR)",
                "Maduramicin (MAD)",
                "Laidlomycin (LAI)",
                "Lysocellin (LYS)",
                "Epimerized Monensin (E-MON)",
                "Dehydromonensin (D-MON)",
                "Dihydromonensin (DH-MON)",
                "Tetronasin (TET)",
                "Semduramicin (SEM)",
                "Halogenated Monensin Analogues (H-MON)",
                "Lonomycin (LON)",
                "Carriomycin (CAR)",
                "Dianemycin (DIA)",
                "Boromycin (BOR)",
                "Dinactin (DIN)"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "24-dehydrozincophorin",
                "3''-deamino-3''-oxonicotianamine",
                "3-epi-3-hydroxy-2'-deoxymugineic acid",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "bafilomycin A1",
                "bisucaberin B",
                "calcium ionophore",
                "carboxymycobactin",
                "chlortetracycline",
                "chrysobactin",
                "coelichelin(3-)",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "griseochelin",
                "indanomycin",
                "ionomycin",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "mutalomycin sodium salt",
                "myxochelin B",
                "nigericin",
                "pseudomonine",
                "valinomycin"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (Val)",
            "Nonactin",
            "Monactin",
            "Dinactin",
            "Enforsin",
            "Nigericin",
            "Monensin",
            "Lasalocid",
            "Carboxin",
            "X-537A",
            "A23187",
            "Calcimycin",
            "Ionophor A",
            "Ionophor B",
            "Fusaricidin",
            "Tyrothricin",
            "Pyrrolidino[1,2-a]indole-1-carboxamide",
            "Calcitonin gene-related peptide",
            "Forskolin",
            "Ruthenium red",
            "Rhodopsin",
            "Cyclosporin A",
            "Gramicidin",
            "Nystatin",
            "Amphotericin B"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nigericin",
                "Lasalocid",
                "Gramicidin"
            ],
            "mismatches": [
                "Valinomycin (Val)",
                "Nonactin",
                "Monactin",
                "Dinactin",
                "Enforsin",
                "Monensin",
                "Carboxin",
                "X-537A",
                "A23187",
                "Calcimycin",
                "Ionophor A",
                "Ionophor B",
                "Fusaricidin",
                "Tyrothricin",
                "Pyrrolidino[1,2-a]indole-1-carboxamide",
                "Calcitonin gene-related peptide",
                "Forskolin",
                "Ruthenium red",
                "Rhodopsin",
                "Cyclosporin A",
                "Nystatin",
                "Amphotericin B"
            ],
            "true_referents": [
                "(R,R,R)-nicotianamine",
                "(R,S,S)-nicotianamine",
                "(S,R,R)-nicotianamine",
                "3''-deamino-3''-oxonicotianamine",
                "3-epi-3-hydroxy-2'-deoxymugineic acid",
                "Gramicidin A",
                "IC202A",
                "IC202C",
                "N(5)-[(S)-citryl]-D-ornithine(2-)",
                "Salinomycin",
                "aerobactin",
                "calcium ionophore",
                "carboxymycobactin",
                "chlortetracycline",
                "chrysobactin",
                "desferriexochelin 772MS",
                "enniatin",
                "enniatin A",
                "enniatin A1",
                "enniatin B",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "pyrithione",
                "quinolobactin",
                "rhodotorulic acid",
                "valinomycin",
                "vanchrobactin",
                "yersiniabactin"
            ],
            "TP": 3,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            "Valinomycin (VAL)",
            "Enniatin (ENN)",
            "Beauvericin (BEA)",
            "Monensin (MON)",
            "Nigericin (NIG)",
            "Salinomycin (SAL)",
            "Lasalocid (LAS)",
            "Septamycin (SEP)",
            "A23187 (Calcimycin)",
            "Ionomycin (ION)",
            "Dicyclohexyl-18-crown-6 (DCHC)",
            "Naphthoquinone (NQ)",
            "Dinactin (DIN)",
            "Etomycin (ETM)",
            "Granicidin (GRA)",
            "Alamethicin (ALM)",
            "Zinniol (ZIN)",
            "Kryptofix (KRY)",
            "Cryptofix (CRY)",
            "Monactin (MONA)",
            "Dinemycin (DINM)",
            "Fluorinated ionophore (FION)",
            "Proton ionophore (PIO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valinomycin",
                "Enniatin",
                "Beauvericin",
                "Monensin",
                "Nigericin",
                "Salinomycin",
                "Lasalocid",
                "Ionomycin"
            ],
            "mismatches": [
                "Septamycin",
                "A23187 (Calcimycin)",
                "Dicyclohexyl-18-crown-6",
                "Naphthoquinone",
                "Dinactin",
                "Etomycin",
                "Granicidin",
                "Alamethicin",
                "Zinniol",
                "Kryptofix",
                "Cryptofix",
                "Monactin",
                "Dinemycin",
                "Fluorinated ionophore",
                "Proton ionophore"
            ],
            "true_referents": [
                "24-dehydrozincophorin",
                "3''-deamino-3''-oxonicotianamine",
                "Gramicidin A",
                "N-(2,3-dihydroxybenzoyl)serine",
                "Salinomycin",
                "aerobactin",
                "alborixin",
                "beauvericin",
                "bisucaberin B",
                "calcium ionophore",
                "carbonyl cyanide p-trifluoromethoxyphenylhydrazone",
                "chlortetracycline",
                "chrysobactin",
                "coelichelin(3-)",
                "deferrichrome",
                "desferrialbomycin delta1",
                "desferricoprogen(3-)",
                "desferriexochelin 772MS",
                "desferrioxamine E",
                "enniatin",
                "enniatin A",
                "enniatin B",
                "griseochelin",
                "indanomycin",
                "ionomycin",
                "iron ionophore",
                "lasalocid",
                "lasalocid sodium",
                "monensin A",
                "mutalomycin",
                "mutalomycin sodium salt",
                "myxochelin B",
                "nigericin",
                "petrobactin(1+)",
                "potassium ionophore",
                "pseudomonine",
                "quinolobactin",
                "valinomycin",
                "vanchrobactin"
            ],
            "TP": 8,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "ionophore",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            },
            {
                "Referent": "Ionophore",
                "Canonical Name": "Ionophore"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ionophore"
            ],
            "true_referents": [
                "calcium ionophore",
                "iron ionophore",
                "potassium ionophore"
            ],
            "TP": 0,
            "FP": 1,
            "FN": 0
        }
    }
]