[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (DNZ)",
            "Rivastigmine (RIV)",
            "Galantamine (GAN)",
            "Huperzine A (HUP-A)",
            "Neostigmine (NSTM)",
            "Physostigmine (PSTG)",
            "Edrophonium (EDRO)",
            "Pyridostigmine (PYR)",
            "Echothiophate (ECH)",
            "Isoxsuprine (ISOX)",
            "Mecamylamine (MECA)",
            "Bethanechol (BTH)",
            "Ambenonium (AMB)",
            "Metamidophos (MET)",
            "Phorate (PHR)",
            "Carbaryl (CAR)",
            "Phosmet (PHS)",
            "Fenitrothion (FEN)",
            "Chlorpyrifos (CHP)",
            "Malathion (MAL)",
            "Paraoxon (PAR)",
            "Sulfotep (SUL)",
            "Trioxypen (TRI)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Galantamine",
                "Huperzine A",
                "Neostigmine",
                "Physostigmine",
                "Edrophonium",
                "Pyridostigmine",
                "Echothiophate",
                "Ambenonium",
                "Chlorpyrifos",
                "Malathion",
                "Paraoxon"
            ],
            "mismatches": [
                "Isoxsuprine",
                "Mecamylamine",
                "Bethanechol",
                "Metamidophos",
                "Phorate",
                "Carbaryl",
                "Phosmet",
                "Fenitrothion",
                "Sulfotep",
                "Trioxypen"
            ],
            "true_referents": [
                "3-Acetylpyridine",
                "AMBENONIUM",
                "AZINPHOS-METHYL",
                "Ambenonium Chloride",
                "BENZIL",
                "BENZYL SULFOXIDE",
                "Bromophos",
                "Caproctamine",
                "Carbachol",
                "Carbaril",
                "Carbofuran",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "Compound Methamidophos",
                "DECAMETHONIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Dimethyl sulfoxide",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "Ethyl-methyl-[2-(methyl-propoxy-phosphinoylsulfanyl)-ethyl]-sulfonium; methyl sulfate",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine X",
                "Huprine-X",
                "KETAMINE",
                "MALATHION",
                "MEMANTINE",
                "Malaoxon",
                "Malathion",
                "Mesuagenin A",
                "Minaprine",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "O,S-dihexyl methylphosphonothioate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Phenothiazine",
                "Phenthoate",
                "Phoxim",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TRIMEDOXIME",
                "Trientine",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 13,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Cerazette)",
            "Rivastigmine (Exelon)",
            "Galantamine (Reminyl)",
            "Physostigmine (Antilirium)",
            "Edrophonium (Tensilon)",
            "Tacrine (Cognex)",
            "Pyridostigmine (Mestinon)",
            "Safinamide (Xadago)",
            "Huperzine A",
            "Ambenonium",
            "Demecarium",
            "Echothiophate",
            "Donepezil hydrochloride",
            "Rivastigmine tartrate",
            "Galantamine hydrobromide",
            "Physostigmine salicylate",
            "Edrophonium chloride",
            "Tacrine hydrochloride",
            "Pyridostigmine bromide",
            "Huperzine A (extract)",
            "Ambenonium chloride",
            "Demecarium bromide",
            "Echothiophate iodide",
            "Metrifonate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Huperzine A",
                "Ambenonium",
                "Demecarium",
                "Echothiophate",
                "Donepezil hydrochloride",
                "Rivastigmine tartrate",
                "Galantamine hydrobromide",
                "Edrophonium chloride",
                "Tacrine hydrochloride",
                "Pyridostigmine bromide",
                "Ambenonium chloride",
                "Echothiophate iodide"
            ],
            "mismatches": [
                "Donepezil (Cerazette)",
                "Rivastigmine (Exelon)",
                "Galantamine (Reminyl)",
                "Physostigmine (Antilirium)",
                "Edrophonium (Tensilon)",
                "Tacrine (Cognex)",
                "Pyridostigmine (Mestinon)",
                "Safinamide (Xadago)",
                "Huperzine A (extract)",
                "Demecarium bromide",
                "Physostigmine salicylate",
                "Metrifonate"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BENZYLTRIMETHYLAMMONIUM CHLORIDE",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DONEPEZIL",
                "DONEPEZIL HYDROCHLORIDE",
                "Decamethonium",
                "Distigmine bromide",
                "Donepezil",
                "Donepezil hydrochloride",
                "Drofenine",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "GALANTAMINE",
                "GALANTAMINE HYDROBROMIDE",
                "Galantamine hydrobromide",
                "HUPERZINE A",
                "Huperzine A",
                "MEMANTINE",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "O,O,S-triethyl thiophosphate",
                "O,S-dihexyl methylphosphonothioate",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PHYSOSTIGMINE SALICYLATE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "Quifenadine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "Rivastigmine tartrate",
                "TACRINE",
                "Tacrine",
                "Tacrine Hydrochloride",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine",
            "Neostigmine",
            "Pyridostigmine",
            "Edrophonium",
            "Rivastigmine",
            "Galantamine",
            "Donepezil",
            "Tacrine",
            "Methanesulfonyl fluoride",
            "Echothiophate",
            "Demecarium",
            "Ambenonium",
            "Isocarboxazid",
            "Eserine",
            "Huperzine A",
            "Malathion",
            "Parathion",
            "Organophosphorus compounds",
            "Carbamates",
            "Benzylisoquinoline alkaloids",
            "Phenylcarbamates",
            "Fenamiphos",
            "Temefos",
            "Echothiophene iodide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Edrophonium",
                "Rivastigmine",
                "Galantamine",
                "Donepezil",
                "Tacrine",
                "Methanesulfonyl fluoride",
                "Echothiophate",
                "Demecarium",
                "Ambenonium",
                "Huperzine A",
                "Malathion"
            ],
            "mismatches": [
                "Isocarboxazid",
                "Eserine",
                "Parathion",
                "Organophosphorus compounds",
                "Carbamates",
                "Benzylisoquinoline alkaloids",
                "Phenylcarbamates",
                "Fenamiphos",
                "Temefos",
                "Echothiophene iodide"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "Azamethiphos",
                "Bromophos",
                "Chlorproethazine",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "Compound Methamidophos",
                "Coumaphos",
                "Cymserine",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Dimefox",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "ETHOPROPAZINE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethopropazine",
                "Ethyl parathion",
                "GALANTAMINE",
                "GALLAMINE TRIETHIODIDE",
                "HUPERZINE A",
                "Huperzine A",
                "ISOBAVACHALCONE",
                "Isovanihuperzine A",
                "MALATHION",
                "Malathion",
                "Methanesulfonyl fluoride",
                "Methyl arachidonylphosphonofluoridate",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PHENSERINE",
                "PHENYLMETHYLSULFONYLFLUORIDE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Phenylcarbamate- 14b",
                "Phenylcarbamate- 9a",
                "Phenylcarbamate- 9b",
                "Phenylcarbamate-26b",
                "Physostigmine",
                "Pyridostigmine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "TOLSERINE",
                "Tacrine",
                "Tacrine Hydrochloride",
                "Tetrachloro-p-benzoquinone",
                "Tolserine",
                "Zanapezil",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Rivastigmine (RIV)",
            "Donepezil (DON)",
            "Galantamine (GAL)",
            "Tacrine (TAC)",
            "Edrophonium (EDR)",
            "Sarin (SAR)",
            "Soman (SOM)",
            "Tabun (TAB)",
            "VX (VX)",
            "Malathion (MAL)",
            "Parathion (PAR)",
            "Diazinon (DIA)",
            "Chlorpyrifos (CPF)",
            "Imidacloprid (IMI)",
            "Carbaryl (CAR)",
            "Aldicarb (ALD)",
            "Methiocarb (MET)",
            "Benomyl (BEN)",
            "Eserine (ESE)",
            "Amblyopia treatment eyedrops (various)",
            "DFP (DFP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Rivastigmine",
                "Donepezil",
                "Galantamine",
                "Tacrine",
                "Edrophonium",
                "Sarin",
                "Soman",
                "Tabun",
                "Malathion",
                "Diazinon",
                "Chlorpyrifos",
                "DFP (Diisopropyl fluorophosphate)"
            ],
            "mismatches": [
                "VX",
                "Parathion",
                "Imidacloprid",
                "Carbaryl",
                "Aldicarb",
                "Methiocarb",
                "Benomyl",
                "Eserine",
                "Amblyopia treatment eyedrops (various)"
            ],
            "true_referents": [
                "(+/-)-SM-21",
                "AMBENONIUM",
                "AZADIRACTIN",
                "BENZIL",
                "BZYX",
                "Benactyzine",
                "Carbaril",
                "Carbofuran",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "Cymserine",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Diazinon",
                "Diazoxon",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Donepezil",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "Icopezil",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "MULBERROFURAN D",
                "Malaoxon",
                "Malathion",
                "Methomyl",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Phenylcarbamate-25b",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "T-82",
                "TACRINE",
                "TOLSERINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Thiodicarb",
                "Tolserine",
                "[3H]galantamine hydrobromide",
                "compound 2f [Jiang <i>et al.</i>, 2018]",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Tacrine (Cognex)",
            "Physostigmine",
            "Neostigmine",
            "Pyridostigmine",
            "Edrophonium",
            "Ambenonium",
            "Demecarium",
            "Echothiophate",
            "Malathion",
            "Parathion",
            "Diazinon",
            "Sarin",
            "Soman",
            "Tabun",
            "VX",
            "Carbaryl",
            "Propoxur",
            "Aldicarb",
            "Metrifonate",
            "Galantamine hydrobromide",
            "Huperzine A"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Galantamine",
                "Tacrine",
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Edrophonium",
                "Ambenonium",
                "Demecarium",
                "Echothiophate",
                "Malathion",
                "Diazinon",
                "Sarin",
                "Soman",
                "Tabun",
                "Metrifonate",
                "Galantamine hydrobromide",
                "Huperzine A"
            ],
            "mismatches": [
                "Parathion",
                "VX",
                "Carbaryl",
                "Propoxur",
                "Aldicarb"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "AD-35",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BENDIOCARB",
                "BENZOIN",
                "BZYX",
                "Carbaril",
                "Carbofuran",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Diazinon",
                "Diazoxon",
                "Dimefox",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "GALANTAMINE HYDROBROMIDE",
                "Galantamine hydrobromide",
                "HUPERZINE A",
                "Huperzine A",
                "MALATHION",
                "MULBERROFURAN D",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PARAOXON",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Paraoxon",
                "Phoxim",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Thiodicarb",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (Eserine)",
            "Neostigmine (Prostigmin)",
            "Pyridostigmine (Mestinon)",
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Carbamate (general class)",
            "Malathion (Ovide)",
            "Parathion (general class)",
            "Sarin (GB)",
            "VX (nerve agent)",
            "Tacrine (Cognex)",
            "Ambenonium (Mytelase)",
            "Edrophonium (Tensilon)",
            "Dichlorvos (DDVP)",
            "Organophosphate (general class)",
            "Soman (GD)",
            "Centrally acting cholinesterase inhibitors (general class)",
            "Bromide (general class)",
            "Galantamine hydrobromide (Razadyne ER)",
            "Echothiophate (Phospholine Iodide)",
            "Dimephosphate (general class)",
            "Metrifonate (Neguvon)",
            "Butyrylcholinesterase inhibitors (general class)",
            "Fentanyl (cholinergic effects in overdose)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine (Eserine)",
                "Neostigmine (Prostigmin)",
                "Pyridostigmine (Mestinon)",
                "Donepezil (Aricept)",
                "Rivastigmine (Exelon)",
                "Galantamine (Razadyne)",
                "Malathion (Ovide)",
                "Sarin (GB)",
                "Tacrine (Cognex)",
                "Ambenonium (Mytelase)",
                "Edrophonium (Tensilon)",
                "Dichlorvos (DDVP)",
                "Soman (GD)",
                "Galantamine hydrobromide (Razadyne ER)",
                "Echothiophate (Phospholine Iodide)"
            ],
            "mismatches": [
                "Carbamate (general class)",
                "Parathion (general class)",
                "VX (nerve agent)",
                "Organophosphate (general class)",
                "Centrally acting cholinesterase inhibitors (general class)",
                "Bromide (general class)",
                "Dimephosphate (general class)",
                "Metrifonate (Neguvon)",
                "Butyrylcholinesterase inhibitors (general class)",
                "Fentanyl (cholinergic effects in overdose)"
            ],
            "true_referents": [
                "2-Bromo LSD",
                "AD-35",
                "AMBENONIUM",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Decamethonium",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Distigmine bromide",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "Ethyl parathion",
                "GALANTAMINE",
                "GALANTAMINE HYDROBROMIDE",
                "Galantamine hydrobromide",
                "Hexafluorenium bromide",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "Malathion",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Phenylcarbamate- 9a",
                "Phenylcarbamate- 9b",
                "Phenylcarbamate-26b",
                "Phosphoric acid 2,2-dimethyl-propyl ester diethyl ester",
                "Phosphoric acid 3,3-dimethyl-butyl ester diethyl ester",
                "Phosphoric acid 4,4-dimethyl-pentyl ester diethyl ester",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (PHY)",
            "Galantamine (GAL)",
            "Donepezil (DON)",
            "Rivastigmine (RIV)",
            "Tacrine (TAC)",
            "Huperzine A (HUP)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Edrophonium (EDR)",
            "Demecarium (DEM)",
            "Echothiophate (ECHO)",
            "Isoflurophate (ISO)",
            "Malathion (MAL)",
            "Parathion (PAR)",
            "Sarin (SAR)",
            "Soman (SOM)",
            "Tabun (TAB)",
            "VX Nerve Gas (VX)",
            "Metrifonate (MET)",
            "Phosmet (PHO)",
            "Tetrachlorvinphos (TET)",
            "Chlorpyrifos (CHL)",
            "Diazinon (DIA)",
            "Carbaryl (CAR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Galantamine",
                "Donepezil",
                "Rivastigmine",
                "Tacrine",
                "Huperzine A",
                "Neostigmine",
                "Pyridostigmine",
                "Edrophonium",
                "Demecarium",
                "Echothiophate",
                "Isoflurophate",
                "Malathion",
                "Sarin",
                "Soman",
                "Tabun",
                "Chlorpyrifos",
                "Diazinon",
                "Physostigmine"
            ],
            "mismatches": [
                "Physostigmine (PHY)",
                "Parathion (PAR)",
                "VX Nerve Gas (VX)",
                "Metrifonate (MET)",
                "Phosmet (PHO)",
                "Tetrachlorvinphos (TET)",
                "Carbaryl (CAR)"
            ],
            "true_referents": [
                "(+/-)-SM-21",
                "AZINPHOS-METHYL",
                "BENZIL",
                "Carbaril",
                "Carbofuran",
                "Chlorfenvinphos",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Diazinon",
                "Diazoxon",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "Malaoxon",
                "Malathion",
                "Methomyl",
                "Methyl-phosphonothioic acid (2,2-dimethyl-propyl) ester ethyl ester",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "O,O,S-triethyl thiophosphate",
                "O,S-dihexyl methylphosphonothioate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tetrachloro-p-benzoquinone",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 18,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Rivastigmine (Exelon)",
            "Donepezil (Aricept)",
            "Galantamine (Razadyne)",
            "Tacrine (Cognex)",
            "Physostigmine",
            "Neostigmine",
            "Pyridostigmine (Mestinon)",
            "Edrophonium",
            "Ambenonium",
            "Echothiophate",
            "Malathion",
            "Parathion",
            "Dichlorvos",
            "Carbamates",
            "Organophosphates",
            "Sarin",
            "Tabun",
            "VX nerve agent",
            "Echothiophate (Phospholine Iodide)",
            "Isofluorophate",
            "Tolserine",
            "Phenyl saligenin phosphate",
            "Phenserine",
            "Huperzine A"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rivastigmine",
                "Donepezil",
                "Galantamine",
                "Tacrine",
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Edrophonium",
                "Ambenonium",
                "Echothiophate",
                "Malathion",
                "Dichlorvos",
                "Sarin",
                "Tabun",
                "Tolserine",
                "Phenserine",
                "Huperzine A"
            ],
            "mismatches": [
                "Rivastigmine (Exelon)",
                "Donepezil (Aricept)",
                "Galantamine (Razadyne)",
                "Tacrine (Cognex)",
                "Pyridostigmine (Mestinon)",
                "Parathion",
                "Carbamates",
                "Organophosphates",
                "VX nerve agent",
                "Echothiophate (Phospholine Iodide)",
                "Isofluorophate",
                "Phenyl saligenin phosphate"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "4-ISOPROPYLPHENSERINE",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "Cymserine",
                "DIZOCILPINE",
                "DONEPEZIL",
                "Decamethonium",
                "Desoxypeganine",
                "Dichlorvos",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "ISOFLUROPHATE",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "Malathion",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "O,S-dihexyl methylphosphonothioate",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PHYSOSTIGMINE SALICYLATE",
                "PYRIDOSTIGMINE",
                "Phenylcarbamate- 9a",
                "Phenylcarbamate- 9b",
                "Phenylcarbamate-26b",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "Sarin",
                "T-82",
                "TACRINE",
                "TOLSERINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tolserine",
                "Trichlorfon",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 17,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Neostigmine",
            "Pyridostigmine",
            "Physostigmine",
            "Echothiophate",
            "Tacrine (Cognex)",
            "Ambenonium",
            "Edrophonium",
            "Metrifonate",
            "Parathion",
            "VX",
            "Sarin",
            "Soman",
            "BW284c51",
            "Isoflurane",
            "Isoxsuprine",
            "Fesoterodine",
            "Pyridostigmine bromide",
            "Tetrahydroaminoacridine",
            "Carbamylcholine",
            "Prostigmine",
            "Benactyzine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neostigmine",
                "Pyridostigmine",
                "Physostigmine",
                "Echothiophate",
                "Tacrine (Cognex)",
                "Ambenonium",
                "Edrophonium",
                "Metrifonate",
                "Sarin",
                "Soman",
                "Pyridostigmine bromide",
                "Benactyzine"
            ],
            "mismatches": [
                "Donepezil (Aricept)",
                "Rivastigmine (Exelon)",
                "Galantamine (Razadyne)",
                "Parathion",
                "VX",
                "BW284c51",
                "Isoflurane",
                "Isoxsuprine",
                "Fesoterodine",
                "Tetrahydroaminoacridine",
                "Carbamylcholine",
                "Prostigmine"
            ],
            "true_referents": [
                "2-Fluorotoluene",
                "3-Acetylpyridine",
                "ACRIDINE",
                "AD-35",
                "AMBENONIUM",
                "ATHEROSPERMIDINE",
                "Acetyl choline",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "BI-4924",
                "BW284C51",
                "BZYX",
                "Benactyzine",
                "CCT251921",
                "Carbachol",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "DONEPEZIL",
                "Decamethonium",
                "Dimefox",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "ETHOPROPAZINE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethopropazine",
                "Ethyl parathion",
                "GALANTAMINE",
                "Hexafluorenium bromide",
                "Huprine-X",
                "KETAMINE",
                "MALATHION",
                "MINAPRINE",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "Minaprine",
                "N-TRANS-FERULOYLDOPAMINE",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Paraoxon",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RESERPINE",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "TACRINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (E2020)",
            "Rivastigmine (ENA-713)",
            "Galantamine (GAL)",
            "Tacrine (THA)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Edrophonium (EDR)",
            "Huperzine A (HupA)",
            "Metrifonate (MTF)",
            "Echothiophate (ECH)",
            "Malathion (MAL)",
            "Parathion (PAR)",
            "Chlorpyrifos (CPF)",
            "Diazinon (DZN)",
            "Sarin (GB)",
            "VX nerve agent",
            "Tabun (GA)",
            "Soman (GD)",
            "Paraoxon (POX)",
            "Dichlorvos (DDVP)",
            "Acephate (ACE)",
            "Dimethoate (DMT)",
            "Carbaryl (CBR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil (E2020)",
                "Rivastigmine (ENA-713)",
                "Galantamine (GAL)",
                "Tacrine (THA)",
                "Physostigmine (PHY)",
                "Neostigmine (NEO)",
                "Pyridostigmine (PYR)",
                "Edrophonium (EDR)",
                "Huperzine A (HupA)",
                "Metrifonate (MTF)",
                "Echothiophate (ECH)",
                "Malathion (MAL)",
                "Chlorpyrifos (CPF)",
                "Diazinon (DZN)",
                "Sarin (GB)",
                "Tabun (GA)",
                "Soman (GD)",
                "Paraoxon (POX)",
                "Dichlorvos (DDVP)"
            ],
            "mismatches": [
                "Parathion (PAR)",
                "VX nerve agent",
                "Acephate (ACE)",
                "Dimethoate (DMT)",
                "Carbaryl (CBR)"
            ],
            "true_referents": [
                "3-Acetylpyridine",
                "AD-35",
                "BENZOIN",
                "Carbaril",
                "Carbofuran",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Diazinon",
                "Diazoxon",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl acetate",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "Malaoxon",
                "Malathion",
                "Methanesulfonyl fluoride",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Phenylcarbamate-25b",
                "Phosphoric acid diethyl ester 1-ethyl-propyl ester",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tabun",
                "Tacrine",
                "Tacrine Hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Tacrine (Cognex)",
            "Pyridostigmine (Mestinon)",
            "Neostigmine (Prostigmin)",
            "Physostigmine (Eserine)",
            "Edrophonium (Enlon)",
            "Demecarium (Humorsol)",
            "Echothiophate (Phospholine Iodide)",
            "Isoflurophate (Floropryl)",
            "Metrifonate",
            "Huperzine A",
            "Phenserine",
            "Tolserine",
            "Phenethylnorspermine",
            "Ladostigil",
            "Onchidal",
            "Diisopropyl fluorophosphate (DFP)",
            "Sarin (GB)",
            "Soman (GD)",
            "Tabun (GA)",
            "VX (methylphosphonothioic acid S-[2-(diisopropylamino)ethyl] O-ethyl ester)",
            "Cyclosarin (GF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rivastigmine (Exelon)",
                "Galantamine (Razadyne)",
                "Tacrine (Cognex)",
                "Pyridostigmine (Mestinon)",
                "Neostigmine (Prostigmin)",
                "Physostigmine (Eserine)",
                "Edrophonium (Enlon)",
                "Demecarium (Humorsol)",
                "Echothiophate (Phospholine Iodide)",
                "Isoflurophate (Floropryl)",
                "Metrifonate",
                "Huperzine A",
                "Phenserine",
                "Tolserine",
                "Onchidal",
                "Diisopropyl fluorophosphate (DFP)",
                "Sarin (GB)",
                "Soman (GD)",
                "Tabun (GA)",
                "Cyclosarin (GF)"
            ],
            "mismatches": [
                "Donepezil (Aricept)",
                "Phenethylnorspermine",
                "Ladostigil",
                "VX (methylphosphonothioic acid S-[2-(diisopropylamino)ethyl] O-ethyl ester)"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "4-ISOPROPYLPHENSERINE",
                "AD-35",
                "BENZIL",
                "Carbaril",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "Cyclosarin (GF)",
                "Cymserine",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "GALANTAMINE",
                "Ganstigmine",
                "HUPERZINE A",
                "Huperzine A",
                "ISOFLUROPHATE",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "Malathion",
                "Methomyl",
                "Methyl-phosphonothioic acid (2,2-dimethyl-propyl) ester ethyl ester",
                "Methyl-phosphonothioic acid (5,5-dimethyl-hexyl) ester ethyl ester",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "ONCHIDAL",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PHYSOSTIGMINE SALICYLATE",
                "PYRIDOSTIGMINE",
                "Phenethylnorcymserine",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "Sarin",
                "T-82",
                "TACRINE",
                "TOLSERINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tolserine",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (DON)",
            "Rivastigmine (RIV)",
            "Galantamine (GAL)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Edrophonium (EDR)",
            "Ambenonium (AMB)",
            "Demecarium (DEM)",
            "Echothiophate (ECO)",
            "Malathion (MAL)",
            "Parathion (PAR)",
            "Diazinon (DIA)",
            "Chlorpyrifos (CHL)",
            "Tacrine (TAC)",
            "Huperzine A (HUP)",
            "Metrifonate (MET)",
            "Phenserine (PHE)",
            "Tolserine (TOL)",
            "Bambuterol (BAM)",
            "Ganstigmine (GAN)",
            "Xanomeline (XAN)",
            "Milameline (MIL)",
            "Sabcomeline (SAB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil (DON)",
                "Rivastigmine (RIV)",
                "Galantamine (GAL)",
                "Physostigmine (PHY)",
                "Neostigmine (NEO)",
                "Pyridostigmine (PYR)",
                "Edrophonium (EDR)",
                "Ambenonium (AMB)",
                "Demecarium (DEM)",
                "Echothiophate (ECO)",
                "Malathion (MAL)",
                "Diazinon (DIA)",
                "Chlorpyrifos (CHL)",
                "Tacrine (TAC)",
                "Huperzine A (HUP)",
                "Phenserine (PHE)",
                "Tolserine (TOL)",
                "Bambuterol (BAM)",
                "Ganstigmine (GAN)"
            ],
            "mismatches": [
                "Parathion (PAR)",
                "Metrifonate (MET)",
                "Xanomeline (XAN)",
                "Milameline (MIL)",
                "Sabcomeline (SAB)"
            ],
            "true_referents": [
                "(-)-ASIMILOBINE",
                "4-ISOPROPYLPHENSERINE",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BAMBUTEROL",
                "Bambuterol Hydrochloride",
                "Carbachol",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Cocaine",
                "Compound Donepezil",
                "Compound Galantamine",
                "Cymserine",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Diazinon",
                "Diazoxon",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "Ganstigmine",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "KETAMINE",
                "MALATHION",
                "MEMANTINE",
                "MET-Carbamyl sulfonate",
                "Malaoxon",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "Milnacipran",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "O,O,S-triethyl thiophosphate",
                "PARAOXON",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Phenothiazine",
                "Phenylcarbamate-30b",
                "Phenylcarbamate-36b",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "RS-1439",
                "Rivastigmine",
                "TACRINE",
                "TOLSERINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tolserine",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Acetylcholinesterase Inhibitor (AChEI)",
            "Butyrylcholinesterase Inhibitor (BChEI)",
            "Donepezil (DON)",
            "Rivastigmine (RIV)",
            "Galantamine (GAL)",
            "Tacrine (TAC)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Edrophonium (EDR)",
            "Demecarium (DEM)",
            "Echothiophate (ECH)",
            "Isoflurophate (ISO)",
            "Parathion (PAR)",
            "Malathion (MAL)",
            "Sarin (SAR)",
            "Soman (SOM)",
            "VX Nerve Agent (VX)",
            "Ambenonium (AMB)",
            "Distigmine (DIS)",
            "Huperzine A (HUP)",
            "Metrifonate (MET)",
            "Pralidoxime (PRA)",
            "Obidoxime (OBI)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil (DON)",
                "Rivastigmine (RIV)",
                "Galantamine (GAL)",
                "Tacrine (TAC)",
                "Physostigmine (PHY)",
                "Neostigmine (NEO)",
                "Pyridostigmine (PYR)",
                "Edrophonium (EDR)",
                "Demecarium (DEM)",
                "Echothiophate (ECH)",
                "Isoflurophate (ISO)",
                "Malathion (MAL)",
                "Sarin (SAR)",
                "Soman (SOM)",
                "Ambenonium (AMB)",
                "Huperzine A (HUP)"
            ],
            "mismatches": [
                "Acetylcholinesterase Inhibitor (AChEI)",
                "Butyrylcholinesterase Inhibitor (BChEI)",
                "Parathion (PAR)",
                "VX Nerve Agent (VX)",
                "Distigmine (DIS)",
                "Metrifonate (MET)",
                "Pralidoxime (PRA)",
                "Obidoxime (OBI)"
            ],
            "true_referents": [
                "(+/-)-SM-21",
                "AMBENONIUM",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Distigmine bromide",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "OBIDOXIME CHLORIDE",
                "OBIDOXIME MESYLATE",
                "Obidoxime chloride",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PRALIDOXIME",
                "PRALIDOXIME CHLORIDE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Physostigmine",
                "Pralidoxime chloride",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "TACRINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (ES)",
            "Neostigmine",
            "Pilocarpine",
            "Carbachol",
            "Edrophonium",
            "Echothiophate",
            "Demecarium",
            "Ambenonium",
            "Donepezil (Aricept)",
            "Galantamine (Reminyl)",
            "Rivastigmine (Exelon)",
            "Tacrine",
            "Pyridostigmine",
            "Pyridostigmine bromide",
            "Neostigmine methylsulfate",
            "Edrophonium chloride",
            "Physostigmine salicylate",
            "Carbamylcholine",
            "Benzydamine",
            "Arecoline",
            "Huperzine A",
            "Phenserine",
            "BW284C51",
            "Galanthamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neostigmine",
                "Carbachol",
                "Edrophonium",
                "Echothiophate",
                "Demecarium",
                "Ambenonium",
                "Tacrine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "Neostigmine methylsulfate",
                "Edrophonium chloride",
                "Physostigmine salicylate",
                "Huperzine A",
                "Phenserine",
                "BW284C51"
            ],
            "mismatches": [
                "Physostigmine (ES)",
                "Pilocarpine",
                "Donepezil (Aricept)",
                "Galantamine (Reminyl)",
                "Rivastigmine (Exelon)",
                "Carbamylcholine",
                "Benzydamine",
                "Arecoline",
                "Galanthamine"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "3-Acetylpyridine",
                "4-ISOPROPYLPHENSERINE",
                "AMBENONIUM",
                "Acetyl choline",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "BENDIOCARB",
                "BENZOIN",
                "BI-4924",
                "BW284C51",
                "CCT251921",
                "Carbachol",
                "Compound Galantamine",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "GALANTAMINE",
                "Gallamine",
                "Ganstigmine",
                "HUPERZINE A",
                "Huperzine A",
                "Ipidacrine",
                "LYCORINE",
                "NEOSTIGMINE",
                "NEOSTIGMINE METHYLSULFATE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PHYSOSTIGMINE SALICYLATE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RESERPINE",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SCOULERINE",
                "TACRINE",
                "Tacrine",
                "Tacrine Hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Tacrine (THA)",
            "Donepezil (Aricept)",
            "Galantamine (Razadyne)",
            "Rivastigmine (Exelon)",
            "Pyridostigmine (Mestinon)",
            "Neostigmine (Prostigmin)",
            "Physostigmine (Eserin)",
            "Echothiophate (Phospholine)",
            "Demecarium (Humorsol)",
            "Edrophonium (Tensilon)",
            "Phenserine",
            "Metrifonate",
            "Benserazide",
            "Velasol",
            "Phisophamine",
            "Carbachol",
            "Carbaryl",
            "Alvocidib",
            "Ipidacon",
            "Ganoderma lucidum",
            "Parathion",
            "Malathion",
            "Obidoxime",
            "Cymserine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tacrine",
                "Donepezil",
                "Galantamine",
                "Rivastigmine",
                "Pyridostigmine",
                "Neostigmine",
                "Physostigmine",
                "Echothiophate",
                "Demecarium",
                "Edrophonium",
                "Phenserine",
                "Metrifonate",
                "Carbachol",
                "Malathion",
                "Obidoxime",
                "Cymserine"
            ],
            "mismatches": [
                "Tacrine (THA)",
                "Donepezil (Aricept)",
                "Galantamine (Razadyne)",
                "Rivastigmine (Exelon)",
                "Pyridostigmine (Mestinon)",
                "Neostigmine (Prostigmin)",
                "Physostigmine (Eserin)",
                "Echothiophate (Phospholine)",
                "Demecarium (Humorsol)",
                "Edrophonium (Tensilon)",
                "Benserazide",
                "Velasol",
                "Phisophamine",
                "Carbaryl",
                "Alvocidib",
                "Ipidacon",
                "Ganoderma lucidum",
                "Parathion"
            ],
            "true_referents": [
                "4-ISOPROPYLPHENSERINE",
                "Acetylcholine chloride",
                "Benactyzine",
                "Bisnorcymserine",
                "Carbachol",
                "Carbaril",
                "Carbofuran",
                "Chlorproethazine",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "Convallatoxin",
                "Cresol",
                "Cymserine",
                "DEMECARIUM",
                "DEOXYVASICINONE",
                "DONEPEZIL",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "Ethyl parathion",
                "GALANTAMINE",
                "Ganoderic acid B",
                "HARMINE",
                "ITOPRIDE",
                "Ipidacrine",
                "Irinotecan",
                "LYCORINE",
                "Lysergic acid diethylamide",
                "MALATHION",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "Mipafox",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "OBIDOXIME CHLORIDE",
                "OBIDOXIME MESYLATE",
                "Obidoxime chloride",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PITOLISANT",
                "PYRIDOSTIGMINE",
                "Phenothiazine",
                "Phoxim",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "TOLSERINE",
                "Tacrine",
                "Tacrine Hydrochloride",
                "VANILLOLOSIDE",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 16,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Acetylcholinesterase inhibitor",
                "Canonical name": "AChEI"
            },
            {
                "Referent": "Galantamine",
                "Canonical name": "GAL"
            },
            {
                "Referent": "Donepezil",
                "Canonical name": "DON"
            },
            {
                "Referent": "Rivastigmine",
                "Canonical name": "RIV"
            },
            {
                "Referent": "Tacrine",
                "Canonical name": "TAC"
            },
            {
                "Referent": "Physostigmine",
                "Canonical name": "PHY"
            },
            {
                "Referent": "Neostigmine",
                "Canonical name": "NEO"
            },
            {
                "Referent": "Baclofen",
                "Canonical name": "BAC"
            },
            {
                "Referent": "Raclopride",
                "Canonical name": "RAC"
            },
            {
                "Referent": "Biperiden",
                "Canonical name": "BI"
            },
            {
                "Referent": "Procyclidine",
                "Canonical name": "PRO"
            },
            {
                "Referent": "Trihexyphenidyl",
                "Canonical name": "TRI"
            },
            {
                "Referent": "Ambenonium",
                "Canonical name": "AMB"
            },
            {
                "Referent": "Pirenzepine",
                "Canonical name": "PIR"
            },
            {
                "Referent": "Physostigmine",
                "Canonical name": "PHY"
            },
            {
                "Referent": "Donepezil",
                "Canonical name": "DON"
            },
            {
                "Referent": "Rivastigmine",
                "Canonical name": "RIV"
            },
            {
                "Referent": "Tacrine",
                "Canonical name": "TAC"
            },
            {
                "Referent": "Galantamine",
                "Canonical name": "GAL"
            },
            {
                "Referent": "Neostigmine",
                "Canonical name": "NEO"
            },
            {
                "Referent": "Physostigmine",
                "Canonical name": "PHY"
            },
            {
                "Referent": "Neostigmine",
                "Canonical name": "NEO"
            },
            {
                "Referent": "Rivastigmine",
                "Canonical name": "RIV"
            },
            {
                "Referent": "Tacrine",
                "Canonical name": "TAC"
            },
            {
                "Referent": "Galantamine",
                "Canonical name": "GAL"
            },
            {
                "Referent": "Donepezil",
                "Canonical name": "DON"
            },
            {
                "Referent": "Rivastigmine",
                "Canonical name": "RIV"
            },
            {
                "Referent": "Tacrine",
                "Canonical name": "TAC"
            },
            {
                "Referent": "Physostigmine",
                "Canonical name": "PHY"
            },
            {
                "Referent": "Neostigmine",
                "Canonical name": "NEO"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Galantamine",
                "Donepezil",
                "Rivastigmine",
                "Tacrine",
                "Physostigmine",
                "Neostigmine",
                "Ambenonium"
            ],
            "mismatches": [
                "Acetylcholinesterase inhibitor",
                "Baclofen",
                "Raclopride",
                "Biperiden",
                "Procyclidine",
                "Trihexyphenidyl",
                "Pirenzepine"
            ],
            "true_referents": [
                "(+)-Cocaine",
                "(-)-ASIMILOBINE",
                "1-Bromopinacolone",
                "1-Butanol",
                "AMBENONIUM",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "BENZOIN",
                "BI-4924",
                "BI-605906",
                "Chlorproethazine",
                "Compound Donepezil",
                "Compound Galantamine",
                "DECAMETHONIUM",
                "DONEPEZIL",
                "Donepezil",
                "GALANTAMINE",
                "NEOSTIGMINE",
                "Neostigmine",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "Phenothiazine",
                "Physostigmine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "Tacrine",
                "[3H]galantamine hydrobromide",
                "compound 2f [Jiang <i>et al.</i>, 2018]",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 7,
            "FP": 7,
            "FN": 0
        }
    }
]