[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Organophosphates (OP)",
            "Carbamates",
            "Echothiophate iodide",
            "Physostigmine",
            "Rivastigmine",
            "Galantamine",
            "Edrophonium",
            "Neostigmine",
            "Pyridostigmine",
            "Bethanechol",
            "Ambenonium",
            "Pilocarpine",
            "Eserine",
            "Tacrine",
            "Donepezil",
            "Decamethonium",
            "Alosetron",
            "Tramadoline",
            "Methacholine",
            "Metacholine",
            "Carbachol",
            "Bethanechol chloride",
            "Mecamylamine",
            "Trimethyltin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Echothiophate iodide",
                "Physostigmine",
                "Rivastigmine",
                "Edrophonium",
                "Neostigmine",
                "Pyridostigmine",
                "Ambenonium",
                "Tacrine",
                "Donepezil",
                "Decamethonium",
                "Carbachol"
            ],
            "mismatches": [
                "Organophosphates (OP)",
                "Carbamates",
                "Galantamine",
                "Bethanechol",
                "Pilocarpine",
                "Eserine",
                "Bethanechol chloride",
                "Alosetron",
                "Tramadoline",
                "Methacholine",
                "Metacholine",
                "Mecamylamine",
                "Trimethyltin"
            ],
            "true_referents": [
                "AMBENONIUM",
                "Acetyl choline",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "BENDIOCARB",
                "BERBERINE CHLORIDE",
                "Caproctamine",
                "Carbachol",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Cocaine",
                "Compound Galantamine",
                "Cymserine",
                "DECAMETHONIUM",
                "DONEPEZIL",
                "Decamethonium",
                "Donepezil",
                "Drofenine",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "GALANTAMINE",
                "Ipidacrine",
                "KETAMINE",
                "MEMANTINE",
                "Malaoxon",
                "Methomyl",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "O,S-dihexyl methylphosphonothioate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Paraoxon",
                "Phenothiazine",
                "Phenylcarbamate- 9a",
                "Phenylcarbamate- 9b",
                "Phenylcarbamate-26b",
                "Physostigmine",
                "Pyridostigmine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "Sarin",
                "TACRINE",
                "TOLSERINE",
                "TRIMEDOXIME",
                "Tacrine",
                "Tacrine Hydrochloride",
                "Tolserine",
                "Zanapezil",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (ESM)",
            "Neostigmine (NXT)",
            "Pyridostigmine (AChE-I)",
            "Rivastigmine (RTG)",
            "Donepezil (DNZ)",
            "Galantamine (GAL)",
            "Edrophonium (EDE)",
            "Tacrine (AC-107)",
            "Distigmine bromide (DIB)",
            "Ambenonium (Mytelase)",
            "Demecarium bromide (DIB)",
            "Isofluorphate (ISO)",
            "Echothiophate iodide (Phospholine iodide)",
            "Malathion (MAL)",
            "Paraoxon (PAR)",
            "Fenthion (FTH)",
            "Diisopropylfluorophosphate (DFP)",
            "Soman (GD)",
            "VX (O-ethyl S-2-diisopropylaminoethyl methylphosphonothiolate)",
            "Diazinon (DZN)",
            "Mecamylamine (MECA)",
            "Metrifonate (TRP)",
            "Cyclosarin (GF)",
            "Sarin (GB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine (ESM)",
                "Neostigmine (NXT)",
                "Pyridostigmine (AChE-I)",
                "Rivastigmine (RTG)",
                "Donepezil (DNZ)",
                "Galantamine (GAL)",
                "Edrophonium (EDE)",
                "Tacrine (AC-107)",
                "Distigmine bromide (DIB)",
                "Ambenonium (Mytelase)",
                "Isofluorphate (ISO)",
                "Echothiophate iodide (Phospholine iodide)",
                "Malathion (MAL)",
                "Paraoxon (PAR)",
                "Diisopropylfluorophosphate (DFP)",
                "Soman (GD)",
                "Diazinon (DZN)",
                "Metrifonate (TRP)",
                "Cyclosarin (GF)",
                "Sarin (GB)"
            ],
            "mismatches": [
                "Demecarium bromide (DIB)",
                "Fenthion (FTH)",
                "VX (O-ethyl S-2-diisopropylaminoethyl methylphosphonothiolate)",
                "Mecamylamine (MECA)"
            ],
            "true_referents": [
                "AD-35",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BENZOIN",
                "Caproctamine",
                "Compound Donepezil",
                "Compound Galantamine",
                "Cyclosarin (GF)",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Decamethonium",
                "Diazinon",
                "Diazoxon",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Distigmine bromide",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "Ethyl parathion",
                "GALANTAMINE",
                "ISOFLUROPHATE",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "MEMANTINE",
                "Malaoxon",
                "Malathion",
                "Mesuagenin A",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Paraoxon",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "S-Hexyl o-pentyl methylphosphonothioate",
                "S-Hexyl o-propyl methylphosphonothioate",
                "SOMAN",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (Eserine)",
            "Neostigmine",
            "Pyridostigmine",
            "Edrophonium",
            "Rivastigmine",
            "Donepezil",
            "Galanthamine",
            "Tacrine",
            "Huperzine A",
            "Ambenonium",
            "Demecarium",
            "Echothiophate",
            "Isoflurophate",
            "Parathion",
            "Malathion",
            "Dichlorvos",
            "Diisopropyl fluorophosphate",
            "Sarin",
            "Soman",
            "VX",
            "Tabun",
            "Eserine",
            "Brivudine",
            "Echothiophate iodide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neostigmine",
                "Pyridostigmine",
                "Edrophonium",
                "Rivastigmine",
                "Donepezil",
                "Tacrine",
                "Huperzine A",
                "Ambenonium",
                "Demecarium",
                "Echothiophate",
                "Isoflurophate",
                "Malathion",
                "Dichlorvos",
                "Diisopropyl fluorophosphate",
                "Sarin",
                "Soman",
                "Tabun",
                "Echothiophate iodide"
            ],
            "mismatches": [
                "Physostigmine (Eserine)",
                "Galanthamine",
                "Parathion",
                "VX",
                "Eserine",
                "Brivudine"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "AD-35",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BESIPIRDINE",
                "BZYX",
                "Chlorpyrifos",
                "Compound Galantamine",
                "Cymserine",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DIPIVEFRIN",
                "DIZOCILPINE",
                "DONEPEZIL",
                "Decamethonium",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Dimefox",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "Ganstigmine",
                "HUPERZINE A",
                "Huperzine A",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "MALATHION",
                "Malathion",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "O,S-dihexyl methylphosphonothioate",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Paraoxon",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Quifenadine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "T-82",
                "TACRINE",
                "TOLSERINE",
                "Tabun",
                "Tacrine",
                "Tacrine Hydrochloride",
                "Tolserine",
                "Trichlorfon",
                "Zanapezil",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Donepezil (DON)",
            "Rivastigmine (RIV)",
            "Galantamine (GAL)",
            "Tacrine (TAC)",
            "Edrophonium (EDR)",
            "Sarin (SAR)",
            "Soman (SOM)",
            "Tabun (TAB)",
            "VX (VX)",
            "Malathion (MAL)",
            "Parathion (PAR)",
            "Diazinon (DIA)",
            "Chlorpyrifos (CPF)",
            "Coumaphos (COU)",
            "Dimethoate (DIM)",
            "Eserine (ESR)",
            "Amblyopyrine (AMB)",
            "Propidium (PRO)",
            "Benzylconium chloride (BCQ)",
            "Demecarium bromide (DEM)",
            "Isoamyl methylphosphonate (IMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine (PHY)",
                "Neostigmine (NEO)",
                "Pyridostigmine (PYR)",
                "Donepezil (DON)",
                "Rivastigmine (RIV)",
                "Galantamine (GAL)",
                "Tacrine (TAC)",
                "Edrophonium (EDR)",
                "Sarin (SAR)",
                "Soman (SOM)",
                "Tabun (TAB)",
                "Malathion (MAL)",
                "Diazinon (DIA)",
                "Chlorpyrifos (CPF)",
                "Coumaphos (COU)"
            ],
            "mismatches": [
                "VX (VX)",
                "Parathion (PAR)",
                "Dimethoate (DIM)",
                "Eserine (ESR)",
                "Amblyopyrine (AMB)",
                "Propidium (PRO)",
                "Benzylconium chloride (BCQ)",
                "Demecarium bromide (DEM)",
                "Isoamyl methylphosphonate (IMP)"
            ],
            "true_referents": [
                "(+/-)-SM-21",
                "3-Acetylpyridine",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BENZYLTRIMETHYLAMMONIUM CHLORIDE",
                "BZYX",
                "Bromophos",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "Compound Methamidophos",
                "Coumaphos",
                "Cymserine",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Diazinon",
                "Diazoxon",
                "Distigmine bromide",
                "Donepezil",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "MEMANTINE",
                "Malaoxon",
                "Malathion",
                "Methyl-phosphonothioic acid butyl ester isopropyl ester",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "O,O-Diethyl S-propyl thiophosphate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "S-Hexyl o-propyl methylphosphonothioate",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "T-82",
                "TACRINE",
                "TOLSERINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tetrachloro-p-benzoquinone",
                "Tolserine",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Tacrine (Cognex)",
            "Pyridostigmine (Mestinon)",
            "Neostigmine (Prostigmin)",
            "Physostigmine (Antilirium)",
            "Edrophonium (Enlon)",
            "Ambenonium (Mytelase)",
            "Demecarium (Humorsol)",
            "Echothiophate (Phospholine Iodide)",
            "Malathion (Ovide)",
            "Parathion",
            "Sarin",
            "Soman",
            "Tabun",
            "Metrifonate",
            "Carbaryl (Sevin)",
            "Diazinon",
            "Chlorpyrifos",
            "Aldicarb (Temik)",
            "Profenofos",
            "Phosmet",
            "Dichlorvos (DDVP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Galantamine",
                "Tacrine",
                "Pyridostigmine",
                "Neostigmine",
                "Physostigmine",
                "Edrophonium",
                "Ambenonium",
                "Demecarium",
                "Echothiophate",
                "Malathion",
                "Sarin",
                "Soman",
                "Tabun",
                "Metrifonate",
                "Diazinon",
                "Chlorpyrifos",
                "Dichlorvos"
            ],
            "mismatches": [
                "Parathion",
                "Carbaryl (Sevin)",
                "Aldicarb (Temik)",
                "Profenofos",
                "Phosmet"
            ],
            "true_referents": [
                "AD-35",
                "AMBENONIUM",
                "AZINPHOS-METHYL",
                "Ambenonium Chloride",
                "Azamethiphos",
                "BENDIOCARB",
                "BENZOIN",
                "Carbaril",
                "Carbofuran",
                "Carbosulfan",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Decamethonium",
                "Diazinon",
                "Diazoxon",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "Ethyl parathion",
                "GALANTAMINE",
                "MALATHION",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Phenylcarbamate-25b",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tabun",
                "Tacrine",
                "Tacrine hydrochloride",
                "Thiodicarb",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (Eserine)",
            "Neostigmine (Prostigmin)",
            "Pyridostigmine (Mestinon)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Donepezil (Aricept)",
            "Carbamate (e.g., Carbaryl)",
            "Organophosphate (e.g., Malathion)",
            "Sarin (GB)",
            "VX (nerve agent)",
            "Dichlorvos (DDVP)",
            "Parathion",
            "Tabun (GA)",
            "Methyl parathion",
            "Bromophos",
            "Azinphos-methyl",
            "Clorpyrifos",
            "Diazinon",
            "Phosmet",
            "Chlorpyrifos-methyl",
            "Echothiophate (Phospholine Iodide)",
            "Isoflurophate (Floropryl)",
            "Soman (GD)",
            "Fenthion"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine (Eserine)",
                "Neostigmine (Prostigmin)",
                "Pyridostigmine (Mestinon)",
                "Rivastigmine (Exelon)",
                "Galantamine (Razadyne)",
                "Donepezil (Aricept)",
                "Organophosphate (e.g., Malathion)",
                "Sarin (GB)",
                "Dichlorvos (DDVP)",
                "Tabun (GA)",
                "Bromophos",
                "Azinphos-methyl",
                "Diazinon",
                "Isoflurophate (Floropryl)",
                "Soman (GD)"
            ],
            "mismatches": [
                "Carbamate (e.g., Carbaryl)",
                "VX (nerve agent)",
                "Parathion",
                "Methyl parathion",
                "Clorpyrifos",
                "Phosmet",
                "Chlorpyrifos-methyl",
                "Echothiophate (Phospholine Iodide)",
                "Fenthion"
            ],
            "true_referents": [
                "AD-35",
                "AZINPHOS-METHYL",
                "Azamethiphos",
                "BENZOIN",
                "Bromophos",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "Compound Methamidophos",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Diazinon",
                "Diazoxon",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "Echothiophate iodide",
                "Ethyl parathion",
                "GALANTAMINE",
                "ISOFLUROPHATE",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "Malathion",
                "Monocrotophos",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Phenylcarbamate- 14b",
                "Phenylcarbamate- 9a",
                "Phenylcarbamate- 9b",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "Sarin",
                "T-82",
                "Tabun",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (DPZ)",
            "Rivastigmine (RVT)",
            "Galantamine (GLT)",
            "Tacrine (TCR)",
            "Huperzine A (HUP)",
            "Edrophonium (EDR)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Echothiophate (ECHO)",
            "Isoflurophate (ISO)",
            "Demecarium (DEM)",
            "Metrifonate (MET)",
            "Phenanthrene (PHE)",
            "Trichlorfon (TRI)",
            "Alvocidib (ALV)",
            "Metoclopramide (METO)",
            "Propafenone (PRO)",
            "Bezafibrate (BEZ)",
            "Carbaryl (CAR)",
            "Propoxur (PROX)",
            "Aldicarb (ALD)",
            "Methomyl (METH)",
            "Oxamyl (OXAM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Galantamine",
                "Tacrine",
                "Huperzine A",
                "Edrophonium",
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Echothiophate",
                "Isoflurophate",
                "Demecarium",
                "Trichlorfon",
                "Methomyl",
                "Metoclopramide"
            ],
            "mismatches": [
                "Phenanthrene",
                "Alvocidib",
                "Propafenone",
                "Bezafibrate",
                "Carbaryl",
                "Propoxur",
                "Aldicarb",
                "Oxamyl"
            ],
            "true_referents": [
                "(-)-ASIMILOBINE",
                "1,2-Xylene",
                "1,4-Xylene",
                "2,2',4,4'-Tetrahydroxybenzil",
                "AZADIRACTIN",
                "BENZIL",
                "Bupropion",
                "Carbaril",
                "Carbofuran",
                "Chlorproethazine",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "Compound Methamidophos",
                "Convallatoxin",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DEOXYVASICINONE",
                "DONEPEZIL",
                "Decamethonium",
                "Donepezil",
                "Drofenine",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "GALANTAMINE",
                "HUPERZINE A",
                "Hexafluorenium bromide",
                "Huperzine A",
                "Huprine-X",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Irinotecan",
                "Isoamyl acetate",
                "Isoflurophate",
                "MET-Carbamyl sulfonate",
                "MULBERROFURAN D",
                "Methomyl",
                "Metoclopramide hydrochloride",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "O,O,S-triethyl thiophosphate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Phoxim",
                "Physostigmine",
                "Pitofenone",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "Tacrine",
                "Tacrine Hydrochloride",
                "Thiodicarb",
                "Trichlorfon",
                "VILAZODONE",
                "Zanapezil",
                "[3H]galantamine hydrobromide",
                "donecopride",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Tacrine (Cognex)",
            "Physostigmine (Antilirium)",
            "Neostigmine (Prostigmin)",
            "Pyridostigmine (Mestinon)",
            "Edrophonium (Tensilon)",
            "Ambenonium (Mytelase)",
            "Echothiophate (Phospholine Iodide)",
            "Malathion (Ovide)",
            "Parathion",
            "Dichlorvos (DDVP)",
            "Carbamates (e.g., Physostigmine carbamate)",
            "Organophosphates (e.g., Paraoxon)",
            "Isoflurophate (Floropryl)",
            "Sarin",
            "Tabun",
            "VX",
            "Galanthamine (Galantamin)",
            "Huperzine A",
            "Phenserine",
            "Tacrine hydrochloride",
            "Donepezil hydrochloride",
            "Rivastigmine tartrate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil hydrochloride",
                "Rivastigmine",
                "Galantamine",
                "Tacrine",
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Edrophonium",
                "Ambenonium",
                "Echothiophate",
                "Malathion",
                "Dichlorvos",
                "Isoflurophate",
                "Sarin",
                "Tabun",
                "Huperzine A",
                "Phenserine",
                "Tacrine hydrochloride",
                "Donepezil"
            ],
            "mismatches": [
                "Parathion",
                "Carbamates (e.g., Physostigmine carbamate)",
                "Organophosphates (e.g., Paraoxon)",
                "VX",
                "Rivastigmine tartrate"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "4-ISOPROPYLPHENSERINE",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BZYX",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "DONEPEZIL HYDROCHLORIDE",
                "Decamethonium",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Dimefox",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "ISOFLUROPHATE",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "Malathion",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "PARAOXON",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Physostigmine",
                "Potasan",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tabun",
                "Tacrine",
                "Tacrine Hydrochloride",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Neostigmine",
            "Pyridostigmine",
            "Physostigmine",
            "Echothiophate",
            "Tacrine",
            "Ambenonium",
            "Edrophonium",
            "Phenserine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Physostigmine",
                "Echothiophate",
                "Tacrine",
                "Ambenonium",
                "Edrophonium",
                "Phenserine"
            ],
            "mismatches": [
                "Galantamine (Razadyne)"
            ],
            "true_referents": [
                "4-ISOPROPYLPHENSERINE",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "Compound Galantamine",
                "DONEPEZIL",
                "Decamethonium",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "GALANTAMINE",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "PYRIDOSTIGMINE BROMIDE",
                "Physostigmine",
                "Pyridostigmine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "Tacrine",
                "Tacrine Hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 10,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (E2020)",
            "Rivastigmine (ENA-713)",
            "Galantamine (GAL)",
            "Tacrine (THA)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Edrophonium (EDR)",
            "Huperzine A (HupA)",
            "Metrifonate (MTF)",
            "Eptastigmine (EPS)",
            "Ambenonium (AMB)",
            "Demecarium (DEM)",
            "Echothiophate (ECH)",
            "Isoflurophate (DFP)",
            "Malathion (MAL)",
            "Paraoxon (PAR)",
            "Sarin (GB)",
            "VX nerve agent",
            "Tabun (GA)",
            "Soman (GD)",
            "Cyclosarin (GF)",
            "Diisopropylfluorophosphate (DIFP)",
            "Tetraisopropyl pyrophosphoramide (iso-OMPA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil (E2020)",
                "Rivastigmine (ENA-713)",
                "Galantamine (GAL)",
                "Tacrine (THA)",
                "Physostigmine (PHY)",
                "Neostigmine (NEO)",
                "Pyridostigmine (PYR)",
                "Edrophonium (EDR)",
                "Huperzine A (HupA)",
                "Metrifonate (MTF)",
                "Eptastigmine (EPS)",
                "Ambenonium (AMB)",
                "Demecarium (DEM)",
                "Echothiophate (ECH)",
                "Isoflurophate (DFP)",
                "Malathion (MAL)",
                "Paraoxon (PAR)",
                "Sarin (GB)",
                "Tabun (GA)",
                "Soman (GD)",
                "Cyclosarin (GF)"
            ],
            "mismatches": [
                "VX nerve agent",
                "Diisopropylfluorophosphate (DIFP)",
                "Tetraisopropyl pyrophosphoramide (iso-OMPA)"
            ],
            "true_referents": [
                "AD-35",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "Chlorpyrifos",
                "Compound Donepezil",
                "Compound Galantamine",
                "Cyclosarin (GF)",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Decamethonium",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "EPTASTIGMINE",
                "Echothiophate iodide",
                "Edrophonium",
                "Eptastigmine",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "Malaoxon",
                "Malathion",
                "Methanesulfonyl fluoride",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "Sarin",
                "T-82",
                "TACRINE",
                "Tabun",
                "Tacrine",
                "Tacrine Hydrochloride",
                "XANTHOSTIGMINE",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (Aricept)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Tacrine (Cognex)",
            "Physostigmine (Antilirium)",
            "Pyridostigmine (Mestinon)",
            "Neostigmine (Prostigmin)",
            "Edrophonium (Enlon)",
            "Demecarium (Humorsol)",
            "Echothiophate (Phospholine Iodide)",
            "Isoflurophate (Floropryl)",
            "Metrifonate",
            "Huperzine A",
            "Phenserine",
            "Tolserine",
            "Ipidacrine",
            "Ladostigil",
            "Ungeremine",
            "Zifrosilone",
            "Ganstigmine",
            "Icopezil",
            "Zanapezil",
            "Esolerine",
            "Suronacrine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Rivastigmine",
                "Galantamine",
                "Tacrine",
                "Physostigmine",
                "Pyridostigmine",
                "Neostigmine",
                "Edrophonium",
                "Demecarium",
                "Echothiophate",
                "Isoflurophate",
                "Metrifonate",
                "Huperzine A",
                "Phenserine",
                "Tolserine",
                "Ipidacrine",
                "Ganstigmine",
                "Icopezil",
                "Zanapezil"
            ],
            "mismatches": [
                "Donepezil (Aricept)",
                "Ladostigil",
                "Ungeremine",
                "Zifrosilone",
                "Esolerine",
                "Suronacrine"
            ],
            "true_referents": [
                "14-Fluorohuperzine A",
                "4-ISOPROPYLPHENSERINE",
                "Acetyl choline",
                "BESIPIRDINE",
                "Caracemide",
                "Chlorpyrifos-methyl oxon",
                "Compound Galantamine",
                "Cymserine",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DONEPEZIL",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "Echothiophate iodide",
                "Edrophonium",
                "Edrophonium chloride",
                "GALANTAMINE",
                "Ganstigmine",
                "HUPERZINE A",
                "Huperzine A",
                "ISOFLUROPHATE",
                "Icopezil",
                "Ipidacrine",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "Mesuagenin A",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,S-dihexyl methylphosphonothioate",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PHYSOSTIGMINE SALICYLATE",
                "PYRIDOSTIGMINE",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "Quifenadine",
                "RIVASTIGMINE",
                "Rivastigmine",
                "Stacofylline",
                "TACRINE",
                "TOLSERINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tolserine",
                "Zanapezil",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (DPZ)",
            "Rivastigmine (RVS)",
            "Galantamine (GAL)",
            "Tacrine (TAC)",
            "Huperzine A (HUP)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Ambenonium (AMB)",
            "Distigmine (DIS)",
            "Edrophonium (EDR)",
            "Echothiophate (ECO)",
            "Demecarium (DEM)",
            "Isoflurophate (ISO)",
            "Malathion (MAL)",
            "Parathion (PAR)",
            "Diazinon (DIA)",
            "Chlorpyrifos (CHL)",
            "Dichlorvos (DDV)",
            "Metrifonate (MET)",
            "Phenserine (PHN)",
            "Tolserine (TOL)",
            "Bambuterol (BAM)",
            "Ambenonium dichloride (AMD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Galantamine",
                "Tacrine",
                "Huperzine A",
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Ambenonium",
                "Edrophonium",
                "Echothiophate",
                "Isoflurophate",
                "Malathion",
                "Diazinon",
                "Chlorpyrifos",
                "Dichlorvos",
                "Phenserine",
                "Tolserine",
                "Bambuterol"
            ],
            "mismatches": [
                "Distigmine",
                "Parathion",
                "Demecarium",
                "Metrifonate",
                "Ambenonium dichloride"
            ],
            "true_referents": [
                "AMBENONIUM",
                "Ambenonium Chloride",
                "Amodiaquine Hydrochloride",
                "BAMBUTEROL",
                "Bambuterol Hydrochloride",
                "Carbachol",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "Cymserine",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DIZOCILPINE",
                "DONEPEZIL",
                "Decamethonium",
                "Diazinon",
                "Diazoxon",
                "Dichlorvos",
                "Distigmine bromide",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "MALATHION",
                "MET-Carbamyl sulfonate",
                "Malaoxon",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "O,O,S-triethyl thiophosphate",
                "PARAOXON",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Phenethylnorcymserine",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "TOLSERINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "Tolserine",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Donepezil (DON)",
            "Rivastigmine (RIV)",
            "Galantamine (GAL)",
            "Physostigmine (PHY)",
            "Neostigmine (NEO)",
            "Pyridostigmine (PYR)",
            "Tacrine (TAC)",
            "Edrophonium (EDR)",
            "Echothiophate (ECH)",
            "Isoflurophate (ISO)",
            "Demecarium (DEM)",
            "Paraoxon (PAR)",
            "Sarin (SAR)",
            "Soman (SOM)",
            "VX (VX)",
            "Diisopropyl fluorophosphate (DFP)",
            "Echothiophate iodide (ECI)",
            "Diisopropylfluorophosphate (DFP)",
            "Tetraethyl pyrophosphate (TEPP)",
            "Disulfoton (DIS)",
            "Malathion (MAL)",
            "Parathion (PAT)",
            "Chlorpyrifos (CHL)",
            "Coumaphos (COU)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Donepezil",
                "Rivastigmine",
                "Galantamine",
                "Physostigmine",
                "Neostigmine",
                "Pyridostigmine",
                "Tacrine",
                "Edrophonium",
                "Echothiophate",
                "Isoflurophate",
                "Demecarium",
                "Paraoxon",
                "Sarin",
                "Soman",
                "Diisopropyl fluorophosphate",
                "Echothiophate iodide",
                "Malathion",
                "Chlorpyrifos",
                "Coumaphos"
            ],
            "mismatches": [
                "VX (VX)",
                "Diisopropylfluorophosphate (DFP)",
                "Tetraethyl pyrophosphate (TEPP)",
                "Disulfoton (DIS)",
                "Parathion (PAT)"
            ],
            "true_referents": [
                "(+/-)-SM-21",
                "BENZYL SULFOXIDE",
                "BZYX",
                "Bromophos",
                "Chlorpyrifos",
                "Chlorpyrifos oxon",
                "Chlorpyrifos-methyl oxon",
                "Compound Donepezil",
                "Compound Galantamine",
                "Compound Methamidophos",
                "Coumaphos",
                "DECAMETHONIUM",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Decamethonium",
                "Dichlorvos",
                "Diisopropyl phosphorofluoridate (DFP)",
                "Dimethyl sulfoxide",
                "Donepezil",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "Ethyl parathion",
                "GALANTAMINE",
                "GALLAMINE TRIETHIODIDE",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "Isopropyl methylphosphonofluoridate",
                "MALATHION",
                "Malaoxon",
                "Malathion",
                "NEOSTIGMINE",
                "NEOSTIGMINE BROMIDE",
                "Neostigmine",
                "O,O-Diethyl S-pentyl thiophosphate",
                "PARAOXON",
                "PHYSOSTIGMINE",
                "PYRIDOSTIGMINE",
                "Paraoxon",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "SOMAN",
                "SUVN-911",
                "Sarin",
                "TACRINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Physostigmine (Physost)",
            "Neostigmine (NeoStig)",
            "Pyridostigmine (Pyridost)",
            "Edrophonium (Edro)",
            "Ambenonium (Ambenon)",
            "Rivastigmine (Exelon)",
            "Galantamine (Reminyl)",
            "Tacrine (Cognex)",
            "Donepezil (Aricept)",
            "Memantine (Namenda)",
            "Huperzine A (HupA)",
            "BW284C51",
            "Echothiophate (Echoth)",
            "Iso-OMPA (Iso-OMPA)",
            "Phenserine (Phenser)",
            "Xanomeline (Xanomel)",
            "Zanamivir (Relenza)",
            "Mecamylamine (Inversine)",
            "Dioscoretin",
            "Diosbulbin",
            "Huperzin",
            "Gambogic acid",
            "Bulbocapnine",
            "Cymserine",
            "Cymserine",
            "Ganoderic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Physostigmine (Physost)",
                "Neostigmine (NeoStig)",
                "Pyridostigmine (Pyridost)",
                "Edrophonium (Edro)",
                "Ambenonium (Ambenon)",
                "Rivastigmine (Exelon)",
                "Galantamine (Reminyl)",
                "Tacrine (Cognex)",
                "Donepezil (Aricept)",
                "Memantine (Namenda)",
                "Huperzine A (HupA)",
                "BW284C51",
                "Echothiophate (Echoth)",
                "Phenserine (Phenser)",
                "Cymserine"
            ],
            "mismatches": [
                "Iso-OMPA (Iso-OMPA)",
                "Xanomeline (Xanomel)",
                "Zanamivir (Relenza)",
                "Mecamylamine (Inversine)",
                "Dioscoretin",
                "Diosbulbin",
                "Huperzin",
                "Gambogic acid",
                "Bulbocapnine",
                "Ganoderic acid"
            ],
            "true_referents": [
                "2,2',4,4'-Tetrahydroxybenzil",
                "4,8-DIHYDROXY-1-TETRALONE",
                "AMBENONIUM",
                "Ambenonium Chloride",
                "BAVACHININ A",
                "BERBERIN",
                "BI-4924",
                "BW284C51",
                "Bisnorcymserine",
                "CANNABIDIOL",
                "CCT251921",
                "Caproctamine",
                "Compound Galantamine",
                "Cymserine",
                "DECAMETHONIUM",
                "DONEPEZIL",
                "Donepezil",
                "Donepezil hydrochloride",
                "Drofenine",
                "ECHOTHIOPHATE",
                "EDROPHONIUM",
                "EDROPHONIUM CHLORIDE",
                "Echothiophate iodide",
                "Edrophonium",
                "GALANTAMINE",
                "GENISTEIN",
                "GLABRANIN",
                "Gallamine",
                "Ganoderic acid B",
                "HUPERZINE A",
                "Huperzine A",
                "Huprine-X",
                "Huprine-Y",
                "Isoamyl acetate",
                "KETAMINE",
                "MEMANTINE",
                "Mipafox",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PD138670",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PHYSOSTIGMINE",
                "PURPUREAMINE I",
                "PURPURIN",
                "PYRIDOSTIGMINE",
                "Phenthoate",
                "Physostigmine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "QUERCETIN",
                "RIVASTIGMINE",
                "RUTIN",
                "Ranitidine hydrochloride",
                "Rivastigmine",
                "TACRINE",
                "TOLSERINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "Zanapezil",
                "[3H]galantamine hydrobromide",
                "physostigmine",
                "rivastigmine"
            ],
            "TP": 15,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": [
            "Neostigmine (Prostigmin)",
            "Pyridostigmine (Mestinon)",
            "Tacrine (Cognex)",
            "Rivastigmine (Exelon)",
            "Galantamine (Razadyne)",
            "Donepezil (Aricept)",
            "Eptastigmine",
            "Phenserine",
            "Metrifonate",
            "Ambenonium chloride",
            "Demecarium",
            "Parathion",
            "Malathion",
            "Echothiophate",
            "Isoflurophate",
            "Dyflos",
            "Cresylate",
            "Carbachol",
            "Bethanechol",
            "Carbaryl",
            "Alverine citrate",
            "Methantheline",
            "Bromoxyne"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eptastigmine",
                "Phenserine",
                "Ambenonium chloride",
                "Demecarium",
                "Malathion",
                "Echothiophate",
                "Isoflurophate",
                "Carbachol"
            ],
            "mismatches": [
                "Neostigmine (Prostigmin)",
                "Pyridostigmine (Mestinon)",
                "Tacrine (Cognex)",
                "Rivastigmine (Exelon)",
                "Galantamine (Razadyne)",
                "Donepezil (Aricept)",
                "Metrifonate",
                "Parathion",
                "Dyflos",
                "Cresylate",
                "Bethanechol",
                "Carbaryl",
                "Alverine citrate",
                "Methantheline",
                "Bromoxyne"
            ],
            "true_referents": [
                "4-ISOPROPYLPHENSERINE",
                "AMBENONIUM",
                "Acetylcholine chloride",
                "Ambenonium Chloride",
                "BENZYLTRIMETHYLAMMONIUM CHLORIDE",
                "Bromophos",
                "Butyl acetate",
                "Caproctamine",
                "Carbachol",
                "Carbaril",
                "Carbofuran",
                "Chlorpyrifos",
                "Chlorpyrifos-methyl oxon",
                "Cocaine",
                "Compound Galantamine",
                "Cresol",
                "DEHYDROROEMERINE",
                "DEMECARIUM",
                "DFP (Diisopropyl fluorophosphate)",
                "DONEPEZIL",
                "Dimefox",
                "Donepezil",
                "Donepezil hydrochloride",
                "ECHOTHIOPHATE",
                "EPTASTIGMINE",
                "Echothiophate iodide",
                "Eptastigmine",
                "Ethyl acetate",
                "Ethyl parathion",
                "GALANTAMINE",
                "ISOFLUROPHATE",
                "ISOPROPYL METHYLPHOSPHONOFLUORIDATE",
                "Isoflurophate",
                "KETAMINE",
                "Leptophos",
                "MALATHION",
                "Malathion",
                "Methomyl",
                "Metrifonate(trichlorfon)",
                "NEOSTIGMINE",
                "Neostigmine",
                "Neostigmine bromide",
                "O,O,S-triethyl thiophosphate",
                "PARAOXON",
                "PHENETHYLCYMSERINE",
                "PHENSERINE",
                "PYRIDOSTIGMINE",
                "Palmatine",
                "Paraoxon",
                "Phenothiazine",
                "Pyridostigmine",
                "Pyridostigmine bromide",
                "RIVASTIGMINE",
                "Rivastigmine",
                "TACRINE",
                "Tacrine",
                "Tacrine hydrochloride",
                "Trientine",
                "XANTHOSTIGMINE",
                "[3H]galantamine hydrobromide",
                "rivastigmine"
            ],
            "TP": 8,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "cholinesterase inhibitor",
        "domain": "medicine",
        "response": "[\n        {\n            \"Referent\": \"acetylcholinesterase\" (ACE)\n        },\n        {\n            \"Referent\": \"butyrylcholinesterase\" (BChE)\n        },\n        {\n            \"Referent\": \"pyridostigmine bromide\"\n        },\n        {\n            \"Referent\": \"neostigmine methylsulfate\"\n        },\n        {\n            \"Referent\": \"rivastigmine tartrate\"\n        },\n        {\n            \"Referent\": \"galantamine hydrobromide\"\n        },\n        {\n            \"Referent\": \"tacrine\"\n        },\n        {\n            \"Referent\": \"donepezil\"\n        },\n        {\n            \"Referent\": \"galantamine\"\n        },\n        {\n            \"Referent\": \"memantine\"\n        },\n        {\n            \"Referent\": \"huperzine A\"\n        },\n        {\n            \"Referent\": \"physostigmine\"\n        },\n        {\n            \"Referent\": \"benztropine mesylate\"\n        },\n        {\n            \"Referent\": \"trihexyphenidyl\"\n        },\n        {\n            \"Referent\": \"benzatropine mesylate\"\n        },\n        {\n            \"Referent\": \"isopropyl carbamate\"\n        },\n        {\n            \"Referent\": \"carbamate\"\n        },\n        {\n            \"Referent\": \"carbamates\"\n        },\n        {\n            \"Referent\": \"carbamate pesticides\"\n        },\n        {\n            \"Referent\": \"carbamate insecticides\"\n        },\n        {\n            \"Referent\": \"carbamate herbicides\"\n        },\n        {\n            \"Referent\": \"carbamate drugs\"\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]