[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Histamine (HIS)",
            "Serotonin (5-HT)",
            "Dopamine (DA)",
            "Norepinephrine (NE)",
            "Epinephrine (EPI)",
            "Acetylcholine (ACh)",
            "Octopamine",
            "Tyramine",
            "Phenylethylamine",
            "Melatonin",
            "Tryptamine",
            "Dimethyltryptamine (DMT)",
            "5-Methoxydimethyltryptamine (5-MeO-DMT)",
            "Benzylamine",
            "Aniline",
            "Methamphetamine (METH)",
            "Amphetamine (AMP)",
            "L-DOPA",
            "Ethylamine",
            "Methylamine",
            "Trimethylamine",
            "Choline",
            "Adrenaline (EPI)",
            "Noradrenaline (NE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Phenylethylamine",
                "Benzylamine",
                "Aniline",
                "Methamphetamine",
                "Amphetamine",
                "Ethylamine",
                "Methylamine",
                "Trimethylamine"
            ],
            "mismatches": [
                "Histamine (HIS)",
                "Serotonin (5-HT)",
                "Dopamine (DA)",
                "Norepinephrine (NE)",
                "Epinephrine (EPI)",
                "Acetylcholine (ACh)",
                "Octopamine",
                "Tyramine",
                "Melatonin",
                "Tryptamine",
                "Dimethyltryptamine (DMT)",
                "5-Methoxydimethyltryptamine (5-MeO-DMT)",
                "L-DOPA",
                "Choline",
                "Adrenaline (EPI)",
                "Noradrenaline (NE)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(-)-norephedrine",
                "(R)-amphetamine",
                "(S)-amphetamine",
                "(S)-dobutamine",
                "1-phenylethylamine",
                "2-phenylethylamine",
                "3,4-methylenedioxymethamphetamine",
                "4-(phenylazo)aniline",
                "5-methoxy-N,N-dimethyltryptamine",
                "Dimethylamphetamine",
                "EPH",
                "L-phenylalaninol",
                "N-acylethanolamine",
                "N-acylethanolamine 18:0",
                "N-acyllysophosphatidylethanolamine",
                "N-alpha-Methylhistamine",
                "Na,Na-Dimethylhistamine",
                "Phenelzine",
                "a-Methyldopamine",
                "alpha-Methyl-m-tyramine",
                "alpha-methyl-L-dopa ethyl ester",
                "amphetamine",
                "aniline",
                "benzylamine",
                "cyclopropylamine",
                "diethylamine",
                "dobutamine",
                "ethylamine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "methylamines",
                "methylhexaneamine",
                "phenylethylamine",
                "propranolol",
                "propylamine",
                "triethylamine",
                "trimethylamine",
                "tripropylamine"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Aniline (C6H5NH2)",
            "Methamphetamine (CH3NHCH3CH2CH2NH2)",
            "Histamine (C5H9N3)",
            "Serotonin (C10H12N2O)",
            "Epinephrine (C9H13NO3)",
            "Dopamine (C8H11NO2)",
            "Norepinephrine (C8H11NO3)",
            "Guanine (C5H5N5O)",
            "Adenine (C5H5N5)",
            "Caffeine (C8H10N4O2)",
            "Nicotine (C10H14N2)",
            "Morphine (C17H19NO3)",
            "Lysergic acid diethylamide (LSD) (C20H25N3O)",
            "Tryptamine (C10H12N2)",
            "Phenethylamine (C8H11N)",
            "Tyramine (C8H11NO)",
            "Glycine (C2H5NO2)",
            "Putrescine (C4H12N2)",
            "Cadaverine (C5H14N2)",
            "Spermidine (C7H19N3)",
            "Spermine (C10H26N4)",
            "Ethanolamine (C2H7NO)",
            "Choline (C5H14NO+)",
            "Trimethylamine (C3H9N)",
            "Dimethylamine (C2H7N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aniline (C6H5NH2)",
                "Phenethylamine (C8H11N)",
                "Putrescine (C4H12N2)",
                "Ethanolamine (C2H7NO)",
                "Trimethylamine (C3H9N)"
            ],
            "mismatches": [
                "Methamphetamine (CH3NHCH3CH2CH2NH2)",
                "Histamine (C5H9N3)",
                "Serotonin (C10H12N2O)",
                "Epinephrine (C9H13NO3)",
                "Dopamine (C8H11NO2)",
                "Norepinephrine (C8H11NO3)",
                "Guanine (C5H5N5O)",
                "Adenine (C5H5N5)",
                "Caffeine (C8H10N4O2)",
                "Nicotine (C10H14N2)",
                "Morphine (C17H19NO3)",
                "Lysergic acid diethylamide (LSD) (C20H25N3O)",
                "Tryptamine (C10H12N2)",
                "Tyramine (C8H11NO)",
                "Glycine (C2H5NO2)",
                "Cadaverine (C5H14N2)",
                "Spermidine (C7H19N3)",
                "Spermine (C10H26N4)",
                "Choline (C5H14NO+)",
                "Dimethylamine (C2H7N)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "(S)-3,4-methylenedioxy-N-ethylamphetamine",
                "1,2-diamino-2-methylpropane",
                "1-phenylethylamine",
                "13-(2-methylcrotonoyloxy)lupanine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2-Aminomethylpyrimidine",
                "2-phenylethylamine",
                "3,4-methylenedioxymethamphetamine",
                "3-O-Methyl-a-methyldopamine",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "4-Aminomethylpyrimidine",
                "5-acetamidopentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "6-(4-hydroxy-3-nitrobenzamido)hexanoic acid",
                "6-methyl-N2-(phenylmethyl)-N4-[(phenylmethylene)amino]pyrimidine-2,4-diamine",
                "Decylamine",
                "Dimethylamphetamine",
                "N,N-Dimethylphenethylamine",
                "N,N-bis(2-hydroxyethyl)glycine",
                "N-(2,6-dimethylphenyl)-N(2)-(3,5-dimethylphenyl)glycinamide",
                "N-(octanoyl)ethanolamine",
                "N-(saturated fatty acyl)ethanolamine",
                "N-Acetyl-2,6-diethylaniline",
                "N-Cyclohexyl-N-methylcyclohexanamine",
                "N-acetoxy-1,1'-biphenyl-4-amine",
                "N-alpha-Methylhistamine",
                "N-methyl-N-(3-pyridylmethyl)amine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "S-adenosylmethioninamine",
                "a-Methyldopamine",
                "alpha-Methyl-m-tyramine",
                "aniline",
                "anthracen-2-amine",
                "benzylamine",
                "cyclopropylamine",
                "diethyl(propyl)amine",
                "ethanolamine",
                "ethylamine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "phenylethylamine",
                "piperidine",
                "triethylamine",
                "trimethylamine"
            ],
            "TP": 5,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Pentylamine (C5H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Heptylamine (C7H15NH2)",
            "Octylamine (C8H17NH2)",
            "Aniline (C6H5NH2)",
            "Methylenediamine (H2NCH2NH2)",
            "Ethylenediamine (H2NCH2CH2NH2)",
            "Propylenediamine (H2NCH2CH(OH)CH2NH2)",
            "Butylenediamine (H2NCH2CH2CH2NH2)",
            "Phenylalanine (C9H11NO2)",
            "Tyramine (C8H11NO)",
            "Histamine (C5H9N3)",
            "Serotonin (C10H12N2O)",
            "Epinephrine (C9H13NO3)",
            "Norepinephrine (C8H11NO3)",
            "Dopamine (C8H11NO2)",
            "Caffeine (C8H10N4O2)",
            "Theophylline (C7H8N4O2)",
            "Theobromine (C7H8N4O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Propylamine (C3H7NH2)",
                "Heptylamine (C7H15NH2)",
                "Aniline (C6H5NH2)"
            ],
            "mismatches": [
                "Butylamine (C4H9NH2)",
                "Pentylamine (C5H11NH2)",
                "Hexylamine (C6H13NH2)",
                "Octylamine (C8H17NH2)",
                "Methylenediamine (H2NCH2NH2)",
                "Ethylenediamine (H2NCH2CH2NH2)",
                "Propylenediamine (H2NCH2CH(OH)CH2NH2)",
                "Butylenediamine (H2NCH2CH2CH2NH2)",
                "Phenylalanine (C9H11NO2)",
                "Tyramine (C8H11NO)",
                "Histamine (C5H9N3)",
                "Serotonin (C10H12N2O)",
                "Epinephrine (C9H13NO3)",
                "Norepinephrine (C8H11NO3)",
                "Dopamine (C8H11NO2)",
                "Caffeine (C8H10N4O2)",
                "Theophylline (C7H8N4O2)",
                "Theobromine (C7H8N4O2)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(+/-)-n-ethyl-1-phenyl-2-butylamine",
                "(1S,2R)-tranylcypromine",
                "(R)-N-acetyl-1-phenylethylamine",
                "1-Hexadecylamine",
                "13-(2-methylcrotonoyloxy)lupanine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2,5-dimethyl-p-phenylenediamine",
                "2-hydroxy-5-[(1E)-(2-phenylethylidene)amino]-L-tyrosine",
                "3-O-Methyl-a-methyldopamine",
                "3-buten-1-amine",
                "3-phenylpropylamine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-hydroxymethamphetamine",
                "5-acetamidopentanoic acid",
                "5-morpholino-2,4(1H,3H)-pyrimidinedione",
                "6-(4-hydroxy-3-nitrobenzamido)hexanoic acid",
                "Heptylamine",
                "L-phenylalaninol",
                "N'-(2-propoxyphenyl)-2-butenediamide",
                "N,N,2,2-tetramethyl-3-hexyn-1-amine",
                "N,N-Dimethylphenethylamine",
                "N-(4-hydroxyphenyl)eicosa-5,8,11,14-tetraenamide",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(octanoyl)ethanolamine",
                "N-Cyclohexyl-N-methylcyclohexanamine",
                "N-acetoxy-1,1'-biphenyl-4-amine",
                "N-alpha-Methylhistamine",
                "N-benzoyl-L-phenylalaninol",
                "Na,Na-Dimethylhistamine",
                "a-Methyldopamine",
                "alkylamine",
                "alpha-Methyl-m-tyramine",
                "aniline",
                "benzylamine",
                "butan-1-amine",
                "cyclopropylamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethylamine",
                "isopentylamine",
                "methoxamine",
                "methylamine",
                "methylhexaneamine",
                "phenylalkylamine",
                "propylamine"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MeNH2)",
            "Dimethylamine ((CH3)2NH)",
            "Trimethylamine ((CH3)3N)",
            "Ethylamine (C2H5NH2)",
            "Diethylamine ((C2H5)2NH)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Triethylamine ((C2H5)3N)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Dopamine (3,4-dihydroxyphenethylamine)",
            "Histamine (2-(1H-imidazol-4-yl)ethanamine)",
            "Serotonin (5-hydroxytryptamine)",
            "GABA (\u03b3-aminobutyric acid)",
            "Putrescine (1,4-diaminobutane)",
            "Cadaverine (1,5-diaminopentane)",
            "Spermine (N-Spermidine-3-amine)",
            "Spermidine (N-(aminopropyl)-putrescine)",
            "Choline (2-hydroxyethyltrimethylammonium)",
            "Ethanolamine (2-aminoethanol)",
            "Lysine (2-amino-5-(aminomethyl)pentanoic acid)",
            "Arginine (2-amino-5-(guanidinomethyl)pentanoic acid)",
            "Tyramine (4-hydroxyphenethylamine)",
            "\u03b2-Alanine (3-aminopropanoic acid)",
            "Morpholine (C4H9NO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MeNH2)",
                "Dimethylamine ((CH3)2NH)",
                "Trimethylamine ((CH3)3N)",
                "Ethylamine (C2H5NH2)",
                "Diethylamine ((C2H5)2NH)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Triethylamine ((C2H5)3N)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Ethanolamine (2-aminoethanol)"
            ],
            "mismatches": [
                "Dopamine (3,4-dihydroxyphenethylamine)",
                "Histamine (2-(1H-imidazol-4-yl)ethanamine)",
                "Serotonin (5-hydroxytryptamine)",
                "GABA (\u03b3-aminobutyric acid)",
                "Putrescine (1,4-diaminobutane)",
                "Cadaverine (1,5-diaminopentane)",
                "Spermine (N-Spermidine-3-amine)",
                "Spermidine (N-(aminopropyl)-putrescine)",
                "Choline (2-hydroxyethyltrimethylammonium)",
                "Lysine (2-amino-5-(aminomethyl)pentanoic acid)",
                "Arginine (2-amino-5-(guanidinomethyl)pentanoic acid)",
                "Tyramine (4-hydroxyphenethylamine)",
                "\u03b2-Alanine (3-aminopropanoic acid)",
                "Morpholine (C4H9NO)"
            ],
            "true_referents": [
                "(1-Methyl-1H-imidazol-4-yl)methylamine",
                "(2S)-1-(1H-imidazol-5-yl)-2-propanamine",
                "1,2-diamino-2-methylpropane",
                "2,4-dimethylpentan-3-amine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2-Aminomethylpyrimidine",
                "2-isopropylaminoethylamine",
                "2-morpholino-1-phenyl-1-ethanol",
                "3-O-Methyl-a-methyldopamine",
                "3-[(4-aminobutyl)amino]propanal",
                "3-aminooctanoic acid",
                "4-(4-nitrophenylazo)aniline",
                "4-(5,6-diphenyl-1,2,4-triazin-3-yl)morpholine",
                "4-(phenylazo)aniline",
                "4-Aminomethylpyrimidine",
                "4-hydroxymethamphetamine",
                "4-methoxytyramine",
                "5-(dimethylamino)pentanoic acid",
                "5-acetamidopentanoic acid",
                "5-aminopentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "5-morpholino-2,4(1H,3H)-pyrimidinedione",
                "9-aminononanoic acid",
                "Decylamine",
                "L-glutamylglycyl-L-arginine 2-naphthylamide",
                "L-lysine 2-naphthylamide",
                "N,N-Dimethylphenethylamine",
                "N-(decanoyl)ethanolamine",
                "N-methyl-N-(3-pyridylmethyl)amine",
                "N1,N1-diethyl-2-(4-pyridyl)ethan-1-amine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "a-Methyldopamine",
                "alpha-Methyl-m-tyramine",
                "aniline",
                "benzylamine",
                "beta-amino-fatty acid",
                "cyclopropylamine",
                "diethanolamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethanolamine",
                "ethylamine",
                "isopropylamine",
                "methoxamine",
                "methylamine",
                "triethanolamine",
                "triethylamine",
                "trimethylamine"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Aniline (C6H5NH2)",
            "Trimethylamine (N(CH3)3)",
            "Diethylamine ((C2H5)2NH)",
            "Phenethylamine (C8H11N)",
            "Amphetamine (C9H13N)",
            "Dopamine (C8H11NO2)",
            "Serotonin (C10H12N2O)",
            "Histamine (C5H9N3)",
            "Tyramine (C8H11NO)",
            "Putrescine (C4H12N2)",
            "Cadaverine (C5H14N2)",
            "Spermidine (C7H19N3)",
            "Spermine (C10H26N4)",
            "Piperidine (C5H11N)",
            "Pyrrolidine (C4H9N)",
            "Imidazole (C3H4N2)",
            "Lysine (C6H14N2O2)",
            "Procaine (C13H20N2O2)",
            "Lidocaine (C14H22N2O)",
            "Benzylamine (C7H9N)",
            "Phenylalanine (C9H11NO2)",
            "Tryptamine (C10H12N2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Aniline (C6H5NH2)",
                "Trimethylamine (N(CH3)3)",
                "Diethylamine ((C2H5)2NH)",
                "Phenethylamine (C8H11N)",
                "Amphetamine (C9H13N)",
                "Procaine (C13H20N2O2)",
                "Benzylamine (C7H9N)",
                "Piperidine (C5H11N)"
            ],
            "mismatches": [
                "Dopamine (C8H11NO2)",
                "Serotonin (C10H12N2O)",
                "Histamine (C5H9N3)",
                "Tyramine (C8H11NO)",
                "Putrescine (C4H12N2)",
                "Cadaverine (C5H14N2)",
                "Spermidine (C7H19N3)",
                "Spermine (C10H26N4)",
                "Pyrrolidine (C4H9N)",
                "Imidazole (C3H4N2)",
                "Lysine (C6H14N2O2)",
                "Lidocaine (C14H22N2O)",
                "Phenylalanine (C9H11NO2)",
                "Tryptamine (C10H12N2)"
            ],
            "true_referents": [
                "(1-Methyl-1H-imidazol-4-yl)methylamine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "(2-Piperidino-3-pyridinyl)methanol",
                "(2S)-1-(1H-imidazol-5-yl)-2-propanamine",
                "(6S)-6-hydroxyhyoscyamine",
                "(R)-amphetamine",
                "1,2-diamino-2-methylpropane",
                "1-phenylethylamine",
                "13-(2-methylcrotonoyloxy)lupanine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2-(1-methyl-2-pyrrolidinyl)-pyridine",
                "2-(2-Furanyl)pyrrolidine",
                "2-phenylethylamine",
                "3-O-Methyl-a-methyldopamine",
                "3-[(2R)-2-piperidinyl]pyridine",
                "4-(2-aminoethyl)benzene-1,3-diol",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "4-Aminomethylpyrimidine",
                "4-[3-(1H-imidazol-5-yl)propyl]piperidine",
                "5-acetamidopentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "Decylamine",
                "L-phenylalaninol",
                "N,N-Dimethylphenethylamine",
                "N,N-bis(2-hydroxyethyl)glycine",
                "N-alpha-Methylhistamine",
                "N-benzoyl-L-phenylalaninol",
                "N-methyl-N-(3-pyridylmethyl)amine",
                "N1,N1-diethyl-2-(4-pyridyl)ethan-1-amine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "[6-(1-Pyrrolidinyl)-3-pyridinyl]methanol",
                "a-Methyldopamine",
                "alpha-Methyl-m-tyramine",
                "amphetamine",
                "aniline",
                "anthracen-2-amine",
                "benzylamine",
                "chloroprocaine",
                "diethylamine",
                "dimethylamine",
                "ethylamine",
                "methoxamine",
                "methylamine",
                "oxybuprocaine",
                "phenylalkylamine",
                "phenylethylamine",
                "piperidine",
                "primary arylamine",
                "procaine",
                "trimethylamine"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Ammonia (NH3)",
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Aniline (C6H5NH2)",
            "Pyridine (C5H5N)",
            "Pyrrole (C4H5N)",
            "Tryptamine (C10H12N2)",
            "Serotonin (C10H12N2O)",
            "Histamine (C5H9N3)",
            "Dopamine (C8H11NO2)",
            "Norepinephrine (C8H11NO3)",
            "Epinephrine (C9H13NO3)",
            "Lysine (C6H14N2O2)",
            "Arginine (C6H14N4O2)",
            "Caffeine (C8H10N4O2)",
            "Nicotine (C10H14N2)",
            "Choline (C5H14NO)",
            "Creatine (C4H9N3O2)",
            "Spermidine (C7H18N4)",
            "Spermine (C10H26N4)",
            "Nicotinamide (C6H6N2O)",
            "Trimethylamine (C3H9N)",
            "Dimethylamine (C2H7N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Propylamine (C3H7NH2)",
                "Aniline (C6H5NH2)",
                "Trimethylamine (C3H9N)",
                "Dimethylamine (C2H7N)"
            ],
            "mismatches": [
                "Ammonia (NH3)",
                "Butylamine (C4H9NH2)",
                "Pyridine (C5H5N)",
                "Pyrrole (C4H5N)",
                "Tryptamine (C10H12N2)",
                "Serotonin (C10H12N2O)",
                "Histamine (C5H9N3)",
                "Dopamine (C8H11NO2)",
                "Norepinephrine (C8H11NO3)",
                "Epinephrine (C9H13NO3)",
                "Lysine (C6H14N2O2)",
                "Arginine (C6H14N4O2)",
                "Caffeine (C8H10N4O2)",
                "Nicotine (C10H14N2)",
                "Choline (C5H14NO)",
                "Creatine (C4H9N3O2)",
                "Spermidine (C7H18N4)",
                "Spermine (C10H26N4)",
                "Nicotinamide (C6H6N2O)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(+/-)-n-ethyl-1-phenyl-2-butylamine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "(6S)-6-hydroxyhyoscyamine",
                "1,2-diamino-2-methylpropane",
                "13-(2-methylcrotonoyloxy)lupanine",
                "1H-pyrrole",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2-(1-methyl-2-pyrrolidinyl)-pyridine",
                "3,4-dimethoxyphenylethylamine",
                "3-(3,4,5-timethoxyphenyl)propanoylpyrrole",
                "3-O-Methyl-a-methyldopamine",
                "3-[(2R)-2-piperidinyl]pyridine",
                "3-buten-1-amine",
                "3-phenylpropylamine",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "4-Aminomethylpyrimidine",
                "5-acetamidopentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "6-(4-hydroxy-3-nitrobenzamido)hexanoic acid",
                "6-aminohexanoic acid",
                "Ethyl-2-amino-1-cyclohexene-1-carboxylate",
                "L-phenylalaninol",
                "N,N-Dimethylphenethylamine",
                "N,N-bis(2-hydroxyethyl)glycine",
                "N,N-dimethyl-4-[[6-(3-pyridinyl)-3,4-dihydro-2H-pyridin-5-ylidene]methyl]aniline",
                "N-(2,4-dinitrophenyl)aminohexanoic acid",
                "N-(4-ethylphenyl)-3-(1-pyrrolyl)propanamide",
                "N-(saturated fatty acyl)ethanolamine",
                "N-Acetyl-2,6-diethylaniline",
                "N-Cyclohexyl-N-methylcyclohexanamine",
                "N-[(E)-\\{[(Z)-2-amino-1,2-dicyanoethenyl]imino\\}methyl]phenylalanine",
                "N-acetoxy-1,1'-biphenyl-4-amine",
                "N-alpha-Methylhistamine",
                "N-benzoyl-D-arginine 2-naphthylamide",
                "N-methyl-N-(3-pyridylmethyl)amine",
                "Na,Na-Dimethylhistamine",
                "Thenyldiamine",
                "[[4-(diethylamino)phenyl]methylideneamino]urea",
                "a-Methyldopamine",
                "aniline",
                "butan-1-amine",
                "cyclopropylamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethylamine",
                "methoxamine",
                "methylamine",
                "nitrilotriacetate(.4-)",
                "piperidine",
                "propylamine",
                "triethanolamine",
                "triethylamine",
                "trimethylamine"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H7N)",
            "Propylamine (C3H9N)",
            "Butylamine (C4H11N)",
            "Pentylamine (C5H13N)",
            "Hexylamine (C6H15N)",
            "Heptylamine (C7H17N)",
            "Octylamine (C8H19N)",
            "Nonane (C9H21N)",
            "Decylamine (C10H23N)",
            "Phenethylamine (C8H11N)",
            "Tryptamine (C10H12N2)",
            "Serotonin (C10H12N2O)",
            "Histamine (C5H9N3)",
            "Dopamine (C8H11NO2)",
            "Norepinephrine (C8H11NO3)",
            "Epinephrine (C9H13NO3)",
            "Melatonin (C13H16N2O2)",
            "Tyramine (C8H11NO)",
            "Putrescine (C4H12N2)",
            "Cadaverine (C5H14N2)",
            "Spermidine (C7H19N3)",
            "Spermine (C10H26N4)",
            "Trimethylamine (C3H9N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H7N)",
                "Heptylamine (C7H17N)",
                "Decylamine (C10H23N)",
                "Trimethylamine (C3H9N)"
            ],
            "mismatches": [
                "Propylamine (C3H9N)",
                "Butylamine (C4H11N)",
                "Pentylamine (C5H13N)",
                "Hexylamine (C6H15N)",
                "Octylamine (C8H19N)",
                "Nonane (C9H21N)",
                "Phenethylamine (C8H11N)",
                "Tryptamine (C10H12N2)",
                "Serotonin (C10H12N2O)",
                "Histamine (C5H9N3)",
                "Dopamine (C8H11NO2)",
                "Norepinephrine (C8H11NO3)",
                "Epinephrine (C9H13NO3)",
                "Melatonin (C13H16N2O2)",
                "Tyramine (C8H11NO)",
                "Putrescine (C4H12N2)",
                "Cadaverine (C5H14N2)",
                "Spermidine (C7H19N3)",
                "Spermine (C10H26N4)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(+/-)-n-ethyl-1-phenyl-2-butylamine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "1,2-diamino-2-methylpropane",
                "1-Hexadecylamine",
                "1-hexanamine",
                "1-naphthylamine",
                "1-phenylethylamine",
                "13-(2-methylcrotonoyloxy)lupanine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2-phenylethylamine",
                "3-O-Methyl-a-methyldopamine",
                "3-buten-1-amine",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-Aminomethylpyrimidine",
                "4-methyl-3-penten-1-amine",
                "5-acetamidopentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "Decylamine",
                "Heptylamine",
                "N,N,2,2-tetramethyl-3-hexyn-1-amine",
                "N,N-Dimethylphenethylamine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(decanoyl)ethanolamine",
                "N-(octanoyl)ethanolamine",
                "N-Cyclohexyl-N-methylcyclohexanamine",
                "N-alpha-Methylhistamine",
                "N-methyl-N-(3-pyridylmethyl)amine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "a-Methyldopamine",
                "alpha-Methyl-m-tyramine",
                "aniline",
                "anthracen-2-amine",
                "benzylamine",
                "butan-1-amine",
                "cyclopropylamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethylamine",
                "isopentylamine",
                "methoxamine",
                "methylamine",
                "methylhexaneamine",
                "octan-1-amine",
                "pentan-1-amine",
                "phenylethylamine",
                "piperidine",
                "propylamine",
                "triethylamine",
                "trimethylamine"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Butylamine (C4H9NH2)",
            "Isobutylamine ((CH3)2CHCH2NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Aniline (C6H5NH2)",
            "Dimethylamine ((CH3)2NH)",
            "Diethylamine ((C2H5)2NH)",
            "Triethylamine ((C2H5)3N)",
            "N,N-Dimethylethylamine ((CH3)2NCH2CH3)",
            "N,N-Diethylethylamine ((C2H5)2NCH2CH3)",
            "N,N-Dimethylisopropylamine ((CH3)2NCH(CH3)2)",
            "N,N-Diethylisopropylamine ((C2H5)2NCH(CH3)2)",
            "N-Methyl-1,3-propanediamine ((CH3)NH(CH2)3NH2)",
            "N-Ethyl-1,3-propanediamine ((C2H5)NH(CH2)3NH2)",
            "N-Methyl-1,4-butanediamine ((CH3)NH(CH2)4NH2)",
            "N-Ethyl-1,4-butanediamine ((C2H5)NH(CH2)4NH2)",
            "N,N-Dimethyl-1,3-propanediamine ((CH3)2N(CH2)3NH2)",
            "N,N-Diethyl-1,3-propanediamine ((C2H5)2N(CH2)3NH2)",
            "N,N-Dimethyl-1,4-butanediamine ((CH3)2N(CH2)4NH2)",
            "N,N-Diethyl-1,4-butanediamine ((C2H5)2N(CH2)4NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Propylamine (C3H7NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Aniline (C6H5NH2)",
                "Dimethylamine ((CH3)2NH)",
                "Diethylamine ((C2H5)2NH)",
                "Triethylamine ((C2H5)3N)"
            ],
            "mismatches": [
                "Butylamine (C4H9NH2)",
                "Isobutylamine ((CH3)2CHCH2NH2)",
                "N,N-Dimethylethylamine ((CH3)2NCH2CH3)",
                "N,N-Diethylethylamine ((C2H5)2NCH2CH3)",
                "N,N-Dimethylisopropylamine ((CH3)2NCH(CH3)2)",
                "N,N-Diethylisopropylamine ((C2H5)2NCH(CH3)2)",
                "N-Methyl-1,3-propanediamine ((CH3)NH(CH2)3NH2)",
                "N-Ethyl-1,3-propanediamine ((C2H5)NH(CH2)3NH2)",
                "N-Methyl-1,4-butanediamine ((CH3)NH(CH2)4NH2)",
                "N-Ethyl-1,4-butanediamine ((C2H5)NH(CH2)4NH2)",
                "N,N-Dimethyl-1,3-propanediamine ((CH3)2N(CH2)3NH2)",
                "N,N-Diethyl-1,3-propanediamine ((C2H5)2N(CH2)3NH2)",
                "N,N-Dimethyl-1,4-butanediamine ((CH3)2N(CH2)4NH2)",
                "N,N-Diethyl-1,4-butanediamine ((C2H5)2N(CH2)4NH2)"
            ],
            "true_referents": [
                "(+/-)-n-ethyl-1-phenyl-2-butylamine",
                "2,2'-[(2-amino-2-oxoethyl)imino]diacetic acid",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-isopropylaminoethylamine",
                "3-buten-1-amine",
                "3-methylamino-1,2-propanediol",
                "3-phenylpropylamine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Methylcyclohexylamine",
                "N(1)-isopropyl-2-methylpropan-1,2-diamine",
                "N,N,2,2-tetramethyl-3-hexyn-1-amine",
                "N,N-Dimethylphenethylamine",
                "N,N-dimethylcyclohexylamine",
                "N,N-dimethylethanolamine",
                "N-(2,4-dinitrophenyl)aminohexanoic acid",
                "N-[[4-(diethylamino)phenyl]methylideneamino]carbamic acid tert-butyl ester",
                "N-methylbutylamine",
                "N-phenyl-N'-(pyridin-4-ylmethylideneamino)butanediamide",
                "N1,N1-diethyl-2-(4-pyridyl)ethan-1-amine",
                "[[4-(diethylamino)phenyl]methylideneamino]urea",
                "aniline",
                "benzylamine",
                "butan-1-amine",
                "cyclohexylamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "propylamine",
                "triethanolamine",
                "triethylamine"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MeNH\u2082)",
            "Ethylamine (EtNH\u2082)",
            "Aniline (C\u2086H\u2085NH\u2082)",
            "Dimethylamine ((CH\u2083)\u2082NH)",
            "Triethylamine ((C\u2082H\u2085)\u2083N)",
            "Histamine",
            "Dopamine",
            "Serotonin",
            "Epinephrine",
            "Norepinephrine",
            "Tryptamine",
            "Phenethylamine",
            "Putrescine",
            "Cadaverine",
            "Tyramine",
            "Methamphetamine (Meth)",
            "Amphetamine (Amp)",
            "Benzylamine",
            "Piperidine",
            "Spermine",
            "Spermidine",
            "Imidazole",
            "Pyridine",
            "Beta-Phenylethylamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MeNH\u2082)",
                "Ethylamine (EtNH\u2082)",
                "Aniline (C\u2086H\u2085NH\u2082)",
                "Dimethylamine ((CH\u2083)\u2082NH)",
                "Triethylamine ((C\u2082H\u2085)\u2083N)",
                "Methamphetamine (Meth)",
                "Amphetamine (Amp)",
                "Benzylamine",
                "Piperidine",
                "Phenethylamine",
                "Beta-Phenylethylamine"
            ],
            "mismatches": [
                "Histamine",
                "Dopamine",
                "Serotonin",
                "Epinephrine",
                "Norepinephrine",
                "Tryptamine",
                "Putrescine",
                "Cadaverine",
                "Tyramine",
                "Spermine",
                "Spermidine",
                "Imidazole",
                "Pyridine"
            ],
            "true_referents": [
                "(1-Methyl-1H-imidazol-4-yl)methylamine",
                "(2S)-1-(1H-imidazol-5-yl)-2-propanamine",
                "(R)-amphetamine",
                "(S)-amphetamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-(1-methyl-2-pyrrolidinyl)-pyridine",
                "2-phenylethylamine",
                "3-[(2R)-2-piperidinyl]pyridine",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "5-methoxy-N,N-dimethyltryptamine",
                "N,N-Dimethylphenethylamine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "alpha-Methyl-m-tyramine",
                "alverine",
                "amphetamine",
                "aniline",
                "benzylamine",
                "candicine",
                "cyclopropylamine",
                "diethylamine",
                "dimethylamine",
                "dobutamine",
                "etanidazole",
                "ethylamine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "phenylethylamine",
                "piperidine",
                "propranolol",
                "propylamine",
                "triethanolamine",
                "triethylamine",
                "tripropylamine"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Aniline (C6H5NH2)",
            "Dopamine",
            "Serotonin (5-HT)",
            "Histamine",
            "Tryptamine",
            "Putrescine",
            "Cadaverine",
            "Spermidine",
            "Spermine",
            "Tyramine",
            "Phenethylamine (PEA)",
            "Amphetamine",
            "Methamphetamine",
            "Epinephrine (Adrenaline)",
            "Norepinephrine (Noradrenaline)",
            "Tryptophan",
            "Lysine",
            "Arginine",
            "Histidine",
            "Ethanolamine",
            "Glucosamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Propylamine (C3H7NH2)",
                "Aniline (C6H5NH2)",
                "Ethanolamine",
                "Amphetamine",
                "Methamphetamine"
            ],
            "mismatches": [
                "Dopamine",
                "Serotonin (5-HT)",
                "Histamine",
                "Tryptamine",
                "Putrescine",
                "Cadaverine",
                "Spermidine",
                "Spermine",
                "Tyramine",
                "Phenethylamine (PEA)",
                "Epinephrine (Adrenaline)",
                "Norepinephrine (Noradrenaline)",
                "Tryptophan",
                "Lysine",
                "Arginine",
                "Histidine",
                "Glucosamine"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "1-phenylethylamine",
                "2-Aminomethylpyrimidine",
                "2-phenylethylamine",
                "3-phenylpropylamine",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "5-methoxy-N,N-dimethyltryptamine",
                "Heptylamine",
                "L-arginine 2-naphthylamide",
                "L-histidine 2-naphthylamide",
                "L-phenylalaninol",
                "L-tryptophan 2-naphthylamide",
                "N-(butanoyl)ethanolamine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "alpha-Methyl-m-tyramine",
                "alpha-amino fatty acid",
                "alverine",
                "amphetamine",
                "amphetamines",
                "aniline",
                "benzylamine",
                "candicine",
                "cyclopropylamine",
                "cysteamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "dobutamine",
                "dodecylamine",
                "ethanolamine",
                "ethylamine",
                "glycyl-L-tryptophan 2-naphthylamide",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "phenylethylamine",
                "piperidine",
                "propranolol",
                "propylamine",
                "tripropylamine"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MA)",
            "Ethylamine (EA)",
            "Propylamine (PA)",
            "Butylamine (BA)",
            "Pentylamine",
            "Hexylamine",
            "Dimethylamine (DMA)",
            "Trimethylamine (TMA)",
            "Ethylenediamine (EDA)",
            "Putrescine",
            "Cadaverine",
            "Spermidine",
            "Spermine",
            "Histamine",
            "Serotonin (5-HT)",
            "Dopamine (DA)",
            "Norepinephrine (NE)",
            "Epinephrine (E)",
            "Tryptamine",
            "Phenethylamine (PEA)",
            "Tyramine",
            "Amphetamine",
            "Methamphetamine",
            "Lysine (Lys, K)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MA)",
                "Ethylamine (EA)",
                "Propylamine (PA)",
                "Dimethylamine (DMA)",
                "Trimethylamine (TMA)",
                "Phenethylamine (PEA)",
                "Amphetamine",
                "Methamphetamine"
            ],
            "mismatches": [
                "Butylamine (BA)",
                "Pentylamine",
                "Hexylamine",
                "Ethylenediamine (EDA)",
                "Putrescine",
                "Cadaverine",
                "Spermidine",
                "Spermine",
                "Histamine",
                "Serotonin (5-HT)",
                "Dopamine (DA)",
                "Norepinephrine (NE)",
                "Epinephrine (E)",
                "Tryptamine",
                "Tyramine",
                "Lysine (Lys, K)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(-)-norephedrine",
                "(R)-amphetamine",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,5-dimethyl-p-phenylenediamine",
                "2-phenylethylamine",
                "3-buten-1-amine",
                "5-methoxy-N,N-dimethyltryptamine",
                "Dimethylamphetamine",
                "L-lysine 2-naphthylamide",
                "L-phenylalaninol",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "a-Methyldopamine",
                "alkylamine",
                "alpha-Methyl-m-tyramine",
                "alverine",
                "amphetamine",
                "amphetamines",
                "benzylamine",
                "butan-1-amine",
                "candicine",
                "cyclopropylamine",
                "diethylamine",
                "dimethylamine",
                "dioctylamine",
                "dobutamine",
                "ethylamine",
                "isopentylamine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "methylamines",
                "phenylalkylamine",
                "phenylethylamine",
                "piperidine",
                "propylamine",
                "sec-butylamine",
                "triethylamine",
                "trimethylamine",
                "tripropylamine"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (CH3CH2NH2)",
            "Propylamine (CH3CH2CH2NH2)",
            "Butylamine (CH3(CH2)3NH2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Tryptamine (C10H12N2)",
            "Histamine (C5H9N3)",
            "Serotonin (C10H12N2O)",
            "Dopamine (C8H11NO2)",
            "Epinephrine (C9H13NO3)",
            "Norepinephrine (C8H11NO3)",
            "Putrescine (NH2(CH2)4NH2)",
            "Cadaverine (NH2(CH2)5NH2)",
            "Spermidine (NH2(CH2)4NH(CH2)3NH2)",
            "Spermine (NH2(CH2)3NH(CH2)4NH(CH2)3NH2)",
            "Ethanolamine (NH2CH2CH2OH)",
            "Choline (C5H14NO+)",
            "Amphetamine (C9H13N)",
            "Methamphetamine (C10H15N)",
            "Lidocaine (C14H22N2O)",
            "Procaine (C13H20N2O2)",
            "Tetracaine (C15H24N2O2)",
            "Prilocaine (C13H20N2O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (CH3CH2NH2)",
                "Propylamine (CH3CH2CH2NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Putrescine (NH2(CH2)4NH2)",
                "Ethanolamine (NH2CH2CH2OH)",
                "Amphetamine (C9H13N)",
                "Methamphetamine (C10H15N)",
                "Procaine (C13H20N2O2)"
            ],
            "mismatches": [
                "Butylamine (CH3(CH2)3NH2)",
                "Tryptamine (C10H12N2)",
                "Histamine (C5H9N3)",
                "Serotonin (C10H12N2O)",
                "Dopamine (C8H11NO2)",
                "Epinephrine (C9H13NO3)",
                "Norepinephrine (C8H11NO3)",
                "Cadaverine (NH2(CH2)5NH2)",
                "Spermidine (NH2(CH2)4NH(CH2)3NH2)",
                "Spermine (NH2(CH2)3NH(CH2)4NH(CH2)3NH2)",
                "Choline (C5H14NO+)",
                "Lidocaine (C14H22N2O)",
                "Tetracaine (C15H24N2O2)",
                "Prilocaine (C13H20N2O)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(+/-)-n-ethyl-1-phenyl-2-butylamine",
                "(1-Methyl-1H-imidazol-4-yl)methylamine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "(R)-amphetamine",
                "13-(2-methylcrotonoyloxy)lupanine",
                "2,2'-[(2-amino-2-oxoethyl)imino]diacetic acid",
                "2,4,4-trimethyl-2-Pentanamine",
                "2,4-dimethylpentan-3-amine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "3-O-Methyl-a-methyldopamine",
                "3-buten-1-amine",
                "4-(2-aminoethyl)benzene-1,3-diol",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "4-[3-(dimethylamino)propylamino]phenol",
                "5-acetamidopentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "N,N-Dimethylphenethylamine",
                "N-(butanoyl)ethanolamine",
                "N-(saturated fatty acyl)ethanolamine",
                "N-Cyclohexyl-N-methylcyclohexanamine",
                "N-[3-(aminomethyl)benzyl]acetamidine",
                "N-alpha-Methylhistamine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "[[4-(diethylamino)phenyl]methylideneamino]urea",
                "a-Methyldopamine",
                "amphetamine",
                "aniline",
                "benzylamine",
                "chloroprocaine",
                "cyclopropylamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethanolamine",
                "ethylamine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "oxybuprocaine",
                "procaine",
                "propylamine",
                "triethylamine"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (CH3CH2NH2)",
            "Propylamine (CH3CH2CH2NH2)",
            "Butylamine (CH3(CH2)3NH2)",
            "Pentylamine (CH3(CH2)4NH2)",
            "Hexylamine (CH3(CH2)5NH2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Tyramine (p-HO-C6H4CH2CH2NH2)",
            "Dopamine (3,4-diOH-C6H3CH2CH2NH2)",
            "Histamine (imidazol-4-yl-CH2CH2NH2)",
            "Serotonin (5-HO-indol-3-yl-CH2CH2NH2)",
            "Epinephrine (adrenaline) (3,4-diOH-C6H3(OH)CH(OH)CH2NH(CH3))",
            "Norepinephrine (noradrenaline) (3,4-diOH-C6H3(OH)CH(OH)CH2NH2)",
            "Tryptamine (indol-3-yl-CH2CH2NH2)",
            "Putrescine (NH2(CH2)4NH2)",
            "Cadaverine (NH2(CH2)5NH2)",
            "Spermidine (NH2(CH2)3NH(CH2)4NH2)",
            "Spermine (NH2(CH2)3NH(CH2)4NH(CH2)3NH2)",
            "Ethanolamine (HOCH2CH2NH2)",
            "Choline ((CH3)3N+CH2CH2OH)",
            "Acetylcholine ((CH3)3N+CH2CH2OCOCH3)",
            "Creatine (N-Methylguanidino-acetic acid)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (CH3CH2NH2)",
                "Propylamine (CH3CH2CH2NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Putrescine (NH2(CH2)4NH2)",
                "Ethanolamine (HOCH2CH2NH2)"
            ],
            "mismatches": [
                "Butylamine (CH3(CH2)3NH2)",
                "Pentylamine (CH3(CH2)4NH2)",
                "Hexylamine (CH3(CH2)5NH2)",
                "Tyramine (p-HO-C6H4CH2CH2NH2)",
                "Dopamine (3,4-diOH-C6H3CH2CH2NH2)",
                "Histamine (imidazol-4-yl-CH2CH2NH2)",
                "Serotonin (5-HO-indol-3-yl-CH2CH2NH2)",
                "Epinephrine (adrenaline) (3,4-diOH-C6H3(OH)CH(OH)CH2NH(CH3))",
                "Norepinephrine (noradrenaline) (3,4-diOH-C6H3(OH)CH(OH)CH2NH2)",
                "Tryptamine (indol-3-yl-CH2CH2NH2)",
                "Cadaverine (NH2(CH2)5NH2)",
                "Spermidine (NH2(CH2)3NH(CH2)4NH2)",
                "Spermine (NH2(CH2)3NH(CH2)4NH(CH2)3NH2)",
                "Choline ((CH3)3N+CH2CH2OH)",
                "Acetylcholine ((CH3)3N+CH2CH2OCOCH3)",
                "Creatine (N-Methylguanidino-acetic acid)"
            ],
            "true_referents": [
                "(+)-N-methylpseudoephedrine",
                "(+)-norephedrine",
                "(+/-)-n-ethyl-1-phenyl-2-butylamine",
                "(1-Methyl-1H-imidazol-4-yl)methylamine",
                "(1S,2R)-tranylcypromine",
                "(R)-N-acetyl-1-phenylethylamine",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,2'-[(2-amino-2-oxoethyl)imino]diacetic acid",
                "2,4,4-trimethyl-2-Pentanamine",
                "2,4-dimethylpentan-3-amine",
                "2,5-Dimethoxy-4-ethylamphetamine",
                "2-phenylethylamine",
                "3-O-Methyl-a-methyldopamine",
                "3-buten-1-amine",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "4-[3-(dimethylamino)propylamino]phenol",
                "4-tert-butyl-N-[2-(2-methoxyphenyl)ethyl]-1-cyclohexanamine",
                "5-(dimethylamino)pentanoic acid",
                "5-methoxy-N,N-dimethyltryptamine",
                "L-tryptophan 2-naphthylamide",
                "N,N,2,2-tetramethyl-3-hexyn-1-amine",
                "N,N-Dimethylphenethylamine",
                "N-(decanoyl)ethanolamine",
                "N-Cyclohexyl-N-methylcyclohexanamine",
                "N-[3-(aminomethyl)benzyl]acetamidine",
                "N-acetylcysteamine",
                "N-alpha-Methylhistamine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "[[4-(diethylamino)phenyl]methylideneamino]urea",
                "a-Methyldopamine",
                "alpha-Methyl-m-tyramine",
                "aniline",
                "benzylamine",
                "diethyl(propyl)amine",
                "diethylamine",
                "dimethylamine",
                "ethanolamine",
                "ethylamine",
                "isopentylamine",
                "methoxamine",
                "methylamine",
                "phenylethylamine",
                "propylamine",
                "triethylamine"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Ethylamine (EA)",
            "Morphine",
            "Dopamine",
            "Serotonin",
            "Epinephrine",
            "Norepinephrine",
            "Tyramine",
            "Histamine",
            "Acetylcholine",
            "Choline",
            "Glycine",
            "Alanine",
            "Arginine",
            "Lysine",
            "Ornithine",
            "Glutamine",
            "Asparagine",
            "Aspartic acid",
            "Glutamic acid",
            "GABA",
            "Adrenaline",
            "Noradrenaline",
            "Catecholamine",
            "Putrescine",
            "Spermidine",
            "Spermine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethylamine"
            ],
            "mismatches": [
                "Morphine",
                "Dopamine",
                "Serotonin",
                "Epinephrine",
                "Norepinephrine",
                "Tyramine",
                "Histamine",
                "Acetylcholine",
                "Choline",
                "Glycine",
                "Alanine",
                "Arginine",
                "Lysine",
                "Ornithine",
                "Glutamine",
                "Asparagine",
                "Aspartic acid",
                "Glutamic acid",
                "GABA",
                "Adrenaline",
                "Noradrenaline",
                "Catecholamine",
                "Putrescine",
                "Spermidine",
                "Spermine"
            ],
            "true_referents": [
                "2-aminoacrylic acid",
                "5-acetamidopentanoic acid",
                "6-aminohexanoic acid",
                "Allylamine",
                "Heptylamine",
                "L-alanine 2-naphthylamide",
                "L-arginine 2-naphthylamide",
                "L-asparagine 2-naphthylamide",
                "L-glutamyl-L-glutamic acid 2-naphthylamide",
                "L-glutamylglycyl-L-arginine 2-naphthylamide",
                "L-phenylalaninol",
                "N(5)-phenyl-L-glutamine",
                "N,N-bis(2-hydroxyethyl)glycine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-acylethanolamine",
                "N-acyllysophosphatidylethanolamine",
                "Na,Na-Dimethylhistamine",
                "Putrescine_d4",
                "alkylamine",
                "alpha-Methyl-m-tyramine",
                "alpha-amino fatty acid",
                "amphetamine",
                "benzylamine",
                "cyclopropylamine",
                "diethylamine",
                "dobutamine",
                "ethylamine",
                "fentanyl",
                "memantine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "methylhexaneamine",
                "propranolol",
                "propylamine",
                "triethylamine",
                "tripropylamine"
            ],
            "TP": 1,
            "FP": 25,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "amine",
        "domain": "chemistry",
        "response": [
            "Adenine (A)",
            "Amphetamine",
            "Aniline",
            "Benzylamine",
            "Catecholamine",
            "Choline",
            "Cysteamine",
            "Dopamine",
            "Ephedrine",
            "Epinephrine",
            "Histamine",
            "Melatonin",
            "Methamphetamine",
            "Monoamine",
            "Norepinephrine",
            "Phenethylamine",
            "Phenylethylamine",
            "Putrescine",
            "Spermidine",
            "Spermine",
            "Tryptamine",
            "Tyramine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amphetamine",
                "Aniline",
                "Benzylamine",
                "Cysteamine",
                "Methamphetamine",
                "Phenylethylamine"
            ],
            "mismatches": [
                "Adenine (A)",
                "Catecholamine",
                "Choline",
                "Dopamine",
                "Ephedrine",
                "Epinephrine",
                "Histamine",
                "Melatonin",
                "Monoamine",
                "Norepinephrine",
                "Putrescine",
                "Spermidine",
                "Spermine",
                "Tryptamine",
                "Tyramine"
            ],
            "true_referents": [
                "(+)-norephedrine",
                "1-phenylethylamine",
                "2-Aminomethylpyrimidine",
                "2-phenylethylamine",
                "4-(phenylazo)aniline",
                "4-Aminomethylpyrimidine",
                "5-methoxy-N,N-dimethyltryptamine",
                "Methylephedrine",
                "N-acyllysophosphatidylethanolamine",
                "Na,Na-Dimethylhistamine",
                "Phenelzine",
                "Putrescine_d4",
                "alpha-Methyl-m-tyramine",
                "amphetamine",
                "amphetamines",
                "aniline",
                "benzylamine",
                "cyclopropylamine",
                "cysteamine",
                "cysteamine S-phosphate",
                "dobutamine",
                "ethylamine",
                "methamphetamine",
                "methoxamine",
                "methylamine",
                "methylhexaneamine",
                "phenylethylamine",
                "piperidine",
                "propranolol",
                "propylamine",
                "triethylamine",
                "tripropylamine"
            ],
            "TP": 6,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "amine",
        "domain": "chemistry",
        "response": "[\n        {\n            \"Canonical name\": \"Ammonia\" (NH3)\n        },\n        {\n            \"Canonical name\": \"Methanamine\" (CH3NH2)\n        },\n        {\n            \"Canonical name\": \"Dimethylglycine\" (DMG)\n        },\n        {\n            \"Canonical name\": \"Methylarginine\" (MGA)\n        },\n        {\n            \"Canonical name\": \"Choline\" (CH3N+CH2CH2OH2-)\n        },\n        {\n            \"Canonical name\": \"Carbamoylcholine\" (CH3NH2CH2NHCOO-)\n        },\n        {\n            \"Canonical name\": \"Creatine\" (CH3NH2CH2N(CH3)COO-)\n        },\n        {\n            \"Canonical name\": \"Betaine\" (CH3)3N+CH2CH2OH2-\n        },\n        {\n            \"Canonical name\": \"Methionine\" (CH3CH2SH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylmethionine\" (S-AdoMet)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (S-AdoHcy)\n        },\n        {\n            \"Canonical name\": \"S-Methyl-5\u2032-thioadenosine\" (MTA)\n        },\n        {\n            \"Canonical name\": \"S-Methyl-5\u2032-deoxyadenosine\" (MDA)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        },\n        {\n            \"Canonical name\": \"S-Adenosylhomocysteine\" (SAH)\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]