[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MeNH2)",
            "Ethylamine (EtNH2)",
            "Propylamine (PrNH2)",
            "Butylamine (BuNH2)",
            "Isopropylamine ((i-Pr)NH2)",
            "Tert-butylamine ((t-Bu)NH2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Dimethylamine (Me2NH)",
            "Diethylamine (Et2NH)",
            "Diisopropylamine ((i-Pr)2NH)",
            "Trimethylamine (Me3N)",
            "Triethylamine (Et3N)",
            "Hexamethylenediamine (HMDA, (CH2)6(NH2)2)",
            "Choline (C5H14NO2)",
            "Histamine (C5H9N3)",
            "Serotonin (5-HT, C10H12N2O)",
            "Epinephrine (Adrenaline, C9H13NO3)",
            "Norepinephrine (Noradrenaline, C8H11NO3)",
            "Dopamine (C8H11NO2)",
            "Tyramine (C8H11NO)",
            "Hemoglobin (heme group, Fe(II)-porphyrin complex with NH2)",
            "Carnitine (C7H15NO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MeNH2)",
                "Ethylamine (EtNH2)",
                "Isopropylamine ((i-Pr)NH2)",
                "Tert-butylamine ((t-Bu)NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)"
            ],
            "mismatches": [
                "Propylamine (PrNH2)",
                "Butylamine (BuNH2)",
                "Dimethylamine (Me2NH)",
                "Diethylamine (Et2NH)",
                "Diisopropylamine ((i-Pr)2NH)",
                "Trimethylamine (Me3N)",
                "Triethylamine (Et3N)",
                "Hexamethylenediamine (HMDA, (CH2)6(NH2)2)",
                "Choline (C5H14NO2)",
                "Histamine (C5H9N3)",
                "Serotonin (5-HT, C10H12N2O)",
                "Epinephrine (Adrenaline, C9H13NO3)",
                "Norepinephrine (Noradrenaline, C8H11NO3)",
                "Dopamine (C8H11NO2)",
                "Tyramine (C8H11NO)",
                "Hemoglobin (heme group, Fe(II)-porphyrin complex with NH2)",
                "Carnitine (C7H15NO3)"
            ],
            "true_referents": [
                "(1R)-1-phenylethanamine",
                "(1S,2R)-tranylcypromine",
                "1-Hexadecylamine",
                "1-naphthylamine",
                "1-phenylethylamine",
                "1-phenylpropan-2-amine",
                "2,4-dimethylpentan-3-amine",
                "2,5-dimethyl-p-phenylenediamine",
                "2-isopropylaminoethylamine",
                "2-methylbutan-2-amine",
                "2-phenylethylamine",
                "3-methoxytyramine",
                "4-(4-nitrophenylazo)aniline",
                "4-(phenylazo)aniline",
                "4-hydroxymethamphetamine",
                "4-methoxytyramine",
                "Decylamine",
                "N(1)-isopropyl-2-methylpropan-1,2-diamine",
                "N,1-dioleoyl-sn-glycero-3-phosphoethanolamine",
                "N,1-dipalmitoyl-sn-glycero-3-phosphoethanolamine",
                "N,N-Dimethylphenethylamine",
                "N-(monounsaturated fatty acyl)ethanolamine",
                "N-(saturated fatty acyl)ethanolamine",
                "N-ethyldiethanolamine",
                "alkylamine",
                "aniline",
                "benzylamine",
                "beta-D-Manp-(1->2)-beta-D-Manp-(1->2)-alpha-D-Manp-O[CH2]2NH2",
                "butan-1-amine",
                "carboxin",
                "cyclopropylamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "methylhexaneamine",
                "phenylethylamine",
                "primary arylamine",
                "sec-butylamine",
                "tert-butylamine"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Aniline (C6H5NH2)",
            "Phenethylamine (C8H11N)",
            "Tryptamine (C10H12N2)",
            "Putrescine (NC(CH2)4CN)",
            "Cadaverine (NC(H2)5NC(H2)5)",
            "Histamine (C5H9N3)",
            "Serotonin (C10H12N2O)",
            "Spermidine (C7H19N3)",
            "Spermine (C10H26N4)",
            "Morpholine (C4H8ON)",
            "Pyrrolidine (C4H9N)",
            "Piperidine (C5H11N)",
            "Cyclohexylamine (C6H13N)",
            "N,N-Dimethylethylamine ((CH3)2NCH2CH3)",
            "N-Methylaniline (C7H9N)",
            "N-Ethylaniline (C8H11N)",
            "N,N-Dimethylaniline ((CH3)2NC6H5)",
            "N,N-Diethylaniline ((C2H5)2NC6H5)",
            "Glycine (NH2CH2COOH)",
            "Alanine (NH2CH(CH3)COOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methylamine",
                "ethylamine",
                "isopropylamine",
                "aniline",
                "cyclohexylamine",
                "n-methylaniline"
            ],
            "mismatches": [
                "propylamine",
                "butylamine",
                "phenethylamine",
                "tryptamine",
                "putrescine",
                "cadaverine",
                "histamine",
                "serotonin",
                "spermidine",
                "spermine",
                "morpholine",
                "pyrrolidine",
                "piperidine",
                "n,n-dimethylethylamine",
                "n-ethylaniline",
                "n,n-dimethylaniline",
                "n,n-diethylaniline",
                "glycine",
                "alanine"
            ],
            "true_referents": [
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "1,2-diamino-2-methylpropane",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2,5-dimethylaniline",
                "2,6-dimethylaniline",
                "2-(2,4-dichlorophenoxy)-N-[4-(4-morpholinylmethyl)phenyl]acetamide",
                "2-cyano-3-[2,5-dimethyl-1-(3-pyridinyl)-3-pyrrolyl]-N-phenyl-2-propenamide",
                "2-isopropylaminoethylamine",
                "2-phenylethylamine",
                "3,4-dimethylaniline",
                "3-buten-1-amine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "4-methyl-3-penten-1-amine",
                "Dicyclohexylamine",
                "L-tryptophan 2-naphthylamide",
                "N,N-Dimethylphenethylamine",
                "N-(2,6-dimethylphenyl)-N(2)-(3,5-dimethylphenyl)glycinamide",
                "N-(2-naphthyl)carboxamide",
                "N-(4-anilinophenyl)cyclopropanecarboxamide",
                "N-(4-ethylphenyl)-3-(1-pyrrolyl)propanamide",
                "N-(alpha-L-glutamyl)-2-naphthylamine",
                "N-Acetyl-2,6-diethylaniline",
                "N-[(3-methoxyphenyl)methyl]-N-methyl-1-[1-[2-(2-methylphenyl)ethyl]-3-piperidinyl]methanamine",
                "N-[4-(4-morpholinylazo)phenyl]acetamide",
                "N-methylaniline",
                "N-phenyl-N'-(pyridin-4-ylmethylideneamino)butanediamide",
                "Putrescine_d4",
                "alkylamine",
                "aniline",
                "benzylamine",
                "butan-1-amine",
                "cyclohexylamine",
                "ethylamine",
                "glycine 2-naphthylamide",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "phenyl-[1-(2-phenylethyl)-4-piperidinyl]methanol",
                "phenylethylamine"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Pentylamine (C5H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Heptylamine (C7H15NH2)",
            "Octylamine (C8H17NH2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Tyramine (C8H11NO)",
            "Tryptamine (C10H12N2)",
            "Histamine (C5H9N3)",
            "Putrescine (C4H12N2)",
            "Cadaverine (C5H14N2)",
            "Spermidine (C7H19N3)",
            "Spermine (C10H26N4)",
            "Norepinephrine (C8H11NO3)",
            "Ephedrine (C10H15NO)",
            "Pseudoephedrine (C10H15NO)",
            "Methamphetamine (C10H15N)",
            "Amphetamine (C9H13N)",
            "Cocaine (C17H21NO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Heptylamine (C7H15NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Methamphetamine (C10H15N)"
            ],
            "mismatches": [
                "Propylamine (C3H7NH2)",
                "Butylamine (C4H9NH2)",
                "Pentylamine (C5H11NH2)",
                "Hexylamine (C6H13NH2)",
                "Octylamine (C8H17NH2)",
                "Tyramine (C8H11NO)",
                "Tryptamine (C10H12N2)",
                "Histamine (C5H9N3)",
                "Putrescine (C4H12N2)",
                "Cadaverine (C5H14N2)",
                "Spermidine (C7H19N3)",
                "Spermine (C10H26N4)",
                "Norepinephrine (C8H11NO3)",
                "Ephedrine (C10H15NO)",
                "Pseudoephedrine (C10H15NO)",
                "Amphetamine (C9H13N)",
                "Cocaine (C17H21NO4)"
            ],
            "true_referents": [
                "(1R)-1-phenylethanamine",
                "(1R,2S)-tranylcypromine",
                "(1S)-1-phenylethanamine",
                "(1S,2R)-tranylcypromine",
                "(R)-N-acetyl-1-phenylethylamine",
                "(R)-amphetamine",
                "(S)-(+)-4-(5-carboxypentyl)methamphetamine",
                "(S)-amphetamine",
                "1,2-diamino-2-methylpropane",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-phenylethylamine",
                "3,4-dimethoxyphenylethylamine",
                "3-buten-1-amine",
                "3-methoxytyramine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "4-hydroxymethamphetamine",
                "4-methoxytyramine",
                "4-tert-butyl-N-[2-(2-methoxyphenyl)ethyl]-1-cyclohexanamine",
                "Decylamine",
                "Heptylamine",
                "L-tryptophan 2-naphthylamide",
                "N,N-Dimethylphenethylamine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(octanoyl)ethanolamine",
                "Putrescine_d4",
                "alkylamine",
                "aniline",
                "anthracen-2-amine",
                "benzylamine",
                "butan-1-amine",
                "ethylamine",
                "isopentylamine",
                "methamphetamine",
                "methylamine",
                "methylhexaneamine",
                "phenylethylamine"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Pentylamine (C5H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Aniline (C6H5NH2)",
            "2-Phenylethylamine (C8H11NH2)",
            "Dopamine (3,4-Dihydroxyphenethylamine)",
            "Histamine (4-(1H-Imidazol-4-yl)ethanamine)",
            "Serotonin (5-Hydroxytryptamine)",
            "Tyramine (4-Hydroxyphenethylamine)",
            "Putrescine (1,4-Diaminobutane)",
            "Spermidine (N-Spermidine)",
            "Spermine (N-Spermine)",
            "Alanine (2-Aminopropanoic acid)",
            "Glycine (2-Aminoacetic acid)",
            "Valine (2-Amino-3-methylbutanoic acid)",
            "Leucine (2-Amino-4-methylpentanoic acid)",
            "Lysine (2,6-Diaminohexanoic acid)",
            "Arginine (2-Amino-5-(guanidino)pentanoic acid)",
            "Ornithine (2,5-Diaminopentanoic acid)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Aniline (C6H5NH2)",
                "2-Phenylethylamine (C8H11NH2)"
            ],
            "mismatches": [
                "Propylamine (C3H7NH2)",
                "Butylamine (C4H9NH2)",
                "Pentylamine (C5H11NH2)",
                "Hexylamine (C6H13NH2)",
                "Dopamine (3,4-Dihydroxyphenethylamine)",
                "Histamine (4-(1H-Imidazol-4-yl)ethanamine)",
                "Serotonin (5-Hydroxytryptamine)",
                "Tyramine (4-Hydroxyphenethylamine)",
                "Putrescine (1,4-Diaminobutane)",
                "Spermidine (N-Spermidine)",
                "Spermine (N-Spermine)",
                "Alanine (2-Aminopropanoic acid)",
                "Glycine (2-Aminoacetic acid)",
                "Valine (2-Amino-3-methylbutanoic acid)",
                "Leucine (2-Amino-4-methylpentanoic acid)",
                "Lysine (2,6-Diaminohexanoic acid)",
                "Arginine (2-Amino-5-(guanidino)pentanoic acid)",
                "Ornithine (2,5-Diaminopentanoic acid)"
            ],
            "true_referents": [
                "(R)-N-acetyl-1-phenylethylamine",
                "1,2-diamino-2-methylpropane",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-[3,4-bis[2-(dimethylamino)ethoxy]phenyl]ethanamine",
                "2-arylethylamine",
                "2-phenylethylamine",
                "3,4-dimethoxyphenylethylamine",
                "3-buten-1-amine",
                "4-(3-methylanilino)-4-oxobutanoic acid",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "4-hydroxymethamphetamine",
                "4-methoxytyramine",
                "Decylamine",
                "Dicyclohexylamine",
                "Heptylamine",
                "L-alanine 2-naphthylamide",
                "L-alanyl-L-alanine 2-naphthylamide",
                "L-alanyl-L-phenylalanyl-L-proline 2-naphthylamide",
                "L-glutamylglycine 2-naphthylamide",
                "L-glutamylglycyl-L-arginine 2-naphthylamide",
                "L-leucine 2-naphthylamide",
                "L-lysine 2-naphthylamide",
                "L-ornithine 2-naphthylamide",
                "N(5)-phenyl-L-glutamine",
                "N,N-Dimethylphenethylamine",
                "N-[(4-acetamidophenyl)methylideneamino]-2-cyclohexylacetamide",
                "N-benzoyl-D-arginine 2-naphthylamide",
                "N-benzoyl-L-leucine 2-naphthylamide",
                "Putrescine_d4",
                "alkylamine",
                "aniline",
                "benzylamine",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "cyclohexylamine",
                "cyclopropylamine",
                "ethylamine",
                "glycine 2-naphthylamide",
                "glycyl-L-phenylalanine 2-naphthylamide",
                "isopentylamine",
                "methamphetamine",
                "methylamine",
                "methylhexaneamine"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Pentylamine (C5H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Heptylamine (C7H15NH2)",
            "Octylamine (C8H17NH2)",
            "Nonylamine (C9H19NH2)",
            "Decylamine (C10H21NH2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Phenethylamine (C8H11N)",
            "Allylamine (C3H7NH2)",
            "Isopropylamine (C3H9N)",
            "Isobutylamine (C4H11N)",
            "Tert-butylamine (C4H11N)",
            "Ethanolamine (C2H7NO)",
            "Aminomethylpropane (C4H11N)",
            "Aminoethanol (C2H7NO)",
            "Aminopropanol (C3H9NO)",
            "1-Aminopentane (C5H13N)",
            "1-Aminohexane (C6H15N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Heptylamine (C7H15NH2)",
                "Decylamine (C10H21NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Allylamine (C3H7NH2)",
                "Isopropylamine (C3H9N)",
                "Tert-butylamine (C4H11N)",
                "Ethanolamine (C2H7NO)"
            ],
            "mismatches": [
                "Propylamine (C3H7NH2)",
                "Butylamine (C4H9NH2)",
                "Pentylamine (C5H11NH2)",
                "Hexylamine (C6H13NH2)",
                "Octylamine (C8H17NH2)",
                "Nonylamine (C9H19NH2)",
                "Phenethylamine (C8H11N)",
                "Isobutylamine (C4H11N)",
                "Aminomethylpropane (C4H11N)",
                "Aminoethanol (C2H7NO)",
                "Aminopropanol (C3H9NO)",
                "1-Aminopentane (C5H13N)",
                "1-Aminohexane (C6H15N)"
            ],
            "true_referents": [
                "(R)-N-acetyl-1-phenylethylamine",
                "1,2-diamino-2-methylpropane",
                "1-Hexadecylamine",
                "1-aminopentadecane",
                "1-hexanamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-diethylaminoethanol",
                "2-isopropylaminoethylamine",
                "2-phenylethylamine",
                "3-(2-aminoethyl)benzene-1,2-diol",
                "3-aminopropan-1-ol",
                "3-buten-1-amine",
                "4-(2-aminoethyl)benzene-1,3-diol",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "Allylamine",
                "Decylamine",
                "Dicyclohexylamine",
                "Heptylamine",
                "N(1)-isopropyl-2-methylpropan-1,2-diamine",
                "N,N-Dimethylphenethylamine",
                "N-(3-aminopropyl)-4-aminobutanal",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(octanoyl)ethanolamine",
                "alkylamine",
                "aniline",
                "benzylamine",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "cyclohexylamine",
                "ethanolamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "methylhexaneamine",
                "pentan-1-amine",
                "pentan-3-amine",
                "phenylethylamine",
                "tert-butylamine"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (C1)",
            "Ethylamine (C2)",
            "Propylamine (C3)",
            "Butylamine (C4)",
            "Isopropylamine (C5)",
            "Cyclohexylamine (C6)",
            "Benzylamine (C7)",
            "Aniline (C8)",
            "Phenethylamine (C9)",
            "2-Aminopropane (C10)",
            "3-Aminobutane (C11)",
            "4-Aminobutane (C12)",
            "2-Amino-1-butanol (C13)",
            "Octylamine (C14)",
            "Dodecylamine (C15)",
            "2-Aminobutane (C16)",
            "N-Methyl-1-aminopropane (C17)",
            "N-Ethyl-1-aminobutane (C18)",
            "N-Propyl-2-aminopropane (C19)",
            "N-Benzyl-2-aminopropane (C20)",
            "2-Amino-1-pentanol (C21)",
            "1-Aminocyclohexane (C22)",
            "N,N-Dimethylamine (C23)",
            "N-Butyl-2-aminobutane (C24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (C1)",
                "Ethylamine (C2)",
                "Isopropylamine (C5)",
                "Cyclohexylamine (C6)",
                "Benzylamine (C7)",
                "Aniline (C8)",
                "Dodecylamine (C15)"
            ],
            "mismatches": [
                "Propylamine (C3)",
                "Butylamine (C4)",
                "Phenethylamine (C9)",
                "2-Aminopropane (C10)",
                "3-Aminobutane (C11)",
                "4-Aminobutane (C12)",
                "2-Amino-1-butanol (C13)",
                "Octylamine (C14)",
                "2-Aminobutane (C16)",
                "N-Methyl-1-aminopropane (C17)",
                "N-Ethyl-1-aminobutane (C18)",
                "N-Propyl-2-aminopropane (C19)",
                "N-Benzyl-2-aminopropane (C20)",
                "2-Amino-1-pentanol (C21)",
                "1-Aminocyclohexane (C22)",
                "N,N-Dimethylamine (C23)",
                "N-Butyl-2-aminobutane (C24)"
            ],
            "true_referents": [
                "1,2-diamino-2-methylpropane",
                "1-aminopentadecane",
                "1-phenylethylamine",
                "1-phenylpropan-2-amine",
                "2,4-dimethylpentan-3-amine",
                "2-isopropylaminoethylamine",
                "2-methylbutan-2-amine",
                "2-naphthylamine",
                "2-phenylethylamine",
                "3-(2-aminoethyl)benzene-1,2-diol",
                "3-[(4-aminobutyl)amino]propanal",
                "3-aminopropan-1-ol",
                "3-buten-1-amine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "Decylamine",
                "Dicyclohexylamine",
                "N(1)-isopropyl-2-methylpropan-1,2-diamine",
                "N,N-Dimethylphenethylamine",
                "N-(3-aminopropyl)-4-aminobutanal",
                "N-(butanoyl)ethanolamine",
                "N-(dodecanoyl)ethanolamine",
                "N-methylbutan-2-amine",
                "alkylamine",
                "aniline",
                "benzylamine",
                "benzylpenicilloyl-benzylamine",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "cyclohexylamine",
                "dodecylamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "octan-1-amine",
                "pentan-1-amine",
                "phenylethylamine",
                "primary arylamine",
                "tert-butylamine"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H7N)",
            "Propylamine (C3H9N)",
            "Isopropylamine (C3H9N)",
            "Butylamine (C4H11N)",
            "Isobutylamine (C4H11N)",
            "Sec-Butylamine (C4H11N)",
            "Tert-Butylamine (C4H11N)",
            "Pentylamine (C5H13N)",
            "Hexylamine (C6H15N)",
            "Heptylamine (C7H17N)",
            "Octylamine (C8H19N)",
            "Nonylamine (C9H21N)",
            "Decylamine (C10H23N)",
            "Undecylamine (C11H25N)",
            "Dodecylamine (C12H27N)",
            "Tridecylamine (C13H29N)",
            "Tetradecylamine (C14H31N)",
            "Pentadecylamine (C15H33N)",
            "Hexadecylamine (C16H35N)",
            "Heptadecylamine (C17H37N)",
            "Octadecylamine (C18H39N)",
            "Nonadecylamine (C19H41N)",
            "Eicosylamine (C20H43N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H7N)",
                "Isopropylamine (C3H9N)",
                "Sec-Butylamine (C4H11N)",
                "Tert-Butylamine (C4H11N)",
                "Heptylamine (C7H17N)",
                "Decylamine (C10H23N)",
                "Dodecylamine (C12H27N)",
                "Tetradecylamine (C14H31N)"
            ],
            "mismatches": [
                "Propylamine (C3H9N)",
                "Butylamine (C4H11N)",
                "Isobutylamine (C4H11N)",
                "Pentylamine (C5H13N)",
                "Hexylamine (C6H15N)",
                "Octylamine (C8H19N)",
                "Nonylamine (C9H21N)",
                "Undecylamine (C11H25N)",
                "Tridecylamine (C13H29N)",
                "Pentadecylamine (C15H33N)",
                "Hexadecylamine (C16H35N)",
                "Heptadecylamine (C17H37N)",
                "Octadecylamine (C18H39N)",
                "Nonadecylamine (C19H41N)",
                "Eicosylamine (C20H43N)"
            ],
            "true_referents": [
                "1-Hexadecylamine",
                "1-hexanamine",
                "1-naphthylamine",
                "2,4,4-trimethyl-2-Pentanamine",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-isopropylaminoethylamine",
                "3,4-dimethoxyphenylethylamine",
                "3-buten-1-amine",
                "4-(aminomethyl)octane-1,8-diamine",
                "Decylamine",
                "Heptylamine",
                "N,N-Dimethylphenethylamine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(decanoyl)ethanolamine",
                "N-(dodecanoyl)ethanolamine",
                "N-(octanoyl)ethanolamine",
                "N-[(5Z,8Z,11Z)-14,15-epoxyicosatrienoyl]ethanolamine",
                "Pentadecanoyl-EA",
                "Tetradecylamine",
                "alkylamine",
                "benzylamine",
                "butan-1-amine",
                "dodecylamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "methylhexaneamine",
                "octan-1-amine",
                "pentan-1-amine",
                "sec-butylamine",
                "tert-butylamine"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Pentylamine (C5H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Heptylamine (C7H15NH2)",
            "Octylamine (C8H17NH2)",
            "Nonylamine (C9H19NH2)",
            "Decylamine (C10H21NH2)",
            "Undecylamine (C11H23NH2)",
            "Dodecylamine (C12H25NH2)",
            "Tridecylamine (C13H27NH2)",
            "Tetradecylamine (C14H29NH2)",
            "Pentadecylamine (C15H31NH2)",
            "Hexadecylamine (C16H33NH2)",
            "Heptadecylamine (C17H35NH2)",
            "Octadecylamine (C18H37NH2)",
            "Nonadecylamine (C19H39NH2)",
            "Eicosylamine (C20H41NH2)",
            "Docosylamine (C22H45NH2)",
            "Tetracosylamine (C24H49NH2)",
            "Tripropylamine (C9H21N)",
            "Diethylmethylamine (C5H13N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Heptylamine (C7H15NH2)",
                "Decylamine (C10H21NH2)",
                "Dodecylamine (C12H25NH2)",
                "Tetradecylamine (C14H29NH2)",
                "Hexadecylamine (C16H33NH2)"
            ],
            "mismatches": [
                "Propylamine (C3H7NH2)",
                "Butylamine (C4H9NH2)",
                "Pentylamine (C5H11NH2)",
                "Hexylamine (C6H13NH2)",
                "Octylamine (C8H17NH2)",
                "Nonylamine (C9H19NH2)",
                "Undecylamine (C11H23NH2)",
                "Tridecylamine (C13H27NH2)",
                "Pentadecylamine (C15H31NH2)",
                "Heptadecylamine (C17H35NH2)",
                "Octadecylamine (C18H37NH2)",
                "Nonadecylamine (C19H39NH2)",
                "Eicosylamine (C20H41NH2)",
                "Docosylamine (C22H45NH2)",
                "Tetracosylamine (C24H49NH2)",
                "Tripropylamine (C9H21N)",
                "Diethylmethylamine (C5H13N)"
            ],
            "true_referents": [
                "(R)-N-acetyl-1-phenylethylamine",
                "(S)-N-acetyl-1-phenylethylamine",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,4,4-trimethyl-2-Pentanamine",
                "2,4-dimethylpentan-3-amine",
                "3,4-dimethoxyphenylethylamine",
                "3-buten-1-amine",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-Propylcyclohexylamine",
                "Decylamine",
                "Heptylamine",
                "N,N-Dimethylphenethylamine",
                "N-(15Z-tetracosenoyl)ethanolamine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(alpha-L-glutamyl)-2-naphthylamine",
                "N-(docosanoyl)ethanolamine",
                "N-(dodecanoyl)ethanolamine",
                "N-(octanoyl)ethanolamine",
                "Tetradecylamine",
                "alkylamine",
                "benzylamine",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "dodecylamine",
                "ethylamine",
                "isopentylamine",
                "methylamine",
                "methylhexaneamine",
                "tert-butylamine"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "n-Butylamine (C4H9NH2)",
            "sec-Butylamine",
            "n-Pentylamine (C5H11NH2)",
            "iso-Pentylamine",
            "Benzylamine (C6H5CH2NH2)",
            "Aniline (C6H5NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Allylamine (CH2=CHCH2NH2)",
            "Propargylamine (HC\u2261CCH2NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Heptylamine (C7H15NH2)",
            "Octylamine (C8H17NH2)",
            "Nonylamine (C9H19NH2)",
            "Decylamine (C10H21NH2)",
            "Ethanolamine (2-Aminoethanol)",
            "3-Aminopropanol",
            "Beta-Alanine (3-Aminopropanoic acid)",
            "Vinylamine (H2C=CHNH2)",
            "N-Propylamine",
            "Isobutylamine ((CH3)2CHCH2NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "sec-Butylamine",
                "iso-Pentylamine",
                "Benzylamine (C6H5CH2NH2)",
                "Aniline (C6H5NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Allylamine (CH2=CHCH2NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Heptylamine (C7H15NH2)",
                "Decylamine (C10H21NH2)",
                "Ethanolamine (2-Aminoethanol)",
                "3-Aminopropanol"
            ],
            "mismatches": [
                "Propylamine (C3H7NH2)",
                "n-Butylamine (C4H9NH2)",
                "n-Pentylamine (C5H11NH2)",
                "Propargylamine (HC\u2261CCH2NH2)",
                "Hexylamine (C6H13NH2)",
                "Octylamine (C8H17NH2)",
                "Nonylamine (C9H19NH2)",
                "Beta-Alanine (3-Aminopropanoic acid)",
                "Vinylamine (H2C=CHNH2)",
                "N-Propylamine",
                "Isobutylamine ((CH3)2CHCH2NH2)"
            ],
            "true_referents": [
                "(R)-N-acetyl-1-phenylethylamine",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-isopropylaminoethylamine",
                "2-phenylethylamine",
                "3-[(4-aminobutyl)amino]propanal",
                "3-aminopropan-1-ol",
                "3-buten-1-amine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "Allylamine",
                "Decylamine",
                "Dicyclohexylamine",
                "Heptylamine",
                "N,N-Dimethylphenethylamine",
                "N-(3-aminopropyl)-4-aminobutanal",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(decanoyl)ethanolamine",
                "N-(octanoyl)ethanolamine",
                "alkylamine",
                "aniline",
                "benzylamine",
                "beta-alanine 2-naphthylamide",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "cyclohexylamine",
                "ethanolamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "methylhexaneamine",
                "phenylethylamine",
                "sec-butylamine"
            ],
            "TP": 14,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Ethanolamine (HOCH2CH2NH2)",
            "Glycine (H2NCH2COOH)",
            "Lysine (C6H14N2O2)",
            "Putrescine (NH2(CH2)4NH2)",
            "Cadaverine (NH2(CH2)5NH2)",
            "Tryptamine (C10H12N2)",
            "Dopamine (C8H11NO2)",
            "Serotonin (C10H12N2O)",
            "Histamine (C5H9N3)",
            "Tyramine (C8H11NO)",
            "Phenethylamine (C8H11N)",
            "Cyclohexylamine (C6H11NH2)",
            "Allylamine (C3H5NH2)",
            "Glucosamine (C6H13NO5)",
            "Taurine (C2H7NO3S)",
            "Octopamine (C8H11NO2)",
            "Norepinephrine (C8H11NO3)",
            "Cysteamine (HSCH2CH2NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Ethanolamine (HOCH2CH2NH2)",
                "Putrescine (NH2(CH2)4NH2)",
                "Phenethylamine (C8H11N)",
                "Cyclohexylamine (C6H11NH2)",
                "Allylamine (C3H5NH2)",
                "Cysteamine (HSCH2CH2NH2)"
            ],
            "mismatches": [
                "Propylamine (C3H7NH2)",
                "Butylamine (C4H9NH2)",
                "Glycine (H2NCH2COOH)",
                "Lysine (C6H14N2O2)",
                "Cadaverine (NH2(CH2)5NH2)",
                "Tryptamine (C10H12N2)",
                "Dopamine (C8H11NO2)",
                "Serotonin (C10H12N2O)",
                "Histamine (C5H9N3)",
                "Tyramine (C8H11NO)",
                "Glucosamine (C6H13NO5)",
                "Taurine (C2H7NO3S)",
                "Octopamine (C8H11NO2)",
                "Norepinephrine (C8H11NO3)"
            ],
            "true_referents": [
                "(1R)-1-phenylethanamine",
                "(1R,2S)-tranylcypromine",
                "(1S)-1-phenylethanamine",
                "(1S,2R)-tranylcypromine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-hydroxy-5-[(1E)-(2-phenylethylidene)amino]-L-tyrosine",
                "2-phenylethylamine",
                "3,4-dimethoxyphenylethylamine",
                "3-buten-1-amine",
                "3-methoxytyramine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-Propylcyclohexylamine",
                "4-hydroxymethamphetamine",
                "4-methoxytyramine",
                "4-tert-butyl-N-[2-(2-methoxyphenyl)ethyl]-1-cyclohexanamine",
                "Allylamine",
                "Dicyclohexylamine",
                "L-lysine 2-naphthylamide",
                "L-tryptophan 2-naphthylamide",
                "N,N-Dimethylphenethylamine",
                "N-(15Z-tetracosenoyl)ethanolamine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(decanoyl)ethanolamine",
                "Putrescine_d4",
                "alkylamine",
                "aniline",
                "benzylamine",
                "beta-D-Manp-(1->2)-beta-D-Manp-(1->2)-alpha-D-Manp-O[CH2]2NH2",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "cyclohexylamine",
                "cyclopropylamine",
                "cystamine",
                "cysteamine",
                "cysteamine S-phosphate",
                "dodecylamine",
                "ethanolamine",
                "ethylamine",
                "glycine 2-naphthylamide",
                "glycyl-L-phenylalanine 2-naphthylamide",
                "glycyl-L-tryptophan 2-naphthylamide",
                "methylamine",
                "octan-1-amine",
                "phenylethylamine"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MA)",
            "Ethylamine",
            "Propylamine",
            "Butylamine",
            "Pentylamine",
            "Hexylamine",
            "Heptylamine",
            "Octylamine",
            "Nonylamine",
            "Decylamine",
            "Isopropylamine",
            "Isobutylamine",
            "sec-Butylamine",
            "tert-Butylamine",
            "Cyclopropylamine",
            "Cyclobutylamine",
            "Cyclopentylamine",
            "Cyclohexylamine",
            "Allylamine",
            "Propargylamine",
            "Benzylamine",
            "Phenethylamine",
            "Dopamine",
            "Serotonin (5-HT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MA)",
                "Ethylamine",
                "Heptylamine",
                "Decylamine",
                "Isopropylamine",
                "sec-Butylamine",
                "tert-Butylamine",
                "Cyclopropylamine",
                "Cyclohexylamine",
                "Allylamine",
                "Benzylamine"
            ],
            "mismatches": [
                "Propylamine",
                "Butylamine",
                "Pentylamine",
                "Hexylamine",
                "Octylamine",
                "Nonylamine",
                "Isobutylamine",
                "Cyclobutylamine",
                "Cyclopentylamine",
                "Propargylamine",
                "Phenethylamine",
                "Dopamine",
                "Serotonin (5-HT)"
            ],
            "true_referents": [
                "(R)-amphetamine",
                "1-(1-phenylcyclopentyl)methylamine",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-isopropylaminoethylamine",
                "2-phenylethylamine",
                "3-buten-1-amine",
                "4-Propylcyclohexylamine",
                "Allylamine",
                "Decylamine",
                "Dicyclohexylamine",
                "Heptylamine",
                "Mecamylamine",
                "Phenelzine",
                "Tetradecylamine",
                "alkylamine",
                "benzylamine",
                "butan-1-amine",
                "cyclohexylamine",
                "cyclopropylamine",
                "dodecylamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methamphetamine",
                "methylamine",
                "methylhexaneamine",
                "octan-1-amine",
                "phenylethylamine",
                "primary arylamine",
                "sec-butylamine",
                "tert-butylamine"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (CH3CH2NH2)",
            "Propylamine (CH3CH2CH2NH2)",
            "Butylamine (CH3(CH2)3NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Isobutylamine ((CH3)2CHCH2NH2)",
            "tert-Butylamine ((CH3)3CNH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Aniline (C6H5NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Ethanolamine (HOCH2CH2NH2)",
            "Histamine (C5H9N3)",
            "Tryptamine (C10H12N2)",
            "Serotonin (C10H12N2O)",
            "Dopamine (C8H11NO2)",
            "Norepinephrine (C8H11NO3)",
            "Epinephrine (C9H13NO3)",
            "Putrescine (NH2(CH2)4NH2)",
            "Cadaverine (NH2(CH2)5NH2)",
            "Spermidine (NH2(CH2)4NH(CH2)3NH2)",
            "Spermine (NH2(CH2)3NH(CH2)4NH(CH2)3NH2)",
            "Glucosamine (C6H13NO5)",
            "Galactosamine (C6H13NO5)",
            "Creatine (C4H9N3O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (CH3CH2NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "tert-Butylamine ((CH3)3CNH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Aniline (C6H5NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Ethanolamine (HOCH2CH2NH2)",
                "Putrescine (NH2(CH2)4NH2)"
            ],
            "mismatches": [
                "Propylamine (CH3CH2CH2NH2)",
                "Butylamine (CH3(CH2)3NH2)",
                "Isobutylamine ((CH3)2CHCH2NH2)",
                "Histamine (C5H9N3)",
                "Tryptamine (C10H12N2)",
                "Serotonin (C10H12N2O)",
                "Dopamine (C8H11NO2)",
                "Norepinephrine (C8H11NO3)",
                "Epinephrine (C9H13NO3)",
                "Cadaverine (NH2(CH2)5NH2)",
                "Spermidine (NH2(CH2)4NH(CH2)3NH2)",
                "Spermine (NH2(CH2)3NH(CH2)4NH(CH2)3NH2)",
                "Glucosamine (C6H13NO5)",
                "Galactosamine (C6H13NO5)",
                "Creatine (C4H9N3O2)"
            ],
            "true_referents": [
                "(1R)-1-phenylethanamine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "1-phenylethylamine",
                "2,4,4-trimethyl-2-Pentanamine",
                "2,4-dimethylpentan-3-amine",
                "2-Methylbutylamine",
                "2-[[4-(dimethylamino)phenyl]methylideneamino]oxy-N-(4-methylphenyl)acetamide",
                "2-isopropylaminoethylamine",
                "3,4-dimethoxyphenylethylamine",
                "3-buten-1-amine",
                "4-(4-nitrophenylazo)aniline",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-(phenylazo)aniline",
                "4-hydroxymethamphetamine",
                "4-methyl-3-penten-1-amine",
                "4-tert-butyl-N-[2-(2-methoxyphenyl)ethyl]-1-cyclohexanamine",
                "Dicyclohexylamine",
                "L-tryptophan 2-naphthylamide",
                "N,N-Dimethylphenethylamine",
                "N-(15Z-tetracosenoyl)ethanolamine",
                "N-(2-hydroxyethyl)docosa-7,10,13,16-tetraenamide",
                "N-(decanoyl)ethanolamine",
                "Putrescine_d4",
                "alkylamine",
                "aniline",
                "benzylamine",
                "beta-D-Manp-(1->2)-beta-D-Manp-(1->2)-alpha-D-Manp-O[CH2]2NH2",
                "butan-1-amine",
                "cyclohexane-1,2-diamine",
                "cyclohexylamine",
                "cyclopropylamine",
                "dodecylamine",
                "ethanolamine",
                "ethylamine",
                "isopentylamine",
                "isopropylamine",
                "methylamine",
                "methylhexaneamine",
                "tert-butylamine"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H7N)",
            "Propylamine (C3H9N)",
            "Butylamine (C4H11N)",
            "Pentylamine (C5H13N)",
            "Hexylamine (C6H15N)",
            "Heptylamine (C7H17N)",
            "Octylamine (C8H19N)",
            "Nonylamine (C9H21N)",
            "Decylamine (C10H23N)",
            "Benzylamine (C6H5CH2NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Tryptamine (C10H12N2)",
            "Dopamine (C6H3(OH)2CH2NH2)",
            "Histamine (C5H9N3)",
            "Serotonin (C10H12N2O)",
            "Tyramine (C6H5CH2CH2NH2)",
            "Putrescine (H2N(CH2)4NH2)",
            "Cadaverine (H2N(CH2)5NH2)",
            "Spermidine (H2N(CH2)3NH(CH2)4NH2)",
            "Spermine (H2N(CH2)3NH(CH2)4NH(CH2)3NH2)",
            "Ethanolamine (C2H7NO)",
            "Choline (C5H14NO)",
            "Glucosamine (C6H13NO5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H7N)",
                "Heptylamine (C7H17N)",
                "Decylamine (C10H23N)",
                "Benzylamine (C6H5CH2NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Putrescine (H2N(CH2)4NH2)",
                "Ethanolamine (C2H7NO)"
            ],
            "mismatches": [
                "Propylamine (C3H9N)",
                "Butylamine (C4H11N)",
                "Pentylamine (C5H13N)",
                "Hexylamine (C6H15N)",
                "Octylamine (C8H19N)",
                "Nonylamine (C9H21N)",
                "Tryptamine (C10H12N2)",
                "Dopamine (C6H3(OH)2CH2NH2)",
                "Histamine (C5H9N3)",
                "Serotonin (C10H12N2O)",
                "Tyramine (C6H5CH2CH2NH2)",
                "Cadaverine (H2N(CH2)5NH2)",
                "Spermidine (H2N(CH2)3NH(CH2)4NH2)",
                "Spermine (H2N(CH2)3NH(CH2)4NH(CH2)3NH2)",
                "Choline (C5H14NO)",
                "Glucosamine (C6H13NO5)"
            ],
            "true_referents": [
                "(1R)-1-phenylethanamine",
                "(1R,2S)-tranylcypromine",
                "(1S,2R)-tranylcypromine",
                "1-Hexadecylamine",
                "1-hexanamine",
                "1-naphthylamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-[[4-(dimethylamino)phenyl]methylideneamino]oxy-N-(4-methylphenyl)acetamide",
                "2-phenylethylamine",
                "3-buten-1-amine",
                "4-(aminomethyl)octane-1,8-diamine",
                "4-hydroxymethamphetamine",
                "Decylamine",
                "Heptylamine",
                "L-tryptophan 2-naphthylamide",
                "N,N-Dimethylphenethylamine",
                "N-(15Z-tetracosenoyl)ethanolamine",
                "N-(20-hydroxyarachidonoyl)ethanolamine",
                "N-(alpha-L-aspartyl)-2-naphthylamine",
                "N-(decanoyl)ethanolamine",
                "N-(octanoyl)ethanolamine",
                "N-(saturated fatty acyl)ethanolamine",
                "Putrescine_d4",
                "alkylamine",
                "benzylamine",
                "butan-1-amine",
                "dodecylamine",
                "ethanolamine",
                "ethylamine",
                "isopentylamine",
                "methylamine",
                "methylhexaneamine",
                "octan-1-amine",
                "pentan-1-amine",
                "phenylethylamine",
                "tert-butylamine"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Morphine (MOR)",
            "Codeine",
            "Pethidine",
            "Amphetamine",
            "Methamphetamine",
            "Ephedrine",
            "Norephedrine",
            "Pseudoephedrine",
            "Phenylephrine",
            "Tyramine",
            "Octopamine",
            "Synephrine",
            "Norepinephrine",
            "Epinephrine",
            "Dopamine",
            "Serotonin",
            "Tyrosine",
            "Tryptophan",
            "Histamine",
            "Adrenaline",
            "Noradrenaline",
            "Dopexamine",
            "Amiloride",
            "Minoxidil",
            "Captopril",
            "Enalapril"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methamphetamine"
            ],
            "mismatches": [
                "Morphine (MOR)",
                "Codeine",
                "Pethidine",
                "Amphetamine",
                "Ephedrine",
                "Norephedrine",
                "Pseudoephedrine",
                "Phenylephrine",
                "Tyramine",
                "Octopamine",
                "Synephrine",
                "Norepinephrine",
                "Epinephrine",
                "Dopamine",
                "Serotonin",
                "Tyrosine",
                "Tryptophan",
                "Histamine",
                "Adrenaline",
                "Noradrenaline",
                "Dopexamine",
                "Amiloride",
                "Minoxidil",
                "Captopril",
                "Enalapril"
            ],
            "true_referents": [
                "(1R)-1-phenylethanamine",
                "(1S)-1-phenylethanamine",
                "(R)-amphetamine",
                "(S)-(+)-4-(5-carboxypentyl)methamphetamine",
                "(S)-amphetamine",
                "1-phenylethylamine",
                "2-hydroxy-5-[(1E)-(2-phenylethylidene)amino]-L-tyrosine",
                "3,4-dimethoxyphenylethylamine",
                "4-hydroxymethamphetamine",
                "Albidopyrone",
                "Decylamine",
                "Heptylamine",
                "L-tryptophan 2-naphthylamide",
                "L-tyrosine 2-naphthylamide",
                "N-acylethanolamine",
                "N-gondoylethanolamine",
                "Phenelzine",
                "Ritodrine hydrochloride",
                "alkylamine",
                "amantadine",
                "benodanil",
                "benzylamine",
                "clenbuterol",
                "cyclohexylamine",
                "cyclopropylamine",
                "ethylamine",
                "fentanyl",
                "glycyl-L-tryptophan 2-naphthylamide",
                "hydroxyflutamide",
                "isopropylamine",
                "memantine",
                "methamphetamine",
                "naphthylamine",
                "phenacetin",
                "phentermine",
                "phenylethylamine",
                "remifentanil"
            ],
            "TP": 1,
            "FP": 25,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MEA)",
            "Ethylamine (ETAM)",
            "Phenethylamine (PEA)",
            "Tyramine (TYR)",
            "Trypanothione",
            "Amphetamine (AMP)",
            "Methamphetamine (METH)",
            "Phenylethylamine (PEA)",
            "Noradrenaline (NOR)",
            "Dopamine (DA)",
            "Adrenaline (AD)",
            "Serotonin (5-HT)",
            "Melatonin (MLT)",
            "Tyrosine",
            "Tryptamine (TRP)",
            "5-Hydroxytryptophan (5-Hydroxy-L-tryptophan)",
            "Glucosamine (D-Glucosamine)",
            "Galactosamine (D-Galactosamine)",
            "Spermidine",
            "Spermine",
            "Putrescine",
            "Cadaverine",
            "Histamine (H1)",
            "Agmatine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MEA)",
                "Ethylamine (ETAM)",
                "Methamphetamine (METH)",
                "Phenylethylamine (PEA)"
            ],
            "mismatches": [
                "Phenethylamine (PEA)",
                "Tyramine (TYR)",
                "Trypanothione",
                "Amphetamine (AMP)",
                "Noradrenaline (NOR)",
                "Dopamine (DA)",
                "Adrenaline (AD)",
                "Serotonin (5-HT)",
                "Melatonin (MLT)",
                "Tyrosine",
                "Tryptamine (TRP)",
                "5-Hydroxytryptophan (5-Hydroxy-L-tryptophan)",
                "Glucosamine (D-Glucosamine)",
                "Galactosamine (D-Galactosamine)",
                "Spermidine",
                "Spermine",
                "Putrescine",
                "Cadaverine",
                "Histamine (H1)",
                "Agmatine"
            ],
            "true_referents": [
                "(R)-amphetamine",
                "(S)-(+)-4-(5-carboxypentyl)methamphetamine",
                "(S)-amphetamine",
                "1-Hexadecylamine",
                "1-phenylethylamine",
                "2,4-dimethylpentan-3-amine",
                "2-hydroxy-5-[(1E)-(2-phenylethylidene)amino]-L-tyrosine",
                "2-phenylethylamine",
                "3-methoxytyramine",
                "4-methoxytyramine",
                "4-methyl-3-penten-1-amine",
                "Decylamine",
                "L-tryptophan 2-naphthylamide",
                "L-tyrosine 2-naphthylamide",
                "N-(2-hydroxyethyl)docosa-7,10,13,16-tetraenamide",
                "N-acylethanolamine",
                "Noralfentanil",
                "Phenelzine",
                "Putrescine_d4",
                "alkylamine",
                "benzylamine",
                "butan-1-amine",
                "candicine",
                "cyclopropylamine",
                "cysteamine",
                "diethanolamine",
                "dodecylamine",
                "etanidazole",
                "ethanolamine",
                "ethylamine",
                "glycyl-L-tryptophan 2-naphthylamide",
                "kitastatin 1",
                "lamotrigine",
                "methamphetamine",
                "methylamine",
                "norfentanyl",
                "phenylethylamine",
                "tert-butylamine"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "primary amine",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "methylamine",
                "Canonical Name": "methylamine"
            },
            {
                "Referent": "dimethylamine",
                "Canonical Name": "dimethylamine"
            },
            {
                "Referent": "trimethylamine",
                "Canonical Name": "trimethylamine"
            },
            {
                "Referent": "ethanamine",
                "Canonical Name": "ethanamine"
            },
            {
                "Referent": "propan-1-amine",
                "Canonical Name": "propan-1-amine"
            },
            {
                "Referent": "propan-2-amine",
                "Canonical Name": "propan-2-amine"
            },
            {
                "Referent": "propan-3-amine",
                "Canonical Name": "propan-3-amine"
            },
            {
                "Referent": "butan-1-amine",
                "Canonical Name": "butan-1-amine"
            },
            {
                "Referent": "butan-2-amine",
                "Canonical Name": "butan-2-amine"
            },
            {
                "Referent": "butan-3-amine",
                "Canonical Name": "butan-3-amine"
            },
            {
                "Referent": "pentan-1-amine",
                "Canonical Name": "pentan-1-amine"
            },
            {
                "Referent": "pentan-2-amine",
                "Canonical Name": "pentan-2-amine"
            },
            {
                "Referent": "pentan-3-amine",
                "Canonical Name": "pentan-3-amine"
            },
            {
                "Referent": "hexan-1-amine",
                "Canonical Name": "hexan-1-amine"
            },
            {
                "Referent": "hexan-2-amine",
                "Canonical Name": "hexan-2-amine"
            },
            {
                "Referent": "hexan-3-amine",
                "Canonical Name": "hexan-3-amine"
            },
            {
                "Referent": "heptan-1-amine",
                "Canonical Name": "heptan-1-amine"
            },
            {
                "Referent": "heptan-2-amine",
                "Canonical Name": "heptan-2-amine"
            },
            {
                "Referent": "heptan-3-amine",
                "Canonical Name": "heptan-3-amine"
            },
            {
                "Referent": "octan-1-amine",
                "Canonical Name": "octan-1-amine"
            },
            {
                "Referent": "octan-2-amine",
                "Canonical Name": "octan-2-amine"
            },
            {
                "Referent": "octan-3-amine",
                "Canonical Name": "octan-3-amine"
            },
            {
                "Referent": "nonan-1-amine",
                "Canonical Name": "nonan-1-amine"
            },
            {
                "Referent": "nonan-2-amine",
                "Canonical Name": "nonan-2-amine"
            },
            {
                "Referent": "nonan-3-amine",
                "Canonical Name": "nonan-3-amine"
            },
            {
                "Referent": "decane-1-amine",
                "Canonical Name": "decane-1-amine"
            },
            {
                "Referent": "decane-2-amine",
                "Canonical Name": "decane-2-amine"
            },
            {
                "Referent": "decane-3-amine",
                "Canonical Name": "decane-3-amine"
            },
            {
                "Referent": "undecane-1-amine",
                "Canonical Name": "undecane-1-amine"
            },
            {
                "Referent": "undecane-2-amine",
                "Canonical Name": "undecane-2-amine"
            },
            {
                "Referent": "undecane-3-amine",
                "Canonical Name": "undecane-3-amine"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methylamine",
                "butan-1-amine",
                "pentan-1-amine",
                "pentan-3-amine",
                "octan-1-amine"
            ],
            "mismatches": [
                "dimethylamine",
                "trimethylamine",
                "ethanamine",
                "propan-1-amine",
                "propan-2-amine",
                "propan-3-amine",
                "butan-2-amine",
                "butan-3-amine",
                "hexan-1-amine",
                "hexan-2-amine",
                "hexan-3-amine",
                "heptan-1-amine",
                "heptan-2-amine",
                "heptan-3-amine",
                "octan-2-amine",
                "octan-3-amine",
                "nonan-1-amine",
                "nonan-2-amine",
                "nonan-3-amine",
                "decane-1-amine",
                "decane-2-amine",
                "decane-3-amine",
                "undecane-1-amine",
                "undecane-2-amine",
                "undecane-3-amine"
            ],
            "true_referents": [
                "(+/-)5(6)-EET Ethanolamide",
                "1-(1-adamantyl)ethanamine",
                "1-Hexadecylamine",
                "1-hexanamine",
                "2,4-dimethylpentan-3-amine",
                "2-hexanamine",
                "3-(2-ethylhexoxy)propan-1-amine",
                "3-buten-1-amine",
                "N,N-Dimethylphenethylamine",
                "alkylamine",
                "butan-1-amine",
                "ethylamine",
                "methylamine",
                "methylhexaneamine",
                "octan-1-amine",
                "pentan-1-amine",
                "pentan-3-amine"
            ],
            "TP": 5,
            "FP": 25,
            "FN": 0
        }
    }
]