[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Propylamine (C3H7NH2)",
            "Butylamine (C4H9NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Sec-butylamine ((CH3)2CHCH2NH2)",
            "Tert-butylamine ((CH3)3CNH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Aniline (C6H5NH2)",
            "Morpholine (C4H7NO)",
            "Pyrrolidine (C4H7N)",
            "Piperidine (C5H9N)",
            "Trimethylamine ((CH3)3N)",
            "Triethylamine ((C2H5)3N)",
            "Dimethylamine (CH3)2NH",
            "Diethylamine (C2H5)2NH",
            "Ethanolamine (C2H5CH2NH2)",
            "Isopropanolamine (C3H7CH2NH2)",
            "2-Phenylethylamine (C6H5CH2CH2NH2)",
            "N-Methylpiperidine (C5H11N)",
            "N-Ethylpiperidine (C6H13N)",
            "N,N-Dimethylbenzylamine (C8H13N)",
            "N-Methylmorpholine (C5H11NO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Propylamine (C3H7NH2)",
                "Butylamine (C4H9NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Sec-butylamine ((CH3)2CHCH2NH2)",
                "Tert-butylamine ((CH3)3CNH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Aniline (C6H5NH2)",
                "Morpholine (C4H7NO)",
                "Pyrrolidine (C4H7N)",
                "Piperidine (C5H9N)",
                "Trimethylamine ((CH3)3N)",
                "Triethylamine ((C2H5)3N)",
                "Dimethylamine (CH3)2NH)",
                "Diethylamine (C2H5)2NH)",
                "Ethanolamine (C2H5CH2NH2)",
                "Isopropanolamine (C3H7CH2NH2)",
                "2-Phenylethylamine (C6H5CH2CH2NH2)",
                "N-Methylpiperidine (C5H11N)",
                "N-Ethylpiperidine (C6H13N)",
                "N,N-Dimethylbenzylamine (C8H13N)",
                "N-Methylmorpholine (C5H11NO)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Phenylethylamine (C6H5CH2CH2NH2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Butylamine (C4H9NH2)",
                "Diethylamine (C2H5)2NH",
                "Dimethylamine (CH3)2NH",
                "Ethanolamine (C2H5CH2NH2)",
                "Ethylamine (C2H5NH2)",
                "Isopropanolamine (C3H7CH2NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Methylamine (CH3NH2)",
                "Morpholine (C4H7NO)",
                "N,N-Dimethylbenzylamine (C8H13N)",
                "N-Ethylpiperidine (C6H13N)",
                "N-Methylmorpholine (C5H11NO)",
                "N-Methylpiperidine (C5H11N)",
                "Piperidine (C5H9N)",
                "Propylamine (C3H7NH2)",
                "Pyrrolidine (C4H7N)",
                "Sec-butylamine ((CH3)2CHCH2NH2)",
                "Tert-butylamine ((CH3)3CNH2)",
                "Triethylamine ((C2H5)3N)",
                "Trimethylamine ((CH3)3N)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Dimethylamine ((CH3)2NH)",
            "Diethylamine ((C2H5)2NH)",
            "Trimethylamine ((CH3)3N)",
            "Propylamine (C3H7NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Butylamine (C4H9NH2)",
            "Isobutylamine ((CH3)2CHCH2NH2)",
            "tert-Butylamine ((CH3)3CNH2)",
            "Aniline (C6H5NH2)",
            "N-Methylaniline (C6H5NHC2H5)",
            "N,N-Dimethylaniline ((CH3)2NC6H5)",
            "N-Ethylaniline (C6H5NHC2H5)",
            "N,N-Diethylaniline ((C2H5)2NC6H5)",
            "Benzylamine (C6H5CH2NH2)",
            "N-Methylbenzylamine (C6H5CH2NHC2H5)",
            "N,N-Dimethylbenzylamine ((CH3)2NC6H5CH2)",
            "Cyclohexylamine (C6H11NH2)",
            "N-Methylcyclohexylamine (C6H11NHC2H5)",
            "N,N-Dimethylcyclohexylamine ((CH3)2NC6H11)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "N-Methylnorpseudoephedrine (C10H15NO)",
            "N,N-Dimethylethylamine ((CH3)2NC2H5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Dimethylamine ((CH3)2NH)",
                "Diethylamine ((C2H5)2NH)",
                "Trimethylamine ((CH3)3N)",
                "Propylamine (C3H7NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Butylamine (C4H9NH2)",
                "Isobutylamine ((CH3)2CHCH2NH2)",
                "tert-Butylamine ((CH3)3CNH2)",
                "Aniline (C6H5NH2)",
                "N-Methylaniline (C6H5NHC2H5)",
                "N,N-Dimethylaniline ((CH3)2NC6H5)",
                "N-Ethylaniline (C6H5NHC2H5)",
                "Benzylamine (C6H5CH2NH2)",
                "N-Methylbenzylamine (C6H5CH2NHC2H5)",
                "N,N-Dimethylbenzylamine ((CH3)2NC6H5CH2)",
                "Cyclohexylamine (C6H11NH2)",
                "N-Methylcyclohexylamine (C6H11NHC2H5)",
                "N,N-Dimethylcyclohexylamine ((CH3)2NC6H11)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "N-Methylnorpseudoephedrine (C10H15NO)",
                "N,N-Dimethylethylamine ((CH3)2NC2H5)"
            ],
            "mismatches": [
                "N,N-Diethylaniline ((C2H5)2NC6H5)"
            ],
            "true_referents": [
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Butylamine (C4H9NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Diethylamine ((C2H5)2NH)",
                "Dimethylamine ((CH3)2NH)",
                "Ethylamine (C2H5NH2)",
                "Isobutylamine ((CH3)2CHCH2NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Methylamine (CH3NH2)",
                "N,N-Diethylaniline ((C2H5)2NC6H5)",
                "N,N-Dimethylaniline ((CH3)2NC6H5)",
                "N,N-Dimethylbenzylamine ((CH3)2NC6H5CH2)",
                "N,N-Dimethylcyclohexylamine ((CH3)2NC6H11)",
                "N,N-Dimethylethylamine ((CH3)2NC2H5)",
                "N-Ethylaniline (C6H5NHC2H5)",
                "N-Methylaniline (C6H5NHC2H5)",
                "N-Methylbenzylamine (C6H5CH2NHC2H5)",
                "N-Methylcyclohexylamine (C6H11NHC2H5)",
                "N-Methylnorpseudoephedrine (C10H15NO)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Propylamine (C3H7NH2)",
                "Trimethylamine ((CH3)3N)",
                "tert-Butylamine ((CH3)3CNH2)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Dimethylamine ((CH3)2NH)",
            "Ethylamine (C2H5NH2)",
            "Diethylamine ((C2H5)2NH)",
            "Propylamine (C3H7NH2)",
            "Dipropylamine ((C3H7)2NH)",
            "Butylamine (C4H9NH2)",
            "Dibutylamine ((C4H9)2NH)",
            "Phenylamine (C6H5NH2)",
            "Diphenylamine ((C6H5)2NH)",
            "Methylethylamine (CH3C2H5NH)",
            "Methylpropylamine (CH3C3H7NH)",
            "Ethylpropylamine (C2H5C3H7NH)",
            "Methylbutylamine (CH3C4H9NH)",
            "Ethylbutylamine (C2H5C4H9NH)",
            "Propybutylamine (C3H7C4H9NH)",
            "Methylphenylamine (CH3C6H5NH)",
            "Ethylphenylamine (C2H5C6H5NH)",
            "Propylphenylamine (C3H7C6H5NH)",
            "Butylphenylamine (C4H9C6H5NH)",
            "Diphenylmethylamine (C6H5C6H5CH3NH)",
            "Diphenylethylamine (C6H5C6H5C2H5NH)",
            "Diphenylpropylamine (C6H5C6H5C3H7NH)",
            "Diphenylbutylamine (C6H5C6H5C4H9NH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Dimethylamine ((CH3)2NH)",
                "Ethylamine (C2H5NH2)",
                "Diethylamine ((C2H5)2NH)",
                "Propylamine (C3H7NH2)",
                "Dipropylamine ((C3H7)2NH)",
                "Butylamine (C4H9NH2)",
                "Dibutylamine ((C4H9)2NH)",
                "Phenylamine (C6H5NH2)",
                "Diphenylamine ((C6H5)2NH)",
                "Methylethylamine (CH3C2H5NH)",
                "Methylpropylamine (CH3C3H7NH)",
                "Ethylpropylamine (C2H5C3H7NH)",
                "Methylbutylamine (CH3C4H9NH)",
                "Ethylbutylamine (C2H5C4H9NH)",
                "Propybutylamine (C3H7C4H9NH)",
                "Methylphenylamine (CH3C6H5NH)",
                "Ethylphenylamine (C2H5C6H5NH)",
                "Propylphenylamine (C3H7C6H5NH)",
                "Butylphenylamine (C4H9C6H5NH)",
                "Diphenylmethylamine (C6H5C6H5CH3NH)",
                "Diphenylethylamine (C6H5C6H5C2H5NH)",
                "Diphenylpropylamine (C6H5C6H5C3H7NH)",
                "Diphenylbutylamine (C6H5C6H5C4H9NH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Butylamine (C4H9NH2)",
                "Butylphenylamine (C4H9C6H5NH)",
                "Dibutylamine ((C4H9)2NH)",
                "Diethylamine ((C2H5)2NH)",
                "Dimethylamine ((CH3)2NH)",
                "Diphenylamine ((C6H5)2NH)",
                "Diphenylbutylamine (C6H5C6H5C4H9NH)",
                "Diphenylethylamine (C6H5C6H5C2H5NH)",
                "Diphenylmethylamine (C6H5C6H5CH3NH)",
                "Diphenylpropylamine (C6H5C6H5C3H7NH)",
                "Dipropylamine ((C3H7)2NH)",
                "Ethylamine (C2H5NH2)",
                "Ethylbutylamine (C2H5C4H9NH)",
                "Ethylphenylamine (C2H5C6H5NH)",
                "Ethylpropylamine (C2H5C3H7NH)",
                "Methylamine (CH3NH2)",
                "Methylbutylamine (CH3C4H9NH)",
                "Methylethylamine (CH3C2H5NH)",
                "Methylphenylamine (CH3C6H5NH)",
                "Methylpropylamine (CH3C3H7NH)",
                "Phenylamine (C6H5NH2)",
                "Propybutylamine (C3H7C4H9NH)",
                "Propylamine (C3H7NH2)",
                "Propylphenylamine (C3H7C6H5NH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Dimethylamine (DMA)",
            "Diethylamine (DEA)",
            "Dipropylamine (DPA)",
            "Dibutylamine (DBA)",
            "Methylpropylamine (MPA)",
            "Methylbenzylamine (MBA)",
            "Ethylbenzylamine (EBA)",
            "Pyrrolidine (Pyr)",
            "Piperidine (Pip)",
            "Morpholine (Morph)",
            "N-Methylpiperidine (NMPip)",
            "N-Ethylpiperidine (NEPip)",
            "N-Methylmorpholine (NMMorph)",
            "N-Ethylmorpholine (NEMorph)",
            "Benzylmethylamine (BMA)",
            "Benzylpropylamine (BPA)",
            "N,N-Dimethylformamide (DMF)",
            "N,N-Diethylformamide (DEF)",
            "N,N-Dimethylacetamide (DMAc)",
            "N,N-Diethylacetamide (DEAc)",
            "N-Methylaniline (NMA)",
            "N-Ethylaniline (NEA)",
            "N-Isopropylbenzylamine (NIBA)",
            "N-Methylcyclohexylamine (NMCHA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethylamine (DMA)",
                "Diethylamine (DEA)",
                "Dipropylamine (DPA)",
                "Dibutylamine (DBA)",
                "Methylpropylamine (MPA)",
                "Methylbenzylamine (MBA)",
                "Ethylbenzylamine (EBA)",
                "Pyrrolidine (Pyr)",
                "Piperidine (Pip)",
                "Morpholine (Morph)",
                "N-Methylpiperidine (NMPip)",
                "N-Ethylpiperidine (NEPip)",
                "N-Methylmorpholine (NMMorph)",
                "N-Ethylmorpholine (NEMorph)",
                "Benzylmethylamine (BMA)",
                "Benzylpropylamine (BPA)",
                "N,N-Dimethylformamide (DMF)",
                "N,N-Diethylformamide (DEF)",
                "N,N-Dimethylacetamide (DMAc)",
                "N,N-Diethylacetamide (DEAc)",
                "N-Methylaniline (NMA)",
                "N-Ethylaniline (NEA)",
                "N-Isopropylbenzylamine (NIBA)",
                "N-Methylcyclohexylamine (NMCHA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Benzylmethylamine (BMA)",
                "Benzylpropylamine (BPA)",
                "Dibutylamine (DBA)",
                "Diethylamine (DEA)",
                "Dimethylamine (DMA)",
                "Dipropylamine (DPA)",
                "Ethylbenzylamine (EBA)",
                "Methylbenzylamine (MBA)",
                "Methylpropylamine (MPA)",
                "Morpholine (Morph)",
                "N,N-Diethylacetamide (DEAc)",
                "N,N-Diethylformamide (DEF)",
                "N,N-Dimethylacetamide (DMAc)",
                "N,N-Dimethylformamide (DMF)",
                "N-Ethylaniline (NEA)",
                "N-Ethylmorpholine (NEMorph)",
                "N-Ethylpiperidine (NEPip)",
                "N-Isopropylbenzylamine (NIBA)",
                "N-Methylaniline (NMA)",
                "N-Methylcyclohexylamine (NMCHA)",
                "N-Methylmorpholine (NMMorph)",
                "N-Methylpiperidine (NMPip)",
                "Piperidine (Pip)",
                "Pyrrolidine (Pyr)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Dimethylamine ((CH3)2NH)",
            "Ethylamine (C2H5NH2)",
            "Diethylamine ((C2H5)2NH)",
            "Propylamine (C3H7NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Butylamine (C4H9NH2)",
            "Diisopropylamine ((CH3)2CHNH(CH3)2)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Piperidine (C5H10NH)",
            "Pyrrolidine (C4H9NH)",
            "Morpholine (C4H9NO)",
            "Ethylenediamine (C2H4(NH2)2)",
            "Triethylamine ((C2H5)3N)",
            "N-Methylaniline (C6H5NHCH3)",
            "N-Ethylaniline (C6H5NHC2H5)",
            "N-Methylcyclohexylamine (C6H11NHCH3)",
            "N,N-Dimethylaniline (C6H5N(CH3)2)",
            "N-Methylpiperidine (C5H10NCH3)",
            "N-Methylpyrrolidine (C4H9NCH3)",
            "N-Methylmorpholine (C4H9NOCH3)",
            "N-Methyl-N-ethylamine (C3H9N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Dimethylamine ((CH3)2NH)",
                "Ethylamine (C2H5NH2)",
                "Diethylamine ((C2H5)2NH)",
                "Propylamine (C3H7NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Butylamine (C4H9NH2)",
                "Diisopropylamine ((CH3)2CHNH(CH3)2)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Piperidine (C5H10NH)",
                "Pyrrolidine (C4H9NH)",
                "Morpholine (C4H9NO)",
                "Ethylenediamine (C2H4(NH2)2)",
                "Triethylamine ((C2H5)3N)",
                "N-Methylaniline (C6H5NHCH3)",
                "N-Ethylaniline (C6H5NHC2H5)",
                "N-Methylcyclohexylamine (C6H11NHCH3)",
                "N,N-Dimethylaniline (C6H5N(CH3)2)",
                "N-Methylpiperidine (C5H10NCH3)",
                "N-Methylpyrrolidine (C4H9NCH3)",
                "N-Methylmorpholine (C4H9NOCH3)",
                "N-Methyl-N-ethylamine (C3H9N)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Butylamine (C4H9NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Diethylamine ((C2H5)2NH)",
                "Diisopropylamine ((CH3)2CHNH(CH3)2)",
                "Dimethylamine ((CH3)2NH)",
                "Ethylamine (C2H5NH2)",
                "Ethylenediamine (C2H4(NH2)2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Methylamine (CH3NH2)",
                "Morpholine (C4H9NO)",
                "N,N-Dimethylaniline (C6H5N(CH3)2)",
                "N-Ethylaniline (C6H5NHC2H5)",
                "N-Methyl-N-ethylamine (C3H9N)",
                "N-Methylaniline (C6H5NHCH3)",
                "N-Methylcyclohexylamine (C6H11NHCH3)",
                "N-Methylmorpholine (C4H9NOCH3)",
                "N-Methylpiperidine (C5H10NCH3)",
                "N-Methylpyrrolidine (C4H9NCH3)",
                "Piperidine (C5H10NH)",
                "Propylamine (C3H7NH2)",
                "Pyrrolidine (C4H9NH)",
                "Triethylamine ((C2H5)3N)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MA)",
            "Ethylamine (EA)",
            "Isopropylamine (IPA)",
            "Butylamine (BA)",
            "Pentylamine (PA)",
            "Hexylamine (HA)",
            "Cyclohexylamine (CHA)",
            "Phenethylamine (PEA)",
            "Benzylamine (BZA)",
            "Dimethylamine (DMA)",
            "Diethylamine (DEA)",
            "Dipropylamine (DPA)",
            "Triethylamine (TEA)",
            "N-Methyl-N-ethylamine (NMEA)",
            "N,N-Dimethylamine (NDMA)",
            "N,N-Diethylamine (NDEA)",
            "N,N-Dipropylamine (NDPA)",
            "N-Methylbenzylamine (NMBA)",
            "N-Ethylbenzylamine (NEBA)",
            "N,N-Bis(2-methylpropyl)amine (NBPA)",
            "N,N-Bis(ethyl)amine (NBA)",
            "N,N-Bis(phenyl)amine (NBPA)",
            "N,N-Di(2-ethylhexyl)amine (NDEHA)",
            "N-Methyl-N-propylamine (NMPA)",
            "N-Ethyl-N-butylamine (NEBA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MA)",
                "Ethylamine (EA)",
                "Isopropylamine (IPA)",
                "Butylamine (BA)",
                "Pentylamine (PA)",
                "Hexylamine (HA)",
                "Cyclohexylamine (CHA)",
                "Phenethylamine (PEA)",
                "Benzylamine (BZA)",
                "Dimethylamine (DMA)",
                "Diethylamine (DEA)",
                "Dipropylamine (DPA)",
                "Triethylamine (TEA)",
                "N-Methyl-N-ethylamine (NMEA)",
                "N,N-Dimethylamine (NDMA)",
                "N,N-Diethylamine (NDEA)",
                "N,N-Dipropylamine (NDPA)",
                "N-Methylbenzylamine (NMBA)",
                "N-Ethylbenzylamine (NEBA)",
                "N,N-Bis(2-methylpropyl)amine (NBPA)",
                "N,N-Bis(ethyl)amine (NBA)",
                "N,N-Bis(phenyl)amine (NBPA)",
                "N,N-Di(2-ethylhexyl)amine (NDEHA)",
                "N-Methyl-N-propylamine (NMPA)"
            ],
            "mismatches": [
                "N-Ethyl-N-butylamine (NEBA)"
            ],
            "true_referents": [
                "Benzylamine (BZA)",
                "Butylamine (BA)",
                "Cyclohexylamine (CHA)",
                "Diethylamine (DEA)",
                "Dimethylamine (DMA)",
                "Dipropylamine (DPA)",
                "Ethylamine (EA)",
                "Hexylamine (HA)",
                "Isopropylamine (IPA)",
                "Methylamine (MA)",
                "N,N-Bis(2-methylpropyl)amine (NBPA)",
                "N,N-Bis(ethyl)amine (NBA)",
                "N,N-Bis(phenyl)amine (NBPA)",
                "N,N-Di(2-ethylhexyl)amine (NDEHA)",
                "N,N-Diethylamine (NDEA)",
                "N,N-Dimethylamine (NDMA)",
                "N,N-Dipropylamine (NDPA)",
                "N-Ethylbenzylamine (NEBA)",
                "N-Methyl-N-ethylamine (NMEA)",
                "N-Methyl-N-propylamine (NMPA)",
                "N-Methylbenzylamine (NMBA)",
                "Pentylamine (PA)",
                "Phenethylamine (PEA)",
                "Triethylamine (TEA)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methanamine (CH3NH2)",
            "Ethanamine (C2H5NH2)",
            "Propanamine (C3H7NH2)",
            "Butanamine (C4H9NH2)",
            "Pentanamine (C5H11NH2)",
            "Hexanamine (C6H13NH2)",
            "Heptanamine (C7H15NH2)",
            "Octanamine (C8H17NH2)",
            "Nonanamine (C9H19NH2)",
            "Decanamine (C10H21NH2)",
            "Undecanamine (C11H23NH2)",
            "Dodecanamine (C12H25NH2)",
            "Tridecanamine (C13H27NH2)",
            "Tetradecanamine (C14H29NH2)",
            "Pentadecanamine (C15H31NH2)",
            "Hexadecanamine (C16H33NH2)",
            "Heptadecanamine (C17H35NH2)",
            "Octadecanamine (C18H37NH2)",
            "Nonadecanamine (C19H39NH2)",
            "Icosanamine (C20H41NH2)",
            "Heneicosanamine (C21H43NH2)",
            "Docosanamine (C22H45NH2)",
            "Tricosanamine (C23H47NH2)",
            "Tetracosanamine (C24H49NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methanamine (CH3NH2)",
                "Ethanamine (C2H5NH2)",
                "Propanamine (C3H7NH2)",
                "Butanamine (C4H9NH2)",
                "Pentanamine (C5H11NH2)",
                "Hexanamine (C6H13NH2)",
                "Heptanamine (C7H15NH2)",
                "Octanamine (C8H17NH2)",
                "Nonanamine (C9H19NH2)",
                "Decanamine (C10H21NH2)",
                "Undecanamine (C11H23NH2)",
                "Dodecanamine (C12H25NH2)",
                "Tridecanamine (C13H27NH2)",
                "Tetradecanamine (C14H29NH2)",
                "Pentadecanamine (C15H31NH2)",
                "Hexadecanamine (C16H33NH2)",
                "Heptadecanamine (C17H35NH2)",
                "Octadecanamine (C18H37NH2)",
                "Nonadecanamine (C19H39NH2)",
                "Icosanamine (C20H41NH2)",
                "Heneicosanamine (C21H43NH2)",
                "Docosanamine (C22H45NH2)",
                "Tricosanamine (C23H47NH2)",
                "Tetracosanamine (C24H49NH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Butanamine (C4H9NH2)",
                "Decanamine (C10H21NH2)",
                "Docosanamine (C22H45NH2)",
                "Dodecanamine (C12H25NH2)",
                "Ethanamine (C2H5NH2)",
                "Heneicosanamine (C21H43NH2)",
                "Heptadecanamine (C17H35NH2)",
                "Heptanamine (C7H15NH2)",
                "Hexadecanamine (C16H33NH2)",
                "Hexanamine (C6H13NH2)",
                "Icosanamine (C20H41NH2)",
                "Methanamine (CH3NH2)",
                "Nonadecanamine (C19H39NH2)",
                "Nonanamine (C9H19NH2)",
                "Octadecanamine (C18H37NH2)",
                "Octanamine (C8H17NH2)",
                "Pentadecanamine (C15H31NH2)",
                "Pentanamine (C5H11NH2)",
                "Propanamine (C3H7NH2)",
                "Tetracosanamine (C24H49NH2)",
                "Tetradecanamine (C14H29NH2)",
                "Tricosanamine (C23H47NH2)",
                "Tridecanamine (C13H27NH2)",
                "Undecanamine (C11H23NH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "methylamine",
            "ethylamine",
            "propylamine",
            "butylamine",
            "isopropylamine",
            "isobutylamine",
            "sec-butylamine",
            "tert-butylamine",
            "phenethylamine",
            "benzylamine",
            "cyclohexylamine",
            "2-phenylethylamine",
            "3-phenylpropylamine",
            "4-phenylbutylamine",
            "2-methylpropylamine",
            "2-ethylbutylamine",
            "2-isopropylbutylamine",
            "2-isobutylbutylamine",
            "2-sec-butylbutylamine",
            "2-tert-butylbutylamine",
            "2-phenylethylbutylamine",
            "2-benzylbutylamine",
            "2-cyclohexylbutylamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methylamine",
                "ethylamine",
                "propylamine",
                "butylamine",
                "isopropylamine",
                "isobutylamine",
                "sec-butylamine",
                "tert-butylamine",
                "phenethylamine",
                "benzylamine",
                "cyclohexylamine",
                "2-phenylethylamine",
                "3-phenylpropylamine",
                "4-phenylbutylamine",
                "2-methylpropylamine",
                "2-ethylbutylamine",
                "2-isopropylbutylamine",
                "2-isobutylbutylamine",
                "2-sec-butylbutylamine",
                "2-tert-butylbutylamine",
                "2-phenylethylbutylamine",
                "2-benzylbutylamine",
                "2-cyclohexylbutylamine"
            ],
            "mismatches": [],
            "true_referents": [
                "2-benzylbutylamine",
                "2-cyclohexylbutylamine",
                "2-ethylbutylamine",
                "2-isobutylbutylamine",
                "2-isopropylbutylamine",
                "2-methylpropylamine",
                "2-phenylethylamine",
                "2-phenylethylbutylamine",
                "2-sec-butylbutylamine",
                "2-tert-butylbutylamine",
                "3-phenylpropylamine",
                "4-phenylbutylamine",
                "benzylamine",
                "butylamine",
                "cyclohexylamine",
                "ethylamine",
                "isobutylamine",
                "isopropylamine",
                "methylamine",
                "phenethylamine",
                "propylamine",
                "sec-butylamine",
                "tert-butylamine"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Dimethylamine (DMA)",
            "Diethylamine (DEA)",
            "Dipropylamine",
            "Diphenylamine",
            "Methyl Ethylamine",
            "Methyl Propylamine",
            "Methyl Isopropylamine",
            "Ethyl Propylamine",
            "Ethyl Isopropylamine",
            "Methyl Butylamine",
            "Methyl Isobutylamine",
            "Methyl Sec-Butylamine",
            "Methyl tert-Butylamine",
            "Phenethylamine",
            "Benzyl Ethylamine",
            "Cyclohexylmethylamine",
            "N-Methylbenzylamine",
            "N-Ethylcyclohexylamine",
            "N-Methylbutylamine",
            "N-Isopropylmethylamine",
            "N-Methylisobutylamine",
            "N-Propylmethylamine",
            "N-Ethylmethylamine",
            "N-Cyclopropylmethylamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethylamine (DMA)",
                "Diethylamine (DEA)",
                "Dipropylamine",
                "Diphenylamine",
                "Methyl Ethylamine",
                "Methyl Propylamine",
                "Methyl Isopropylamine",
                "Ethyl Propylamine",
                "Ethyl Isopropylamine",
                "Methyl Butylamine",
                "Methyl Isobutylamine",
                "Methyl Sec-Butylamine",
                "Methyl tert-Butylamine",
                "Phenethylamine",
                "Benzyl Ethylamine",
                "Cyclohexylmethylamine",
                "N-Methylbenzylamine",
                "N-Ethylcyclohexylamine",
                "N-Methylbutylamine",
                "N-Isopropylmethylamine",
                "N-Methylisobutylamine",
                "N-Propylmethylamine",
                "N-Ethylmethylamine",
                "N-Cyclopropylmethylamine"
            ],
            "mismatches": [],
            "true_referents": [
                "Benzyl Ethylamine",
                "Cyclohexylmethylamine",
                "Diethylamine (DEA)",
                "Dimethylamine (DMA)",
                "Diphenylamine",
                "Dipropylamine",
                "Ethyl Isopropylamine",
                "Ethyl Propylamine",
                "Methyl Butylamine",
                "Methyl Ethylamine",
                "Methyl Isobutylamine",
                "Methyl Isopropylamine",
                "Methyl Propylamine",
                "Methyl Sec-Butylamine",
                "Methyl tert-Butylamine",
                "N-Cyclopropylmethylamine",
                "N-Ethylcyclohexylamine",
                "N-Ethylmethylamine",
                "N-Isopropylmethylamine",
                "N-Methylbenzylamine",
                "N-Methylbutylamine",
                "N-Methylisobutylamine",
                "N-Propylmethylamine",
                "Phenethylamine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Dimethylamine (DMA)",
            "Diethylamine (DEA)",
            "Dipropylamine (DPA)",
            "Dibutylamine (DBA)",
            "Methylethylamine (MEA)",
            "Ethylpropylamine (EPA)",
            "Methylpropylamine (MPA)",
            "Ethylbutylamine (EBA)",
            "Methylbutylamine (MBA)",
            "Propylbutylamine (PBA)",
            "Diisobutylamine (DIBA)",
            "Diisopropylamine (DIPA)",
            "Methylisopropylamine (MIPA)",
            "Ethylisopropylamine (EIPA)",
            "Methylisobutylamine (MIBA)",
            "Ethylisobutylamine (EIBA)",
            "Dicyclohexylamine (DCHA)",
            "Methylcyclohexylamine (MCHA)",
            "Ethylcyclohexylamine (ECHA)",
            "Dibenzylamine (DBzA)",
            "Methylbenzylamine (MBzA)",
            "Ethylbenzylamine (EBzA)",
            "Diphenylamine (DPhA)",
            "Methylphenylamine (MPhA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethylamine (DMA)",
                "Diethylamine (DEA)",
                "Dipropylamine (DPA)",
                "Dibutylamine (DBA)",
                "Methylethylamine (MEA)",
                "Ethylpropylamine (EPA)",
                "Methylpropylamine (MPA)",
                "Ethylbutylamine (EBA)",
                "Methylbutylamine (MBA)",
                "Propylbutylamine (PBA)",
                "Diisobutylamine (DIBA)",
                "Diisopropylamine (DIPA)",
                "Methylisopropylamine (MIPA)",
                "Ethylisopropylamine (EIPA)",
                "Methylisobutylamine (MIBA)",
                "Ethylisobutylamine (EIBA)",
                "Dicyclohexylamine (DCHA)",
                "Methylcyclohexylamine (MCHA)",
                "Ethylcyclohexylamine (ECHA)",
                "Dibenzylamine (DBzA)",
                "Methylbenzylamine (MBzA)",
                "Ethylbenzylamine (EBzA)",
                "Diphenylamine (DPhA)",
                "Methylphenylamine (MPhA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Dibenzylamine (DBzA)",
                "Dibutylamine (DBA)",
                "Dicyclohexylamine (DCHA)",
                "Diethylamine (DEA)",
                "Diisobutylamine (DIBA)",
                "Diisopropylamine (DIPA)",
                "Dimethylamine (DMA)",
                "Diphenylamine (DPhA)",
                "Dipropylamine (DPA)",
                "Ethylbenzylamine (EBzA)",
                "Ethylbutylamine (EBA)",
                "Ethylcyclohexylamine (ECHA)",
                "Ethylisobutylamine (EIBA)",
                "Ethylisopropylamine (EIPA)",
                "Ethylpropylamine (EPA)",
                "Methylbenzylamine (MBzA)",
                "Methylbutylamine (MBA)",
                "Methylcyclohexylamine (MCHA)",
                "Methylethylamine (MEA)",
                "Methylisobutylamine (MIBA)",
                "Methylisopropylamine (MIPA)",
                "Methylphenylamine (MPhA)",
                "Methylpropylamine (MPA)",
                "Propylbutylamine (PBA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (C2H5NH2)",
            "Dimethylamine ((CH3)2NH)",
            "Diethylamine ((C2H5)2NH)",
            "Propylamine (C3H7NH2)",
            "Isopropylamine ((CH3)2CHNH2)",
            "Butylamine (C4H9NH2)",
            "sec-Butylamine (CH3CH2CH(NH2)CH3)",
            "tert-Butylamine ((CH3)3CNH2)",
            "Pentylamine (C5H11NH2)",
            "Hexylamine (C6H13NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Diphenylamine ((C6H5)2NH)",
            "Methylethylamine (CH3NHCH2CH3)",
            "Ethylenediamine (H2NCH2CH2NH2)",
            "Hexamethylenediamine (H2N(CH2)6NH2)",
            "Piperidine (C5H11N)",
            "Piperazine (C4H10N2)",
            "Morpholine (C4H9NO)",
            "Pyrrolidine (C4H9N)",
            "Aniline (C6H5NH2)",
            "Diphenylmethylamine ((C6H5)2CHNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (C2H5NH2)",
                "Dimethylamine ((CH3)2NH)",
                "Diethylamine ((C2H5)2NH)",
                "Propylamine (C3H7NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Butylamine (C4H9NH2)",
                "sec-Butylamine (CH3CH2CH(NH2)CH3)",
                "tert-Butylamine ((CH3)3CNH2)",
                "Pentylamine (C5H11NH2)",
                "Hexylamine (C6H13NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Diphenylamine ((C6H5)2NH)",
                "Methylethylamine (CH3NHCH2CH3)",
                "Ethylenediamine (H2NCH2CH2NH2)",
                "Hexamethylenediamine (H2N(CH2)6NH2)",
                "Piperidine (C5H11N)",
                "Piperazine (C4H10N2)",
                "Morpholine (C4H9NO)",
                "Pyrrolidine (C4H9N)",
                "Aniline (C6H5NH2)",
                "Diphenylmethylamine ((C6H5)2CHNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Butylamine (C4H9NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Diethylamine ((C2H5)2NH)",
                "Dimethylamine ((CH3)2NH)",
                "Diphenylamine ((C6H5)2NH)",
                "Diphenylmethylamine ((C6H5)2CHNH2)",
                "Ethylamine (C2H5NH2)",
                "Ethylenediamine (H2NCH2CH2NH2)",
                "Hexamethylenediamine (H2N(CH2)6NH2)",
                "Hexylamine (C6H13NH2)",
                "Isopropylamine ((CH3)2CHNH2)",
                "Methylamine (CH3NH2)",
                "Methylethylamine (CH3NHCH2CH3)",
                "Morpholine (C4H9NO)",
                "Pentylamine (C5H11NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Piperazine (C4H10N2)",
                "Piperidine (C5H11N)",
                "Propylamine (C3H7NH2)",
                "Pyrrolidine (C4H9N)",
                "sec-Butylamine (CH3CH2CH(NH2)CH3)",
                "tert-Butylamine ((CH3)3CNH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (CH3NH2)",
            "Ethylamine (CH3CH2NH2)",
            "Propylamine (CH3CH2CH2NH2)",
            "Butylamine (CH3(CH2)3NH2)",
            "Dimethylamine ((CH3)2NH)",
            "Diethylamine ((CH3CH2)2NH)",
            "Dipropylamine ((CH3CH2CH2)2NH)",
            "Dibutylamine ((CH3(CH2)3)2NH)",
            "Trimethylamine ((CH3)3N)",
            "Triethylamine ((CH3CH2)3N)",
            "Tripropylamine ((CH3CH2CH2)3N)",
            "Tributylamine ((CH3(CH2)3)3N)",
            "Ethylmethylamine (CH3CH2NHCH3)",
            "Propylmethylamine (CH3CH2CH2NHCH3)",
            "Butylmethylamine (CH3(CH2)3NHCH3)",
            "Ethylpropylamine (CH3CH2NHCH2CH2CH3)",
            "Ethylbutylamine (CH3CH2NH(CH2)3CH3)",
            "Propylbutylamine (CH3CH2CH2NH(CH2)3CH3)",
            "Aniline (C6H5NH2)",
            "Benzylamine (C6H5CH2NH2)",
            "Phenethylamine (C6H5CH2CH2NH2)",
            "Cyclohexylamine (C6H11NH2)",
            "Piperidine (C5H10NH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (CH3NH2)",
                "Ethylamine (CH3CH2NH2)",
                "Propylamine (CH3CH2CH2NH2)",
                "Butylamine (CH3(CH2)3NH2)",
                "Dimethylamine ((CH3)2NH)",
                "Diethylamine ((CH3CH2)2NH)",
                "Dipropylamine ((CH3CH2CH2)2NH)",
                "Dibutylamine ((CH3(CH2)3)2NH)",
                "Trimethylamine ((CH3)3N)",
                "Triethylamine ((CH3CH2)3N)",
                "Tripropylamine ((CH3CH2CH2)3N)",
                "Tributylamine ((CH3(CH2)3)3N)",
                "Ethylmethylamine (CH3CH2NHCH3)",
                "Propylmethylamine (CH3CH2CH2NHCH3)",
                "Butylmethylamine (CH3(CH2)3NHCH3)",
                "Ethylpropylamine (CH3CH2NHCH2CH2CH3)",
                "Ethylbutylamine (CH3CH2NH(CH2)3CH3)",
                "Propylbutylamine (CH3CH2CH2NH(CH2)3CH3)",
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Cyclohexylamine (C6H11NH2)",
                "Piperidine (C5H10NH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aniline (C6H5NH2)",
                "Benzylamine (C6H5CH2NH2)",
                "Butylamine (CH3(CH2)3NH2)",
                "Butylmethylamine (CH3(CH2)3NHCH3)",
                "Cyclohexylamine (C6H11NH2)",
                "Dibutylamine ((CH3(CH2)3)2NH)",
                "Diethylamine ((CH3CH2)2NH)",
                "Dimethylamine ((CH3)2NH)",
                "Dipropylamine ((CH3CH2CH2)2NH)",
                "Ethylamine (CH3CH2NH2)",
                "Ethylbutylamine (CH3CH2NH(CH2)3CH3)",
                "Ethylmethylamine (CH3CH2NHCH3)",
                "Ethylpropylamine (CH3CH2NHCH2CH2CH3)",
                "Methylamine (CH3NH2)",
                "Phenethylamine (C6H5CH2CH2NH2)",
                "Piperidine (C5H10NH)",
                "Propylamine (CH3CH2CH2NH2)",
                "Propylbutylamine (CH3CH2CH2NH(CH2)3CH3)",
                "Propylmethylamine (CH3CH2CH2NHCH3)",
                "Tributylamine ((CH3(CH2)3)3N)",
                "Triethylamine ((CH3CH2)3N)",
                "Trimethylamine ((CH3)3N)",
                "Tripropylamine ((CH3CH2CH2)3N)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Methylamine (MA)",
            "Ethylamine (EA)",
            "Propylamine (PA)",
            "Butylamine (BA)",
            "Pentylamine (PNA)",
            "Hexylamine (HA)",
            "Heptylamine (HPA)",
            "Octylamine (OA)",
            "Benzylamine (BA)",
            "Phenethylamine (PEA)",
            "Tryptamine (TA)",
            "Dopamine (DA)",
            "Norepinephrine (NE)",
            "Epinephrine (E)",
            "Histamine (H)",
            "Serotonin (5-HT)",
            "Tyramine (TA)",
            "Putrescine (PUT)",
            "Cadaverine (CAD)",
            "Spermidine (SPD)",
            "Spermine (SPM)",
            "Ethanolamine (EA)",
            "Diethanolamine (DEA)",
            "Triethanolamine (TEA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methylamine (MA)",
                "Ethylamine (EA)",
                "Propylamine (PA)",
                "Butylamine (BA)",
                "Pentylamine (PNA)",
                "Hexylamine (HA)",
                "Heptylamine (HPA)",
                "Octylamine (OA)",
                "Benzylamine (BA)",
                "Phenethylamine (PEA)",
                "Tryptamine (TA)",
                "Dopamine (DA)",
                "Norepinephrine (NE)",
                "Epinephrine (E)",
                "Histamine (H)",
                "Serotonin (5-HT)",
                "Tyramine (TA)",
                "Putrescine (PUT)",
                "Cadaverine (CAD)",
                "Spermidine (SPD)",
                "Spermine (SPM)",
                "Ethanolamine (EA)",
                "Diethanolamine (DEA)",
                "Triethanolamine (TEA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Benzylamine (BA)",
                "Butylamine (BA)",
                "Cadaverine (CAD)",
                "Diethanolamine (DEA)",
                "Dopamine (DA)",
                "Epinephrine (E)",
                "Ethanolamine (EA)",
                "Ethylamine (EA)",
                "Heptylamine (HPA)",
                "Hexylamine (HA)",
                "Histamine (H)",
                "Methylamine (MA)",
                "Norepinephrine (NE)",
                "Octylamine (OA)",
                "Pentylamine (PNA)",
                "Phenethylamine (PEA)",
                "Propylamine (PA)",
                "Putrescine (PUT)",
                "Serotonin (5-HT)",
                "Spermidine (SPD)",
                "Spermine (SPM)",
                "Triethanolamine (TEA)",
                "Tryptamine (TA)",
                "Tyramine (TA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Amino acids (AAs)",
            "Amines (Ams)",
            "Aniline (An)",
            "Benzyldimethylamine (BDMA)",
            "Choline (Ch)",
            "Ethylamine (EtNH2)",
            "Histamine (H)",
            "Morpholine (M)",
            "Morpholine-3-amine (M3)",
            "Nicotine (Nc)",
            "Piperidine (Pip)",
            "Piperidine-2-amine (Pip2)",
            "Pyridine (Py)",
            "Pyridine-2-amine (Py2)",
            "Quinoline (Qu)",
            "Quinoline-2-amine (Qu2)",
            "Sarcosine (Sar)",
            "Tetrahydroisoquinoline (THIQ)",
            "Tetrahydroisoquinoline-2-amine (THIQ2)",
            "Triethylamine (TEA)",
            "Triphenylamine (TPA)",
            "Urea (U)",
            "Vinylamine (VinNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amino acids (AAs)",
                "Amines (Ams)",
                "Aniline (An)",
                "Benzyldimethylamine (BDMA)",
                "Choline (Ch)",
                "Ethylamine (EtNH2)",
                "Histamine (H)",
                "Morpholine (M)",
                "Morpholine-3-amine (M3)",
                "Nicotine (Nc)",
                "Piperidine (Pip)",
                "Piperidine-2-amine (Pip2)",
                "Pyridine (Py)",
                "Pyridine-2-amine (Py2)",
                "Quinoline (Qu)",
                "Quinoline-2-amine (Qu2)",
                "Sarcosine (Sar)",
                "Tetrahydroisoquinoline (THIQ)",
                "Tetrahydroisoquinoline-2-amine (THIQ2)",
                "Triethylamine (TEA)",
                "Triphenylamine (TPA)",
                "Urea (U)",
                "Vinylamine (VinNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Amines (Ams)",
                "Amino acids (AAs)",
                "Aniline (An)",
                "Benzyldimethylamine (BDMA)",
                "Choline (Ch)",
                "Ethylamine (EtNH2)",
                "Histamine (H)",
                "Morpholine (M)",
                "Morpholine-3-amine (M3)",
                "Nicotine (Nc)",
                "Piperidine (Pip)",
                "Piperidine-2-amine (Pip2)",
                "Pyridine (Py)",
                "Pyridine-2-amine (Py2)",
                "Quinoline (Qu)",
                "Quinoline-2-amine (Qu2)",
                "Sarcosine (Sar)",
                "Tetrahydroisoquinoline (THIQ)",
                "Tetrahydroisoquinoline-2-amine (THIQ2)",
                "Triethylamine (TEA)",
                "Triphenylamine (TPA)",
                "Urea (U)",
                "Vinylamine (VinNH2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": [
            "Aniline (C6H5NH2)",
            "Methylamine (CH3NH2)",
            "Dimethylamine (C2H7N)",
            "Ephedrine (C10H15NO)",
            "Pseudoephedrine (C10H13NO)",
            "Amphetamine (C9H13N)",
            "Methamphetamine (C10H15N)",
            "Phenethylamine (C8H11N)",
            "Tyramine (C8H11NO)",
            "Dopamine (C8H11NO2)",
            "Norepinephrine (C8H11NO2)",
            "Epinephrine (C9H13NO3)",
            "Serotonin (C10H12N2O)",
            "Melatonin (C13H16N2O2)",
            "Bufotenin (C12H16N2O)",
            "Dimethyltryptamine (C12H16N2)",
            "5-Methoxy-N,N-dimethyltryptamine (C13H18N2O)",
            "Bufotenidine (C13H19N3O)",
            "Ritalin (C14H19NO3)",
            "Desipramine (C18H22N2)",
            "Imipramine (C19H24N2)",
            "Trimipramine (C20H26N2)",
            "Amitriptyline (C20H23N)",
            "Nortriptyline (C19H21N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aniline (C6H5NH2)",
                "Methylamine (CH3NH2)",
                "Dimethylamine (C2H7N)",
                "Ephedrine (C10H15NO)",
                "Pseudoephedrine (C10H13NO)",
                "Amphetamine (C9H13N)",
                "Methamphetamine (C10H15N)",
                "Phenethylamine (C8H11N)",
                "Tyramine (C8H11NO)",
                "Dopamine (C8H11NO2)",
                "Norepinephrine (C8H11NO2)",
                "Epinephrine (C9H13NO3)",
                "Serotonin (C10H12N2O)",
                "Melatonin (C13H16N2O2)",
                "Bufotenin (C12H16N2O)",
                "Dimethyltryptamine (C12H16N2)",
                "5-Methoxy-N,N-dimethyltryptamine (C13H18N2O)",
                "Bufotenidine (C13H19N3O)",
                "Ritalin (C14H19NO3)",
                "Desipramine (C18H22N2)",
                "Imipramine (C19H24N2)",
                "Trimipramine (C20H26N2)",
                "Amitriptyline (C20H23N)",
                "Nortriptyline (C19H21N)"
            ],
            "mismatches": [],
            "true_referents": [
                "5-Methoxy-N,N-dimethyltryptamine (C13H18N2O)",
                "Amitriptyline (C20H23N)",
                "Amphetamine (C9H13N)",
                "Aniline (C6H5NH2)",
                "Bufotenidine (C13H19N3O)",
                "Bufotenin (C12H16N2O)",
                "Desipramine (C18H22N2)",
                "Dimethylamine (C2H7N)",
                "Dimethyltryptamine (C12H16N2)",
                "Dopamine (C8H11NO2)",
                "Ephedrine (C10H15NO)",
                "Epinephrine (C9H13NO3)",
                "Imipramine (C19H24N2)",
                "Melatonin (C13H16N2O2)",
                "Methamphetamine (C10H15N)",
                "Methylamine (CH3NH2)",
                "Norepinephrine (C8H11NO2)",
                "Nortriptyline (C19H21N)",
                "Phenethylamine (C8H11N)",
                "Pseudoephedrine (C10H13NO)",
                "Ritalin (C14H19NO3)",
                "Serotonin (C10H12N2O)",
                "Trimipramine (C20H26N2)",
                "Tyramine (C8H11NO)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "secondary amine",
        "domain": "chemistry",
        "response": {
            "1": "ethanol",
            "2": "dimethylglyoxime",
            "3": "dimethylformamide",
            "4": "dimethylsulfoxide",
            "5": "acetamide",
            "6": "acetone",
            "7": "acetic acid",
            "8": "propionic acid",
            "9": "butyric acid",
            "10": "valeric acid",
            "11": "caproic acid",
            "12": "heptanoic acid",
            "13": "octanoic acid",
            "14": "nonanoic acid",
            "15": "decanoic acid",
            "16": "undecanoic acid",
            "17": "dodecanoic acid",
            "18": "tridecanoic acid",
            "19": "tetradecanoic acid",
            "20": "pentadecanoic acid",
            "21": "hexadecanoic acid",
            "22": "heptadecanoic acid",
            "23": "octadecanoic acid",
            "24": "nonadecanoic acid"
        },
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethanol",
                "dimethylglyoxime",
                "dimethylformamide",
                "dimethylsulfoxide",
                "acetamide",
                "acetone",
                "acetic acid",
                "propionic acid",
                "butyric acid",
                "valeric acid",
                "caproic acid",
                "heptanoic acid",
                "octanoic acid",
                "nonanoic acid",
                "decanoic acid",
                "undecanoic acid",
                "dodecanoic acid",
                "tridecanoic acid",
                "tetradecanoic acid",
                "pentadecanoic acid",
                "hexadecanoic acid",
                "heptadecanoic acid",
                "octadecanoic acid",
                "nonadecanoic acid"
            ],
            "mismatches": [],
            "true_referents": [
                "10: valeric acid",
                "11: caproic acid",
                "12: heptanoic acid",
                "13: octanoic acid",
                "14: nonanoic acid",
                "15: decanoic acid",
                "16: undecanoic acid",
                "17: dodecanoic acid",
                "18: tridecanoic acid",
                "19: tetradecanoic acid",
                "1: ethanol",
                "20: pentadecanoic acid",
                "21: hexadecanoic acid",
                "22: heptadecanoic acid",
                "23: octadecanoic acid",
                "24: nonadecanoic acid",
                "2: dimethylglyoxime",
                "3: dimethylformamide",
                "4: dimethylsulfoxide",
                "5: acetamide",
                "6: acetone",
                "7: acetic acid",
                "8: propionic acid",
                "9: butyric acid"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    }
]