[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "methylhydrazine (CH3NHNH2)",
            "ethylhydrazine (C2H5NHNH2)",
            "propylhydrazine (C3H7NHNH2)",
            "butylhydrazine (C4H9NHNH2)",
            "phenylhydrazine (C6H5NHNH2)",
            "benzylhydrazine (C6H5CH2NHNH2)",
            "acetylhydrazine (CH3COHNHNH2)",
            "propionylhydrazine (C3H7COHNHNH2)",
            "butyrylhydrazine (C4H9COHNHNH2)",
            "valerylhydrazine (C5H11COHNHNH2)",
            "hexanoylhydrazine (C6H13COHNHNH2)",
            "heptylhydrazine (C7H15NHNH2)",
            "octylhydrazine (C8H17NHNH2)",
            "nonylhydrazine (C9H19NHNH2)",
            "decylhydrazine (C10H21NHNH2)",
            "undecylhydrazine (C11H23NHNH2)",
            "dodecylhydrazine (C12H25NHNH2)",
            "tritylhydrazine (C18H19NHNH2)",
            "isopropylhydrazine (C3H7NHNH2)",
            "sec-butylhydrazine (C4H9NHNH2)",
            "tert-butylhydrazine (C4H9NHNH2)",
            "cyclopropylhydrazine (C3H5NHNH2)",
            "cyclobutylhydrazine (C4H7NHNH2)",
            "cyclopentylhydrazine (C5H9NHNH2)",
            "cyclohexylhydrazine (C6H11NHNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methylhydrazine (CH3NHNH2)",
                "ethylhydrazine (C2H5NHNH2)",
                "propylhydrazine (C3H7NHNH2)",
                "butylhydrazine (C4H9NHNH2)",
                "phenylhydrazine (C6H5NHNH2)",
                "benzylhydrazine (C6H5CH2NHNH2)",
                "acetylhydrazine (CH3COHNHNH2)",
                "propionylhydrazine (C3H7COHNHNH2)",
                "butyrylhydrazine (C4H9COHNHNH2)",
                "valerylhydrazine (C5H11COHNHNH2)",
                "hexanoylhydrazine (C6H13COHNHNH2)",
                "heptylhydrazine (C7H15NHNH2)",
                "octylhydrazine (C8H17NHNH2)",
                "nonylhydrazine (C9H19NHNH2)",
                "decylhydrazine (C10H21NHNH2)",
                "undecylhydrazine (C11H23NHNH2)",
                "dodecylhydrazine (C12H25NHNH2)",
                "tritylhydrazine (C18H19NHNH2)",
                "isopropylhydrazine (C3H7NHNH2)",
                "sec-butylhydrazine (C4H9NHNH2)",
                "tert-butylhydrazine (C4H9NHNH2)",
                "cyclopropylhydrazine (C3H5NHNH2)",
                "cyclobutylhydrazine (C4H7NHNH2)",
                "cyclopentylhydrazine (C5H9NHNH2)"
            ],
            "mismatches": [
                "cyclohexylhydrazine (C6H11NHNH2)"
            ],
            "true_referents": [
                "acetylhydrazine (CH3COHNHNH2)",
                "benzylhydrazine (C6H5CH2NHNH2)",
                "butylhydrazine (C4H9NHNH2)",
                "butyrylhydrazine (C4H9COHNHNH2)",
                "cyclobutylhydrazine (C4H7NHNH2)",
                "cyclopentylhydrazine (C5H9NHNH2)",
                "cyclopropylhydrazine (C3H5NHNH2)",
                "decylhydrazine (C10H21NHNH2)",
                "dodecylhydrazine (C12H25NHNH2)",
                "ethylhydrazine (C2H5NHNH2)",
                "heptylhydrazine (C7H15NHNH2)",
                "hexanoylhydrazine (C6H13COHNHNH2)",
                "isopropylhydrazine (C3H7NHNH2)",
                "methylhydrazine (CH3NHNH2)",
                "nonylhydrazine (C9H19NHNH2)",
                "octylhydrazine (C8H17NHNH2)",
                "phenylhydrazine (C6H5NHNH2)",
                "propionylhydrazine (C3H7COHNHNH2)",
                "propylhydrazine (C3H7NHNH2)",
                "sec-butylhydrazine (C4H9NHNH2)",
                "tert-butylhydrazine (C4H9NHNH2)",
                "tritylhydrazine (C18H19NHNH2)",
                "undecylhydrazine (C11H23NHNH2)",
                "valerylhydrazine (C5H11COHNHNH2)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3NHNH2)",
            "Ethylhydrazine (C2H5NHNH2)",
            "Phenylhydrazine (C6H5NHNH2)",
            "Dimethylhydrazine ((CH3)2NNH2)",
            "Diethylhydrazine ((C2H5)2NNH2)",
            "Diisopropylhydrazine ((i-C3H7)2NNH2)",
            "Hydrazinecarbothioamide (CH5N2S)",
            "Hydrazinecarboxamide (CH5N3)",
            "Hydrazinecarboxylate (CH3N2COO-)",
            "Hydrazineacetate (CH3CH2N2O2)",
            "Hydrazineformate (CH3N2O2)",
            "Hydrazineacetamide (CH3CONHNH2)",
            "Hydrazineformamide (HCONHNH2)",
            "Hydrazinebenzamide (C6H5CONHNH2)",
            "Hydrazineacetohydrazide (CH3CONHNH2)",
            "Hydrazineformohydrazide (HCONHNH2)",
            "Hydrazinephenylacetate (C6H5CH2CONHNH2)",
            "Hydrazinephenylacetamide (C6H5CH2CONHNH2)",
            "Hydrazinephenylcarboxylate (C6H5CH2N2COO-)",
            "Hydrazinephenylcarboxamide (C6H5CH2N2CO)",
            "Hydrazinephenylformamide (C6H5CH2N2CHO)",
            "Hydrazinephenylformohydrazide (C6H5CH2N2CHO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3NHNH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "Dimethylhydrazine ((CH3)2NNH2)",
                "Diethylhydrazine ((C2H5)2NNH2)",
                "Diisopropylhydrazine ((i-C3H7)2NNH2)",
                "Hydrazinecarbothioamide (CH5N2S)",
                "Hydrazinecarboxamide (CH5N3)",
                "Hydrazinecarboxylate (CH3N2COO-)",
                "Hydrazineacetate (CH3CH2N2O2)",
                "Hydrazineformate (CH3N2O2)",
                "Hydrazineacetamide (CH3CONHNH2)",
                "Hydrazineformamide (HCONHNH2)",
                "Hydrazinebenzamide (C6H5CONHNH2)",
                "Hydrazineacetohydrazide (CH3CONHNH2)",
                "Hydrazineformohydrazide (HCONHNH2)",
                "Hydrazinephenylacetate (C6H5CH2CONHNH2)",
                "Hydrazinephenylacetamide (C6H5CH2CONHNH2)",
                "Hydrazinephenylcarboxylate (C6H5CH2N2COO-)",
                "Hydrazinephenylcarboxamide (C6H5CH2N2CO)",
                "Hydrazinephenylformamide (C6H5CH2N2CHO)",
                "Hydrazinephenylformohydrazide (C6H5CH2N2CHO)"
            ],
            "mismatches": [],
            "true_referents": [
                "Diethylhydrazine ((C2H5)2NNH2)",
                "Diisopropylhydrazine ((i-C3H7)2NNH2)",
                "Dimethylhydrazine ((CH3)2NNH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Hydrazine (N2H4)",
                "Hydrazineacetamide (CH3CONHNH2)",
                "Hydrazineacetate (CH3CH2N2O2)",
                "Hydrazineacetohydrazide (CH3CONHNH2)",
                "Hydrazinebenzamide (C6H5CONHNH2)",
                "Hydrazinecarbothioamide (CH5N2S)",
                "Hydrazinecarboxamide (CH5N3)",
                "Hydrazinecarboxylate (CH3N2COO-)",
                "Hydrazineformamide (HCONHNH2)",
                "Hydrazineformate (CH3N2O2)",
                "Hydrazineformohydrazide (HCONHNH2)",
                "Hydrazinephenylacetamide (C6H5CH2CONHNH2)",
                "Hydrazinephenylacetate (C6H5CH2CONHNH2)",
                "Hydrazinephenylcarboxamide (C6H5CH2N2CO)",
                "Hydrazinephenylcarboxylate (C6H5CH2N2COO-)",
                "Hydrazinephenylformamide (C6H5CH2N2CHO)",
                "Hydrazinephenylformohydrazide (C6H5CH2N2CHO)",
                "Methylhydrazine (CH3NHNH2)",
                "Phenylhydrazine (C6H5NHNH2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3NHNH2)",
            "1,1-Dimethylhydrazine ((CH3)2NNH2)",
            "1,2-Dimethylhydrazine (CH3NHNHCH3)",
            "1,1,2,2-Tetramethylhydrazine ((CH3)2NN(CH3)2)",
            "Phenylhydrazine (C6H5NHNH2)",
            "2,4-Dinitrophenylhydrazine (C6H3(NO2)2NHNH2)",
            "Benzyhydrazine (C6H5CH2NHNH2)",
            "Ethylhydrazine (C2H5NHNH2)",
            "Propyhydrazine (C3H7NHNH2)",
            "Butylhydrazine (C4H9NHNH2)",
            "Isopropylhydrazine ((CH3)2CHNHNH2)",
            "Cyclohexylhydrazine (C6H11NHNH2)",
            "Allylhydrazine (C3H5NHNH2)",
            "Hydrazobenzene (C6H5NHNHC6H5)",
            "Acetylhydrazine (CH3CONHNH2)",
            "Benzoylhydrazine (C6H5CONHNH2)",
            "Formylhydrazine (HCONHNH2)",
            "Carbamoylhydrazine (H2NCONHNH2)",
            "Ethylcarbamoylhydrazine (C2H5NCONHNH2)",
            "Methylcarbamoylhydrazine (CH3NCONHNH2)",
            "Propylcarbamoylhydrazine (C3H7NCONHNH2)",
            "Butylcarbamoylhydrazine (C4H9NCONHNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3NHNH2)",
                "1,1-Dimethylhydrazine ((CH3)2NNH2)",
                "1,2-Dimethylhydrazine (CH3NHNHCH3)",
                "1,1,2,2-Tetramethylhydrazine ((CH3)2NN(CH3)2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "2,4-Dinitrophenylhydrazine (C6H3(NO2)2NHNH2)",
                "Benzyhydrazine (C6H5CH2NHNH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Propyhydrazine (C3H7NHNH2)",
                "Butylhydrazine (C4H9NHNH2)",
                "Isopropylhydrazine ((CH3)2CHNHNH2)",
                "Cyclohexylhydrazine (C6H11NHNH2)",
                "Allylhydrazine (C3H5NHNH2)",
                "Hydrazobenzene (C6H5NHNHC6H5)",
                "Acetylhydrazine (CH3CONHNH2)",
                "Benzoylhydrazine (C6H5CONHNH2)",
                "Formylhydrazine (HCONHNH2)",
                "Carbamoylhydrazine (H2NCONHNH2)",
                "Ethylcarbamoylhydrazine (C2H5NCONHNH2)",
                "Methylcarbamoylhydrazine (CH3NCONHNH2)",
                "Propylcarbamoylhydrazine (C3H7NCONHNH2)",
                "Butylcarbamoylhydrazine (C4H9NCONHNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1,2,2-Tetramethylhydrazine ((CH3)2NN(CH3)2)",
                "1,1-Dimethylhydrazine ((CH3)2NNH2)",
                "1,2-Dimethylhydrazine (CH3NHNHCH3)",
                "2,4-Dinitrophenylhydrazine (C6H3(NO2)2NHNH2)",
                "Acetylhydrazine (CH3CONHNH2)",
                "Allylhydrazine (C3H5NHNH2)",
                "Benzoylhydrazine (C6H5CONHNH2)",
                "Benzyhydrazine (C6H5CH2NHNH2)",
                "Butylcarbamoylhydrazine (C4H9NCONHNH2)",
                "Butylhydrazine (C4H9NHNH2)",
                "Carbamoylhydrazine (H2NCONHNH2)",
                "Cyclohexylhydrazine (C6H11NHNH2)",
                "Ethylcarbamoylhydrazine (C2H5NCONHNH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Formylhydrazine (HCONHNH2)",
                "Hydrazine (N2H4)",
                "Hydrazobenzene (C6H5NHNHC6H5)",
                "Isopropylhydrazine ((CH3)2CHNHNH2)",
                "Methylcarbamoylhydrazine (CH3NCONHNH2)",
                "Methylhydrazine (CH3NHNH2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "Propyhydrazine (C3H7NHNH2)",
                "Propylcarbamoylhydrazine (C3H7NCONHNH2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Monomethylhydrazine (MMH)",
            "Dimethylhydrazine (UDMH)",
            "Trimethylhydrazine",
            "Tetramethylhydrazine",
            "Monoethylhydrazine",
            "Diethylhydrazine",
            "Monophenylhydrazine (MPH)",
            "Diphenylhydrazine",
            "Benzylhydrazine",
            "N-tert-Butylhydrazine",
            "N,N-Diethylhydrazine",
            "N,N-Dimethylhydrazine (NDMH)",
            "N-Methyl-N-phenylhydrazine",
            "N-Ethyl-N-phenylhydrazine",
            "1,2-Dimethylhydrazine",
            "1,1-Dimethylhydrazine",
            "N-Acetylhydrazine",
            "N-Formylhydrazine",
            "N-Nitrosohydrazine",
            "N-Methyl-N-nitrosohydrazine (MNMH)",
            "N-Ethyl-N-nitrosohydrazine",
            "N-Phenyl-N-nitrosohydrazine",
            "N,N'-Diacetylhydrazine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Monomethylhydrazine (MMH)",
                "Dimethylhydrazine (UDMH)",
                "Trimethylhydrazine",
                "Tetramethylhydrazine",
                "Monoethylhydrazine",
                "Diethylhydrazine",
                "Monophenylhydrazine (MPH)",
                "Diphenylhydrazine",
                "Benzylhydrazine",
                "N-tert-Butylhydrazine",
                "N,N-Diethylhydrazine",
                "N,N-Dimethylhydrazine (NDMH)",
                "N-Methyl-N-phenylhydrazine",
                "N-Ethyl-N-phenylhydrazine",
                "1,2-Dimethylhydrazine",
                "1,1-Dimethylhydrazine",
                "N-Acetylhydrazine",
                "N-Formylhydrazine",
                "N-Nitrosohydrazine",
                "N-Methyl-N-nitrosohydrazine (MNMH)",
                "N-Ethyl-N-nitrosohydrazine",
                "N-Phenyl-N-nitrosohydrazine",
                "N,N'-Diacetylhydrazine"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1-Dimethylhydrazine",
                "1,2-Dimethylhydrazine",
                "Benzylhydrazine",
                "Diethylhydrazine",
                "Dimethylhydrazine (UDMH)",
                "Diphenylhydrazine",
                "Hydrazine (N2H4)",
                "Monoethylhydrazine",
                "Monomethylhydrazine (MMH)",
                "Monophenylhydrazine (MPH)",
                "N,N'-Diacetylhydrazine",
                "N,N-Diethylhydrazine",
                "N,N-Dimethylhydrazine (NDMH)",
                "N-Acetylhydrazine",
                "N-Ethyl-N-nitrosohydrazine",
                "N-Ethyl-N-phenylhydrazine",
                "N-Formylhydrazine",
                "N-Methyl-N-nitrosohydrazine (MNMH)",
                "N-Methyl-N-phenylhydrazine",
                "N-Nitrosohydrazine",
                "N-Phenyl-N-nitrosohydrazine",
                "N-tert-Butylhydrazine",
                "Tetramethylhydrazine",
                "Trimethylhydrazine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3N2H3)",
            "Dimethylhydrazine ((CH3)2N2H2)",
            "Phenylhydrazine (C6H5N2H3)",
            "Ethylhydrazine (C2H5N2H3)",
            "Benzylhydrazine (C7H7N2H3)",
            "Hydrazone (R2C=N-NH2)",
            "Acetylhydrazine (CH3CON2H3)",
            "Hydrazinium ion (N2H5+)",
            "Hydrazide (RCONHNH2)",
            "Carbazide (NH2NHCONHNH2)",
            "Thiosemicarbazide (NH2CSNHNH2)",
            "Semicarbazide (NH2CONHNH2)",
            "Formylhydrazine (HCON2H3)",
            "Boc-hydrazine ((CH3)3COCONHNH2)",
            "Hydrazine sulfate (N2H6SO4)",
            "Hydrazine hydrate (N2H4\u00b7H2O)",
            "Hydrazine monohydrochloride (N2H4\u00b7HCl)",
            "Hydrazine dihydrochloride (N2H4\u00b72HCl)",
            "Hydrazine mononitrate (N2H4\u00b7HNO3)",
            "Hydrazine monocarbonate (N2H4\u00b7H2CO3)",
            "Hydrazine monophosphate (N2H4\u00b7H3PO4)",
            "Hydrazine monofluoride (N2H4\u00b7HF)",
            "Hydrazine monobromide (N2H4\u00b7HBr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3N2H3)",
                "Dimethylhydrazine ((CH3)2N2H2)",
                "Phenylhydrazine (C6H5N2H3)",
                "Ethylhydrazine (C2H5N2H3)",
                "Benzylhydrazine (C7H7N2H3)",
                "Hydrazone (R2C=N-NH2)",
                "Acetylhydrazine (CH3CON2H3)",
                "Hydrazinium ion (N2H5+)",
                "Hydrazide (RCONHNH2)",
                "Carbazide (NH2NHCONHNH2)",
                "Thiosemicarbazide (NH2CSNHNH2)",
                "Semicarbazide (NH2CONHNH2)",
                "Formylhydrazine (HCON2H3)",
                "Boc-hydrazine ((CH3)3COCONHNH2)",
                "Hydrazine sulfate (N2H6SO4)",
                "Hydrazine hydrate (N2H4\u00b7H2O)",
                "Hydrazine monohydrochloride (N2H4\u00b7HCl)",
                "Hydrazine dihydrochloride (N2H4\u00b72HCl)",
                "Hydrazine mononitrate (N2H4\u00b7HNO3)",
                "Hydrazine monocarbonate (N2H4\u00b7H2CO3)",
                "Hydrazine monophosphate (N2H4\u00b7H3PO4)",
                "Hydrazine monofluoride (N2H4\u00b7HF)",
                "Hydrazine monobromide (N2H4\u00b7HBr)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetylhydrazine (CH3CON2H3)",
                "Benzylhydrazine (C7H7N2H3)",
                "Boc-hydrazine ((CH3)3COCONHNH2)",
                "Carbazide (NH2NHCONHNH2)",
                "Dimethylhydrazine ((CH3)2N2H2)",
                "Ethylhydrazine (C2H5N2H3)",
                "Formylhydrazine (HCON2H3)",
                "Hydrazide (RCONHNH2)",
                "Hydrazine (N2H4)",
                "Hydrazine dihydrochloride (N2H4\u00b72HCl)",
                "Hydrazine hydrate (N2H4\u00b7H2O)",
                "Hydrazine monobromide (N2H4\u00b7HBr)",
                "Hydrazine monocarbonate (N2H4\u00b7H2CO3)",
                "Hydrazine monofluoride (N2H4\u00b7HF)",
                "Hydrazine monohydrochloride (N2H4\u00b7HCl)",
                "Hydrazine mononitrate (N2H4\u00b7HNO3)",
                "Hydrazine monophosphate (N2H4\u00b7H3PO4)",
                "Hydrazine sulfate (N2H6SO4)",
                "Hydrazinium ion (N2H5+)",
                "Hydrazone (R2C=N-NH2)",
                "Methylhydrazine (CH3N2H3)",
                "Phenylhydrazine (C6H5N2H3)",
                "Semicarbazide (NH2CONHNH2)",
                "Thiosemicarbazide (NH2CSNHNH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Monomethylhydrazine (MMH)",
            "Dimethylhydrazine (DMH)",
            "Ethylhydrazine (EH)",
            "Phenylhydrazine (PH)",
            "Benzylhydrazine (BH)",
            "Carbethoxylhydrazine (CEH)",
            "Acetylhydrazine (AH)",
            "Hydrazobenzene (HB)",
            "Hydrazinecarboxylic acid (HCA)",
            "Hydrazine sulfate (HS)",
            "Tert-butylhydrazine (TBH)",
            "Cyclohexylhydrazine (CHH)",
            "Propylhydrazine (PH)",
            "Isopropylhydrazine (IPH)",
            "Hydrazinylpyridine (HP)",
            "Hydrazine-1-carboxamide (HCA)",
            "Hydrazine-1-methylcarbamate (HMC)",
            "Triazole hydrazine (TH)",
            "Boc-hydrazine (Boc-H)",
            "Hydrazine-1-phenylcarbamate (HPC)",
            "Hydrazine-1,2-dicarboxylic acid (HDCA)",
            "Hydrazine-2-carboxylic acid (HCA)",
            "N,N-Dimethylhydrazine (NDMH)",
            "N,N-Bis(2-hydroxyethyl)hydrazine (BHEH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Monomethylhydrazine (MMH)",
                "Dimethylhydrazine (DMH)",
                "Ethylhydrazine (EH)",
                "Phenylhydrazine (PH)",
                "Benzylhydrazine (BH)",
                "Carbethoxylhydrazine (CEH)",
                "Acetylhydrazine (AH)",
                "Hydrazobenzene (HB)",
                "Hydrazinecarboxylic acid (HCA)",
                "Hydrazine sulfate (HS)",
                "Tert-butylhydrazine (TBH)",
                "Cyclohexylhydrazine (CHH)",
                "Isopropylhydrazine (IPH)",
                "Hydrazinylpyridine (HP)",
                "Hydrazine-1-carboxamide (HCA)",
                "Hydrazine-1-methylcarbamate (HMC)",
                "Triazole hydrazine (TH)",
                "Boc-hydrazine (Boc-H)",
                "Hydrazine-1-phenylcarbamate (HPC)",
                "Hydrazine-1,2-dicarboxylic acid (HDCA)",
                "Hydrazine-2-carboxylic acid (HCA)",
                "N,N-Dimethylhydrazine (NDMH)"
            ],
            "mismatches": [
                "Propylhydrazine (PH)",
                "N,N-Bis(2-hydroxyethyl)hydrazine (BHEH)"
            ],
            "true_referents": [
                "Acetylhydrazine (AH)",
                "Benzylhydrazine (BH)",
                "Boc-hydrazine (Boc-H)",
                "Carbethoxylhydrazine (CEH)",
                "Cyclohexylhydrazine (CHH)",
                "Dimethylhydrazine (DMH)",
                "Ethylhydrazine (EH)",
                "Hydrazine (N2H4)",
                "Hydrazine sulfate (HS)",
                "Hydrazine-1,2-dicarboxylic acid (HDCA)",
                "Hydrazine-1-carboxamide (HCA)",
                "Hydrazine-1-methylcarbamate (HMC)",
                "Hydrazine-1-phenylcarbamate (HPC)",
                "Hydrazine-2-carboxylic acid (HCA)",
                "Hydrazinecarboxylic acid (HCA)",
                "Hydrazinylpyridine (HP)",
                "Hydrazobenzene (HB)",
                "Isopropylhydrazine (IPH)",
                "Monomethylhydrazine (MMH)",
                "N,N-Dimethylhydrazine (NDMH)",
                "Phenylhydrazine (PH)",
                "Propylhydrazine (PH)",
                "Tert-butylhydrazine (TBH)",
                "Triazole hydrazine (TH)"
            ],
            "TP": 23,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3N2H3)",
            "1,1-Dimethylhydrazine (C2H6N2)",
            "1,2-Dimethylhydrazine (C2H6N2)",
            "Ethylhydrazine (C2H5N2H3)",
            "1,1-Diethylhydrazine (C4H10N2)",
            "1,2-Diethylhydrazine (C4H10N2)",
            "Propylhydrazine (C3H7N2H3)",
            "1,1-Dipropylhydrazine (C6H14N2)",
            "1,2-Dipropylhydrazine (C6H14N2)",
            "Butylhydrazine (C4H9N2H3)",
            "1,1-Dibutylhydrazine (C8H18N2)",
            "1,2-Dibutylhydrazine (C8H18N2)",
            "Pentylhydrazine (C5H11N2H3)",
            "1,1-Dipentylhydrazine (C10H22N2)",
            "1,2-Dipentylhydrazine (C10H22N2)",
            "Hexylhydrazine (C6H13N2H3)",
            "1,1-Dihexylhydrazine (C12H26N2)",
            "1,2-Dihexylhydrazine (C12H26N2)",
            "Heptylhydrazine (C7H15N2H3)",
            "1,1-Diheptylhydrazine (C14H30N2)",
            "1,2-Diheptylhydrazine (C14H30N2)",
            "Octylhydrazine (C8H17N2H3)",
            "1,1-Dioctylhydrazine (C16H34N2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "error": "JSON decode error: Expecting value: line 1 column 1 (char 0)",
            "true_referents": [
                "1,1-Dibutylhydrazine (C8H18N2)",
                "1,1-Diethylhydrazine (C4H10N2)",
                "1,1-Diheptylhydrazine (C14H30N2)",
                "1,1-Dihexylhydrazine (C12H26N2)",
                "1,1-Dimethylhydrazine (C2H6N2)",
                "1,1-Dioctylhydrazine (C16H34N2)",
                "1,1-Dipentylhydrazine (C10H22N2)",
                "1,1-Dipropylhydrazine (C6H14N2)",
                "1,2-Dibutylhydrazine (C8H18N2)",
                "1,2-Diethylhydrazine (C4H10N2)",
                "1,2-Diheptylhydrazine (C14H30N2)",
                "1,2-Dihexylhydrazine (C12H26N2)",
                "1,2-Dimethylhydrazine (C2H6N2)",
                "1,2-Dipentylhydrazine (C10H22N2)",
                "1,2-Dipropylhydrazine (C6H14N2)",
                "Butylhydrazine (C4H9N2H3)",
                "Ethylhydrazine (C2H5N2H3)",
                "Heptylhydrazine (C7H15N2H3)",
                "Hexylhydrazine (C6H13N2H3)",
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3N2H3)",
                "Octylhydrazine (C8H17N2H3)",
                "Pentylhydrazine (C5H11N2H3)",
                "Propylhydrazine (C3H7N2H3)"
            ]
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "methylhydrazine (CH3NHNH2)",
            "dimethylhydrazine (CH3NHNHCH3)",
            "trimethylhydrazine (CH3NHN(CH3)2)",
            "ethylhydrazine (C2H5NHNH2)",
            "diethylhydrazine (C2H5NHNHCH2CH3)",
            "propylhydrazine (C3H7NHNH2)",
            "isopropylhydrazine (C3H7NHNHCH3)",
            "butylhydrazine (C4H9NHNH2)",
            "isobutylhydrazine (C4H9NHNHCH3)",
            "sec-butylhydrazine (C4H9NHNHCH2CH3)",
            "tert-butylhydrazine (C4H9NHN(CH3)2)",
            "pentylhydrazine (C5H11NHNH2)",
            "hexylhydrazine (C6H13NHNH2)",
            "heptylhydrazine (C7H15NHNH2)",
            "octylhydrazine (C8H17NHNH2)",
            "nonylhydrazine (C9H19NHNH2)",
            "decylhydrazine (C10H21NHNH2)",
            "undecylhydrazine (C11H23NHNH2)",
            "dodecylhydrazine (C12H25NHNH2)",
            "tridecylhydrazine (C13H27NHNH2)",
            "tetradecylhydrazine (C14H29NHNH2)",
            "pentadecylhydrazine (C15H31NHNH2)",
            "hexadecylhydrazine (C16H33NHNH2)",
            "heptadecylhydrazine (C17H35NHNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methylhydrazine (CH3NHNH2)",
                "dimethylhydrazine (CH3NHNHCH3)",
                "trimethylhydrazine (CH3NHN(CH3)2)",
                "ethylhydrazine (C2H5NHNH2)",
                "diethylhydrazine (C2H5NHNHCH2CH3)",
                "propylhydrazine (C3H7NHNH2)",
                "isopropylhydrazine (C3H7NHNHCH3)",
                "butylhydrazine (C4H9NHNH2)",
                "isobutylhydrazine (C4H9NHNHCH3)",
                "sec-butylhydrazine (C4H9NHNHCH2CH3)",
                "tert-butylhydrazine (C4H9NHN(CH3)2)",
                "pentylhydrazine (C5H11NHNH2)",
                "hexylhydrazine (C6H13NHNH2)",
                "heptylhydrazine (C7H15NHNH2)",
                "octylhydrazine (C8H17NHNH2)",
                "nonylhydrazine (C9H19NHNH2)",
                "decylhydrazine (C10H21NHNH2)",
                "undecylhydrazine (C11H23NHNH2)",
                "dodecylhydrazine (C12H25NHNH2)",
                "tridecylhydrazine (C13H27NHNH2)",
                "tetradecylhydrazine (C14H29NHNH2)",
                "pentadecylhydrazine (C15H31NHNH2)",
                "hexadecylhydrazine (C16H33NHNH2)",
                "heptadecylhydrazine (C17H35NHNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "butylhydrazine (C4H9NHNH2)",
                "decylhydrazine (C10H21NHNH2)",
                "diethylhydrazine (C2H5NHNHCH2CH3)",
                "dimethylhydrazine (CH3NHNHCH3)",
                "dodecylhydrazine (C12H25NHNH2)",
                "ethylhydrazine (C2H5NHNH2)",
                "heptadecylhydrazine (C17H35NHNH2)",
                "heptylhydrazine (C7H15NHNH2)",
                "hexadecylhydrazine (C16H33NHNH2)",
                "hexylhydrazine (C6H13NHNH2)",
                "isobutylhydrazine (C4H9NHNHCH3)",
                "isopropylhydrazine (C3H7NHNHCH3)",
                "methylhydrazine (CH3NHNH2)",
                "nonylhydrazine (C9H19NHNH2)",
                "octylhydrazine (C8H17NHNH2)",
                "pentadecylhydrazine (C15H31NHNH2)",
                "pentylhydrazine (C5H11NHNH2)",
                "propylhydrazine (C3H7NHNH2)",
                "sec-butylhydrazine (C4H9NHNHCH2CH3)",
                "tert-butylhydrazine (C4H9NHN(CH3)2)",
                "tetradecylhydrazine (C14H29NHNH2)",
                "tridecylhydrazine (C13H27NHNH2)",
                "trimethylhydrazine (CH3NHN(CH3)2)",
                "undecylhydrazine (C11H23NHNH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N\u2082H\u2084)",
            "Monomethyl hydrazine (MMH)",
            "Unsymmetrical dimethylhydrazine (UDMH)",
            "Symmetrical dimethylhydrazine",
            "Phenylhydrazine",
            "Benzylhydrazine",
            "Ethylhydrazine",
            "N-Ethylhydrazine",
            "N-Benzylhydrazine",
            "N,N-Dimethylhydrazine",
            "N,N-Diethylhydrazine",
            "N-Methylphenylhydrazine",
            "N-Phenylhydrazine",
            "1,1-Dimethylhydrazine",
            "1,2-Dimethylhydrazine",
            "1,1-Diphenylhydrazine",
            "N,N-Dipropylhydrazine",
            "N,N-Diisopropylhydrazine",
            "N-Allylhydrazine",
            "N-Tert-Butylhydrazine",
            "N-Methyl-N-phenylhydrazine",
            "N-Methylhydrazine",
            "N,N-Dimethyl-1,2-dihydrazine",
            "N,N-Dimethylformohydrazide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N\u2082H\u2084)",
                "Monomethyl hydrazine (MMH)",
                "Unsymmetrical dimethylhydrazine (UDMH)",
                "Symmetrical dimethylhydrazine",
                "Phenylhydrazine",
                "Benzylhydrazine",
                "Ethylhydrazine",
                "N-Ethylhydrazine",
                "N-Benzylhydrazine",
                "N,N-Dimethylhydrazine",
                "N,N-Diethylhydrazine",
                "N-Methylphenylhydrazine",
                "N-Phenylhydrazine",
                "1,1-Dimethylhydrazine",
                "1,2-Dimethylhydrazine",
                "1,1-Diphenylhydrazine",
                "N,N-Dipropylhydrazine",
                "N,N-Diisopropylhydrazine",
                "N-Allylhydrazine",
                "N-Tert-Butylhydrazine",
                "N-Methyl-N-phenylhydrazine",
                "N-Methylhydrazine",
                "N,N-Dimethyl-1,2-dihydrazine",
                "N,N-Dimethylformohydrazide"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1-Dimethylhydrazine",
                "1,1-Diphenylhydrazine",
                "1,2-Dimethylhydrazine",
                "Benzylhydrazine",
                "Ethylhydrazine",
                "Hydrazine (N\u2082H\u2084)",
                "Monomethyl hydrazine (MMH)",
                "N,N-Diethylhydrazine",
                "N,N-Diisopropylhydrazine",
                "N,N-Dimethyl-1,2-dihydrazine",
                "N,N-Dimethylformohydrazide",
                "N,N-Dimethylhydrazine",
                "N,N-Dipropylhydrazine",
                "N-Allylhydrazine",
                "N-Benzylhydrazine",
                "N-Ethylhydrazine",
                "N-Methyl-N-phenylhydrazine",
                "N-Methylhydrazine",
                "N-Methylphenylhydrazine",
                "N-Phenylhydrazine",
                "N-Tert-Butylhydrazine",
                "Phenylhydrazine",
                "Symmetrical dimethylhydrazine",
                "Unsymmetrical dimethylhydrazine (UDMH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3NHNH2)",
            "Dimethylhydrazine ((CH3)2NNH2)",
            "Phenylhydrazine (C6H5NHNH2)",
            "Semicarbazide (H2NNHCONH2)",
            "Thiosemicarbazide (H2NNHCSNH2)",
            "Hydrazobenzene (C6H5NHNHC6H5)",
            "Maleic hydrazide (C4H4N2O2)",
            "Isonicotinic acid hydrazide (Isoniazid)",
            "Hydralazine",
            "Procarbazine",
            "Carbidopa",
            "Phenelzine",
            "Iproniazid",
            "Acetylhydrazine",
            "Benzoylhydrazine",
            "Carbohydrazide (NH2NHCONH2)",
            "Ethylhydrazine (C2H5NHNH2)",
            "Tetramethylhydrazine ((CH3)2NN(CH3)2)",
            "Phenylethylhydrazine (C6H5CH2CH2NHNH2)",
            "1,2-Diphenylhydrazine (C6H5NHNHC6H5)",
            "Nitrohydrazine (O2NNHNH2)",
            "Hydrazinecarboxamide (H2NNHCONH2)",
            "Hydrazinecarbothioamide (H2NNHCSNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3NHNH2)",
                "Dimethylhydrazine ((CH3)2NNH2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "Semicarbazide (H2NNHCONH2)",
                "Thiosemicarbazide (H2NNHCSNH2)",
                "Hydrazobenzene (C6H5NHNHC6H5)",
                "Maleic hydrazide (C4H4N2O2)",
                "Isonicotinic acid hydrazide (Isoniazid)",
                "Hydralazine",
                "Procarbazine",
                "Carbidopa",
                "Phenelzine",
                "Iproniazid",
                "Acetylhydrazine",
                "Benzoylhydrazine",
                "Carbohydrazide (NH2NHCONH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Tetramethylhydrazine ((CH3)2NN(CH3)2)",
                "Phenylethylhydrazine (C6H5CH2CH2NHNH2)",
                "1,2-Diphenylhydrazine (C6H5NHNHC6H5)",
                "Nitrohydrazine (O2NNHNH2)",
                "Hydrazinecarboxamide (H2NNHCONH2)",
                "Hydrazinecarbothioamide (H2NNHCSNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2-Diphenylhydrazine (C6H5NHNHC6H5)",
                "Acetylhydrazine",
                "Benzoylhydrazine",
                "Carbidopa",
                "Carbohydrazide (NH2NHCONH2)",
                "Dimethylhydrazine ((CH3)2NNH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Hydralazine",
                "Hydrazine (N2H4)",
                "Hydrazinecarbothioamide (H2NNHCSNH2)",
                "Hydrazinecarboxamide (H2NNHCONH2)",
                "Hydrazobenzene (C6H5NHNHC6H5)",
                "Iproniazid",
                "Isonicotinic acid hydrazide (Isoniazid)",
                "Maleic hydrazide (C4H4N2O2)",
                "Methylhydrazine (CH3NHNH2)",
                "Nitrohydrazine (O2NNHNH2)",
                "Phenelzine",
                "Phenylethylhydrazine (C6H5CH2CH2NHNH2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "Procarbazine",
                "Semicarbazide (H2NNHCONH2)",
                "Tetramethylhydrazine ((CH3)2NN(CH3)2)",
                "Thiosemicarbazide (H2NNHCSNH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3NHNH2)",
            "1,1-Dimethylhydrazine ((CH3)2NNH2)",
            "1,2-Dimethylhydrazine (CH3NHNHCH3)",
            "Ethylhydrazine (C2H5NHNH2)",
            "1,1-Diethylhydrazine ((C2H5)2NNH2)",
            "1,2-Diethylhydrazine (C2H5NHNHC2H5)",
            "Phenylhydrazine (C6H5NHNH2)",
            "1,1-Diphenylhydrazine ((C6H5)2NNH2)",
            "1,2-Diphenylhydrazine (C6H5NHNHC6H5)",
            "Benzylhydrazine (C6H5CH2NHNH2)",
            "1,1-Dibenzylhydrazine ((C6H5CH2)2NNH2)",
            "1,2-Dibenzylhydrazine (C6H5CH2NHNHCH2C6H5)",
            "tert-Butylhydrazine ((CH3)3CNHNH2)",
            "1,1-Di-tert-butylhydrazine (((CH3)3C)2NNH2)",
            "Isopropylhydrazine ((CH3)2CHNHNH2)",
            "1,1-Diisopropylhydrazine (((CH3)2CH)2NNH2)",
            "Cyclopentylhydrazine (C5H9NHNH2)",
            "1,1-Dicyclopentylhydrazine ((C5H9)2NNH2)",
            "Cyclohexylhydrazine (C6H11NHNH2)",
            "1,1-Dicyclohexylhydrazine ((C6H11)2NNH2)",
            "2-Hydroxyethylhydrazine (HOCH2CH2NHNH2)",
            "Carbohydrazide ((H2NNH)2CO)",
            "Semicarbazide (H2NCONHNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3NHNH2)",
                "1,1-Dimethylhydrazine ((CH3)2NNH2)",
                "1,2-Dimethylhydrazine (CH3NHNHCH3)",
                "Ethylhydrazine (C2H5NHNH2)",
                "1,1-Diethylhydrazine ((C2H5)2NNH2)",
                "1,2-Diethylhydrazine (C2H5NHNHC2H5)",
                "Phenylhydrazine (C6H5NHNH2)",
                "1,1-Diphenylhydrazine ((C6H5)2NNH2)",
                "1,2-Diphenylhydrazine (C6H5NHNHC6H5)",
                "Benzylhydrazine (C6H5CH2NHNH2)",
                "1,1-Dibenzylhydrazine ((C6H5CH2)2NNH2)",
                "1,2-Dibenzylhydrazine (C6H5CH2NHNHCH2C6H5)",
                "tert-Butylhydrazine ((CH3)3CNHNH2)",
                "1,1-Di-tert-butylhydrazine (((CH3)3C)2NNH2)",
                "Isopropylhydrazine ((CH3)2CHNHNH2)",
                "1,1-Diisopropylhydrazine (((CH3)2CH)2NNH2)",
                "Cyclopentylhydrazine (C5H9NHNH2)",
                "1,1-Dicyclopentylhydrazine ((C5H9)2NNH2)",
                "Cyclohexylhydrazine (C6H11NHNH2)",
                "1,1-Dicyclohexylhydrazine ((C6H11)2NNH2)",
                "2-Hydroxyethylhydrazine (HOCH2CH2NHNH2)",
                "Carbohydrazide ((H2NNH)2CO)",
                "Semicarbazide (H2NCONHNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1-Di-tert-butylhydrazine (((CH3)3C)2NNH2)",
                "1,1-Dibenzylhydrazine ((C6H5CH2)2NNH2)",
                "1,1-Dicyclohexylhydrazine ((C6H11)2NNH2)",
                "1,1-Dicyclopentylhydrazine ((C5H9)2NNH2)",
                "1,1-Diethylhydrazine ((C2H5)2NNH2)",
                "1,1-Diisopropylhydrazine (((CH3)2CH)2NNH2)",
                "1,1-Dimethylhydrazine ((CH3)2NNH2)",
                "1,1-Diphenylhydrazine ((C6H5)2NNH2)",
                "1,2-Dibenzylhydrazine (C6H5CH2NHNHCH2C6H5)",
                "1,2-Diethylhydrazine (C2H5NHNHC2H5)",
                "1,2-Dimethylhydrazine (CH3NHNHCH3)",
                "1,2-Diphenylhydrazine (C6H5NHNHC6H5)",
                "2-Hydroxyethylhydrazine (HOCH2CH2NHNH2)",
                "Benzylhydrazine (C6H5CH2NHNH2)",
                "Carbohydrazide ((H2NNH)2CO)",
                "Cyclohexylhydrazine (C6H11NHNH2)",
                "Cyclopentylhydrazine (C5H9NHNH2)",
                "Ethylhydrazine (C2H5NHNH2)",
                "Hydrazine (N2H4)",
                "Isopropylhydrazine ((CH3)2CHNHNH2)",
                "Methylhydrazine (CH3NHNH2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "Semicarbazide (H2NCONHNH2)",
                "tert-Butylhydrazine ((CH3)3CNHNH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3NHNH2)",
            "1,1-Dimethylhydrazine ((CH3)2NNH2)",
            "1,2-Dimethylhydrazine (CH3NHNH(CH3))",
            "1,1,1-Trimethylhydrazinium cation [(CH3)3NNH2]+",
            "Ethylhydrazine (CH3CH2NHNH2)",
            "1-Ethyl-1-methylhydrazine (CH3CH2N(CH3)NH2)",
            "1,1-Diethylhydrazine ((CH3CH2)2NNH2)",
            "1,2-Diethylhydrazine (CH3CH2NHNH(CH3CH2))",
            "Phenylhydrazine (C6H5NHNH2)",
            "1-Methyl-1-phenylhydrazine (C6H5N(CH3)NH2)",
            "1,1-Diphenylhydrazine ((C6H5)2NNH2)",
            "1,2-Diphenylhydrazine (C6H5NHNH(C6H5))",
            "Benzylhydrazine (C6H5CH2NHNH2)",
            "1-Benzyl-1-phenylhydrazine (C6H5CH2N(C6H5)NH2)",
            "2-Methylphenylhydrazine (CH3C6H4NHNH2)",
            "2,4-Dinitrophenylhydrazine ((O2N)2C6H3NHNH2)",
            "Semicarbazide (NH2CONHNH2)",
            "Thiosemicarbazide (NH2CSNH2NH2)",
            "4-Nitrophenylhydrazine (O2NC6H4NHNH2)",
            "2-Hydrazinopyridine (C5H4NNHNH2)",
            "Carbohydrazide (NH2CONHNH2)",
            "Adipohydrazide (NH2CONHNH(CH2)4NHNH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3NHNH2)",
                "1,1-Dimethylhydrazine ((CH3)2NNH2)",
                "1,2-Dimethylhydrazine (CH3NHNH(CH3))",
                "1,1,1-Trimethylhydrazinium cation [(CH3)3NNH2]+",
                "Ethylhydrazine (CH3CH2NHNH2)",
                "1-Ethyl-1-methylhydrazine (CH3CH2N(CH3)NH2)",
                "1,1-Diethylhydrazine ((CH3CH2)2NNH2)",
                "1,2-Diethylhydrazine (CH3CH2NHNH(CH3CH2))",
                "Phenylhydrazine (C6H5NHNH2)",
                "1-Methyl-1-phenylhydrazine (C6H5N(CH3)NH2)",
                "1,1-Diphenylhydrazine ((C6H5)2NNH2)",
                "1,2-Diphenylhydrazine (C6H5NHNH(C6H5))",
                "Benzylhydrazine (C6H5CH2NHNH2)",
                "1-Benzyl-1-phenylhydrazine (C6H5CH2N(C6H5)NH2)",
                "2-Methylphenylhydrazine (CH3C6H4NHNH2)",
                "2,4-Dinitrophenylhydrazine ((O2N)2C6H3NHNH2)",
                "Semicarbazide (NH2CONHNH2)",
                "Thiosemicarbazide (NH2CSNH2NH2)",
                "4-Nitrophenylhydrazine (O2NC6H4NHNH2)",
                "2-Hydrazinopyridine (C5H4NNHNH2)",
                "Carbohydrazide (NH2CONHNH2)",
                "Adipohydrazide (NH2CONHNH(CH2)4NHNH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1,1-Trimethylhydrazinium cation [(CH3)3NNH2]+",
                "1,1-Diethylhydrazine ((CH3CH2)2NNH2)",
                "1,1-Dimethylhydrazine ((CH3)2NNH2)",
                "1,1-Diphenylhydrazine ((C6H5)2NNH2)",
                "1,2-Diethylhydrazine (CH3CH2NHNH(CH3CH2))",
                "1,2-Dimethylhydrazine (CH3NHNH(CH3))",
                "1,2-Diphenylhydrazine (C6H5NHNH(C6H5))",
                "1-Benzyl-1-phenylhydrazine (C6H5CH2N(C6H5)NH2)",
                "1-Ethyl-1-methylhydrazine (CH3CH2N(CH3)NH2)",
                "1-Methyl-1-phenylhydrazine (C6H5N(CH3)NH2)",
                "2,4-Dinitrophenylhydrazine ((O2N)2C6H3NHNH2)",
                "2-Hydrazinopyridine (C5H4NNHNH2)",
                "2-Methylphenylhydrazine (CH3C6H4NHNH2)",
                "4-Nitrophenylhydrazine (O2NC6H4NHNH2)",
                "Adipohydrazide (NH2CONHNH(CH2)4NHNH2)",
                "Benzylhydrazine (C6H5CH2NHNH2)",
                "Carbohydrazide (NH2CONHNH2)",
                "Ethylhydrazine (CH3CH2NHNH2)",
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3NHNH2)",
                "Phenylhydrazine (C6H5NHNH2)",
                "Semicarbazide (NH2CONHNH2)",
                "Thiosemicarbazide (NH2CSNH2NH2)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4)",
            "Methylhydrazine (CH3-N2H3)",
            "Ethylhydrazine (C2H5-N2H3)",
            "Propylhydrazine (C3H7-N2H3)",
            "Butylhydrazine (C4H9-N2H3)",
            "Pentylhydrazine (C5H11-N2H3)",
            "Hexylhydrazine (C6H13-N2H3)",
            "Heptylhydrazine (C7H15-N2H3)",
            "Octylhydrazine (C8H17-N2H3)",
            "Nonylhydrazine (C9H19-N2H3)",
            "Decylhydrazine (C10H21-N2H3)",
            "Undecylhydrazine (C11H23-N2H3)",
            "Dodecylhydrazine (C12H25-N2H3)",
            "Tridecylhydrazine (C13H27-N2H3)",
            "Tetradecylhydrazine (C14H29-N2H3)",
            "Pentadecylhydrazine (C15H31-N2H3)",
            "Hexadecylhydrazine (C16H33-N2H3)",
            "Heptadecylhydrazine (C17H35-N2H3)",
            "Octadecylhydrazine (C18H37-N2H3)",
            "Nonadecylhydrazine (C19H39-N2H3)",
            "Eicosylhydrazine (C20H41-N2H3)",
            "Heneicosylhydrazine (C21H43-N2H3)",
            "Docosylhydrazine (C22H45-N2H3)",
            "Tricosylhydrazine (C23H47-N2H3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3-N2H3)",
                "Ethylhydrazine (C2H5-N2H3)",
                "Propylhydrazine (C3H7-N2H3)",
                "Butylhydrazine (C4H9-N2H3)",
                "Pentylhydrazine (C5H11-N2H3)",
                "Hexylhydrazine (C6H13-N2H3)",
                "Heptylhydrazine (C7H15-N2H3)",
                "Octylhydrazine (C8H17-N2H3)",
                "Nonylhydrazine (C9H19-N2H3)",
                "Decylhydrazine (C10H21-N2H3)",
                "Undecylhydrazine (C11H23-N2H3)",
                "Dodecylhydrazine (C12H25-N2H3)",
                "Tridecylhydrazine (C13H27-N2H3)",
                "Tetradecylhydrazine (C14H29-N2H3)",
                "Pentadecylhydrazine (C15H31-N2H3)",
                "Hexadecylhydrazine (C16H33-N2H3)",
                "Heptadecylhydrazine (C17H35-N2H3)",
                "Octadecylhydrazine (C18H37-N2H3)",
                "Nonadecylhydrazine (C19H39-N2H3)",
                "Eicosylhydrazine (C20H41-N2H3)",
                "Heneicosylhydrazine (C21H43-N2H3)",
                "Docosylhydrazine (C22H45-N2H3)",
                "Tricosylhydrazine (C23H47-N2H3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Butylhydrazine (C4H9-N2H3)",
                "Decylhydrazine (C10H21-N2H3)",
                "Docosylhydrazine (C22H45-N2H3)",
                "Dodecylhydrazine (C12H25-N2H3)",
                "Eicosylhydrazine (C20H41-N2H3)",
                "Ethylhydrazine (C2H5-N2H3)",
                "Heneicosylhydrazine (C21H43-N2H3)",
                "Heptadecylhydrazine (C17H35-N2H3)",
                "Heptylhydrazine (C7H15-N2H3)",
                "Hexadecylhydrazine (C16H33-N2H3)",
                "Hexylhydrazine (C6H13-N2H3)",
                "Hydrazine (N2H4)",
                "Methylhydrazine (CH3-N2H3)",
                "Nonadecylhydrazine (C19H39-N2H3)",
                "Nonylhydrazine (C9H19-N2H3)",
                "Octadecylhydrazine (C18H37-N2H3)",
                "Octylhydrazine (C8H17-N2H3)",
                "Pentadecylhydrazine (C15H31-N2H3)",
                "Pentylhydrazine (C5H11-N2H3)",
                "Propylhydrazine (C3H7-N2H3)",
                "Tetradecylhydrazine (C14H29-N2H3)",
                "Tricosylhydrazine (C23H47-N2H3)",
                "Tridecylhydrazine (C13H27-N2H3)",
                "Undecylhydrazine (C11H23-N2H3)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Aminomethane (Methylamine)",
            "Ethylamine",
            "Propylamine",
            "Butylamine",
            "Pentylamine",
            "Hexylamine",
            "Heptylamine",
            "Octylamine",
            "Nonylamine",
            "Decylamine",
            "Dodecylamine",
            "Tetradecylamine",
            "Hexadecylamine",
            "Octadecylamine",
            "Eicosylamine",
            "Docosylamine",
            "Tetracosylamine",
            "Hexacosylamine",
            "Octacosylamine",
            "Triacontylamine",
            "Dotriacontylamine",
            "Tetatriacontylamine",
            "Hexatriacontylamine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aminomethane (Methylamine)",
                "Ethylamine",
                "Propylamine",
                "Butylamine",
                "Pentylamine",
                "Hexylamine",
                "Heptylamine",
                "Octylamine",
                "Nonylamine",
                "Decylamine",
                "Dodecylamine",
                "Tetradecylamine",
                "Hexadecylamine",
                "Octadecylamine",
                "Eicosylamine",
                "Docosylamine",
                "Tetracosylamine",
                "Hexacosylamine",
                "Octacosylamine",
                "Triacontylamine",
                "Dotriacontylamine",
                "Tetatriacontylamine",
                "Hexatriacontylamine"
            ],
            "mismatches": [],
            "true_referents": [
                "Aminomethane (Methylamine)",
                "Butylamine",
                "Decylamine",
                "Docosylamine",
                "Dodecylamine",
                "Dotriacontylamine",
                "Eicosylamine",
                "Ethylamine",
                "Heptylamine",
                "Hexacosylamine",
                "Hexadecylamine",
                "Hexatriacontylamine",
                "Hexylamine",
                "Nonylamine",
                "Octacosylamine",
                "Octadecylamine",
                "Octylamine",
                "Pentylamine",
                "Propylamine",
                "Tetatriacontylamine",
                "Tetracosylamine",
                "Tetradecylamine",
                "Triacontylamine"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            "Hydrazine (N2H4) itself (HZ)",
            "Methylhydrazine (CH3NHNH2) (MMH)",
            "Dimethylhydrazine (C2H6N2) (UDMH)",
            "Ethylhydrazine (C2H5NHNH2) (EEH)",
            "Phenylhydrazine (C6H5NHNH2) (PHH)",
            "1,1-Dimethylhydrazine (C3H8N2) (UDMH)",
            "1,2-Dimethylhydrazine (C3H8N2) (DDMH)",
            "Diethylhydrazine (C4H10N2) (DEH)",
            "Diphenylhydrazine (C12H12N2) (DPH)",
            "Bis(2-carboxyethyl)hydrazine (C6H10N2O2) (BCHE)",
            "Bis(2-hydroxyethyl)hydrazine (C4H10N2O2) (BHEH)",
            "1-Carbethylhydrazine (C2H6N2O) (CMH)",
            "1-Hydroxymethylhydrazine (C2H6N2O) (HMH)",
            "1-Acetylhydrazine (C3H6N2O) (AEH)",
            "1-Benzoylhydrazine (C8H8N2O) (BEH)",
            "1,2-Bis(acetyl)hydrazine (C6H10N2O2) (BAEH)",
            "1,2-Bis(benzoyl)hydrazine (C16H14N2O2) (BBEH)",
            "1-Carboethoxyhydrazine (C3H8N2O2) (CEH)",
            "1-Carbophenoxyhydrazine (C8H10N2O2) (CPhEH)",
            "1-Hydroxyethoxyhydrazine (C2H8N2O2) (HEEH)",
            "1-Acetoxyhydrazine (C3H6N2O2) (AEH)",
            "1-Benzoxyhydrazine (C8H8N2O2) (BEH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydrazine (N2H4) itself (HZ)",
                "Methylhydrazine (CH3NHNH2) (MMH)",
                "Dimethylhydrazine (C2H6N2) (UDMH)",
                "Ethylhydrazine (C2H5NHNH2) (EEH)",
                "Phenylhydrazine (C6H5NHNH2) (PHH)",
                "1,1-Dimethylhydrazine (C3H8N2) (UDMH)",
                "1,2-Dimethylhydrazine (C3H8N2) (DDMH)",
                "Diethylhydrazine (C4H10N2) (DEH)",
                "Diphenylhydrazine (C12H12N2) (DPH)",
                "Bis(2-carboxyethyl)hydrazine (C6H10N2O2) (BCHE)",
                "Bis(2-hydroxyethyl)hydrazine (C4H10N2O2) (BHEH)",
                "1-Carbethylhydrazine (C2H6N2O) (CMH)",
                "1-Hydroxymethylhydrazine (C2H6N2O) (HMH)",
                "1-Acetylhydrazine (C3H6N2O) (AEH)",
                "1-Benzoylhydrazine (C8H8N2O) (BEH)",
                "1,2-Bis(acetyl)hydrazine (C6H10N2O2) (BAEH)",
                "1,2-Bis(benzoyl)hydrazine (C16H14N2O2) (BBEH)",
                "1-Carboethoxyhydrazine (C3H8N2O2) (CEH)",
                "1-Carbophenoxyhydrazine (C8H10N2O2) (CPhEH)",
                "1-Hydroxyethoxyhydrazine (C2H8N2O2) (HEEH)",
                "1-Acetoxyhydrazine (C3H6N2O2) (AEH)",
                "1-Benzoxyhydrazine (C8H8N2O2) (BEH)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1-Dimethylhydrazine (C3H8N2) (UDMH)",
                "1,2-Bis(acetyl)hydrazine (C6H10N2O2) (BAEH)",
                "1,2-Bis(benzoyl)hydrazine (C16H14N2O2) (BBEH)",
                "1,2-Dimethylhydrazine (C3H8N2) (DDMH)",
                "1-Acetoxyhydrazine (C3H6N2O2) (AEH)",
                "1-Acetylhydrazine (C3H6N2O) (AEH)",
                "1-Benzoxyhydrazine (C8H8N2O2) (BEH)",
                "1-Benzoylhydrazine (C8H8N2O) (BEH)",
                "1-Carbethylhydrazine (C2H6N2O) (CMH)",
                "1-Carboethoxyhydrazine (C3H8N2O2) (CEH)",
                "1-Carbophenoxyhydrazine (C8H10N2O2) (CPhEH)",
                "1-Hydroxyethoxyhydrazine (C2H8N2O2) (HEEH)",
                "1-Hydroxymethylhydrazine (C2H6N2O) (HMH)",
                "Bis(2-carboxyethyl)hydrazine (C6H10N2O2) (BCHE)",
                "Bis(2-hydroxyethyl)hydrazine (C4H10N2O2) (BHEH)",
                "Diethylhydrazine (C4H10N2) (DEH)",
                "Dimethylhydrazine (C2H6N2) (UDMH)",
                "Diphenylhydrazine (C12H12N2) (DPH)",
                "Ethylhydrazine (C2H5NHNH2) (EEH)",
                "Hydrazine (N2H4) itself (HZ)",
                "Methylhydrazine (CH3NHNH2) (MMH)",
                "Phenylhydrazine (C6H5NHNH2) (PHH)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "hydrazine",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "N2H4",
                "Canonical name": "Nitrous oxide"
            },
            {
                "Referent": "N2H4 (N2H2)",
                "Canonical name": "Dinitrogen"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrous oxide",
                "Dinitrogen"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"N2H4 (N2H2)\", \"Canonical name\": \"Dinitrogen\"}",
                "{\"Referent\": \"N2H4\", \"Canonical name\": \"Nitrous oxide\"}"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    }
]