[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "methyl (CH3)",
            "ethyl (C2H5)",
            "propyl (C3H7)",
            "butyl (C4H9)",
            "methoxy (-OCH3)",
            "ethoxy (-OC2H5)",
            "propoxy (-OC3H7)",
            "butoxy (-OC4H9)",
            "methylthio (-SC2H5)",
            "ethylthio (-SC2H5)",
            "aminomethyl (-CH2NH2)",
            "aminopropyl (-C3H6NH2)",
            "carboxyl (-COOH)",
            "cyanide (-CN)",
            "nitro (-NO2)",
            "hydroxyl (-OH)",
            "halogens (F, Cl, Br, I)",
            "sulfhydryl (-SH)",
            "alkene (C=C)",
            "alkyne (-C\u2261C-)",
            "amide (-CONH2)",
            "ester (-COOR)",
            "ketone (-CO-)",
            "aldehyde (-CHO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methyl (CH3)",
                "ethyl (C2H5)",
                "propyl (C3H7)",
                "butyl (C4H9)",
                "methoxy (-OCH3)",
                "ethoxy (-OC2H5)",
                "propoxy (-OC3H7)",
                "butoxy (-OC4H9)",
                "methylthio (-SC2H5)",
                "ethylthio (-SC2H5)",
                "aminomethyl (-CH2NH2)",
                "aminopropyl (-C3H6NH2)",
                "carboxyl (-COOH)",
                "cyanide (-CN)",
                "nitro (-NO2)",
                "hydroxyl (-OH)",
                "halogens (F, Cl, Br, I)",
                "sulfhydryl (-SH)",
                "alkene (C=C)",
                "alkyne (-C\u2261C-)",
                "amide (-CONH2)",
                "ester (-COOR)",
                "ketone (-CO-)",
                "aldehyde (-CHO)"
            ],
            "mismatches": [],
            "true_referents": [
                "aldehyde (-CHO)",
                "alkene (C=C)",
                "alkyne (-C\u2261C-)",
                "amide (-CONH2)",
                "aminomethyl (-CH2NH2)",
                "aminopropyl (-C3H6NH2)",
                "butoxy (-OC4H9)",
                "butyl (C4H9)",
                "carboxyl (-COOH)",
                "cyanide (-CN)",
                "ester (-COOR)",
                "ethoxy (-OC2H5)",
                "ethyl (C2H5)",
                "ethylthio (-SC2H5)",
                "halogens (F, Cl, Br, I)",
                "hydroxyl (-OH)",
                "ketone (-CO-)",
                "methoxy (-OCH3)",
                "methyl (CH3)",
                "methylthio (-SC2H5)",
                "nitro (-NO2)",
                "propoxy (-OC3H7)",
                "propyl (C3H7)",
                "sulfhydryl (-SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (-OH)",
            "Carboxyl group (-COOH)",
            "Amino group (-NH2)",
            "Methyl group (-CH3)",
            "Phenyl group (C6H5-)",
            "Hydroperoxyl group (-OOH)",
            "Alkoxyl group (-OR)",
            "Alkoxy group (-OR, where R is an alkyl group)",
            "Carbonyl group (C=O)",
            "Carbonyl group (ketone, >C=O)",
            "Carbonyl group (aldehyde, -CHO)",
            "Nitro group (-NO2)",
            "Sulfhydryl group (-SH)",
            "Thiol group (-SH)",
            "Sulfonic acid group (-SO3H)",
            "Sulfonyl group (-SO2-)",
            "Phosphate group (-PO4H2)",
            "Acetyl group (-COCH3)",
            "Benzyl group (C6H5CH2-)",
            "Formyl group (-CHO)",
            "Cyano group (-CN)",
            "Iodo group (-I)",
            "Bromo group (-Br)",
            "Chloro group (-Cl)",
            "Fluoro group (-F)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (-OH)",
                "Carboxyl group (-COOH)",
                "Amino group (-NH2)",
                "Methyl group (-CH3)",
                "Phenyl group (C6H5-)",
                "Hydroperoxyl group (-OOH)",
                "Alkoxyl group (-OR)",
                "Alkoxy group (-OR, where R is an alkyl group)",
                "Carbonyl group (C=O)",
                "Carbonyl group (ketone, >C=O)",
                "Carbonyl group (aldehyde, -CHO)",
                "Nitro group (-NO2)",
                "Sulfhydryl group (-SH)",
                "Thiol group (-SH)",
                "Sulfonic acid group (-SO3H)",
                "Sulfonyl group (-SO2-)",
                "Phosphate group (-PO4H2)",
                "Acetyl group (-COCH3)",
                "Benzyl group (C6H5CH2-)",
                "Formyl group (-CHO)",
                "Cyano group (-CN)",
                "Iodo group (-I)",
                "Bromo group (-Br)",
                "Chloro group (-Cl)"
            ],
            "mismatches": [
                "Fluoro group (-F)"
            ],
            "true_referents": [
                "Acetyl group (-COCH3)",
                "Alkoxy group (-OR, where R is an alkyl group)",
                "Alkoxyl group (-OR)",
                "Amino group (-NH2)",
                "Benzyl group (C6H5CH2-)",
                "Bromo group (-Br)",
                "Carbonyl group (C=O)",
                "Carbonyl group (aldehyde, -CHO)",
                "Carbonyl group (ketone, >C=O)",
                "Carboxyl group (-COOH)",
                "Chloro group (-Cl)",
                "Cyano group (-CN)",
                "Formyl group (-CHO)",
                "Hydroperoxyl group (-OOH)",
                "Hydroxyl group (-OH)",
                "Iodo group (-I)",
                "Methyl group (-CH3)",
                "Nitro group (-NO2)",
                "Phenyl group (C6H5-)",
                "Phosphate group (-PO4H2)",
                "Sulfhydryl group (-SH)",
                "Sulfonic acid group (-SO3H)",
                "Sulfonyl group (-SO2-)",
                "Thiol group (-SH)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (CH3-)",
            "Ethyl group (C2H5-)",
            "Hydroxyl group (-OH)",
            "Carboxyl group (-COOH)",
            "Amino group (-NH2)",
            "Methylmercaptan group (-SCH3)",
            "Nitro group (-NO2)",
            "Sulfhydryl group (-SH)",
            "Phenyl group (C6H5-)",
            "Acyloxy group (-OCO-)",
            "Cyano group (-CN)",
            "Formyl group (-CHO)",
            "Acetyl group (-COCH3)",
            "Carbamoyl group (-CONH2)",
            "Ester group (-COOR)",
            "Amide group (-CONH2)",
            "Aldehyde group (-CHO)",
            "Ketone group (-CO-)",
            "Ether group (-O-)",
            "Halogen group (-X, where X is F, Cl, Br, I)",
            "Sulfonyl group (-SO2-)",
            "Phosphoryl group (-PO3-)",
            "Methoxy group (-OCH3)",
            "Epoxide group (-O-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (CH3-)",
                "Ethyl group (C2H5-)",
                "Hydroxyl group (-OH)",
                "Carboxyl group (-COOH)",
                "Amino group (-NH2)",
                "Methylmercaptan group (-SCH3)",
                "Nitro group (-NO2)",
                "Sulfhydryl group (-SH)",
                "Phenyl group (C6H5-)",
                "Acyloxy group (-OCO-)",
                "Cyano group (-CN)",
                "Formyl group (-CHO)",
                "Acetyl group (-COCH3)",
                "Carbamoyl group (-CONH2)",
                "Ester group (-COOR)",
                "Amide group (-CONH2)",
                "Aldehyde group (-CHO)",
                "Ketone group (-CO-)",
                "Ether group (-O-)",
                "Halogen group (-X, where X is F, Cl, Br, I)",
                "Sulfonyl group (-SO2-)",
                "Phosphoryl group (-PO3-)",
                "Methoxy group (-OCH3)",
                "Epoxide group (-O-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (-COCH3)",
                "Acyloxy group (-OCO-)",
                "Aldehyde group (-CHO)",
                "Amide group (-CONH2)",
                "Amino group (-NH2)",
                "Carbamoyl group (-CONH2)",
                "Carboxyl group (-COOH)",
                "Cyano group (-CN)",
                "Epoxide group (-O-)",
                "Ester group (-COOR)",
                "Ether group (-O-)",
                "Ethyl group (C2H5-)",
                "Formyl group (-CHO)",
                "Halogen group (-X, where X is F, Cl, Br, I)",
                "Hydroxyl group (-OH)",
                "Ketone group (-CO-)",
                "Methoxy group (-OCH3)",
                "Methyl group (CH3-)",
                "Methylmercaptan group (-SCH3)",
                "Nitro group (-NO2)",
                "Phenyl group (C6H5-)",
                "Phosphoryl group (-PO3-)",
                "Sulfhydryl group (-SH)",
                "Sulfonyl group (-SO2-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (Me)",
            "Ethyl group (Et)",
            "Isopropyl group (iPr)",
            "tert-Butyl group (tBu)",
            "Phenyl group (Ph)",
            "Hydroxyl group (OH)",
            "Amino group (NH2)",
            "Carboxyl group (COOH)",
            "Aldehyde group (CHO)",
            "Ketone group (C=O)",
            "Ether group (R-O-R')",
            "Ester group (R-COO-R')",
            "Amide group (R-CO-NH2)",
            "Nitro group (NO2)",
            "Halogen (F, Cl, Br, I)",
            "Cyano group (CN)",
            "Sulfhydryl group (SH)",
            "Phosphoryl group (PO4H2)",
            "Acetyl group (COCH3)",
            "Benzoyl group (COC6H5)",
            "Trifluoromethyl group (CF3)",
            "Methoxy group (OCH3)",
            "Formyl group (CHO)",
            "Vinyl group (CH2=CH-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (Me)",
                "Ethyl group (Et)",
                "Isopropyl group (iPr)",
                "tert-Butyl group (tBu)",
                "Phenyl group (Ph)",
                "Hydroxyl group (OH)",
                "Amino group (NH2)",
                "Carboxyl group (COOH)",
                "Aldehyde group (CHO)",
                "Ketone group (C=O)",
                "Ether group (R-O-R')",
                "Ester group (R-COO-R')",
                "Amide group (R-CO-NH2)",
                "Nitro group (NO2)",
                "Halogen (F, Cl, Br, I)",
                "Cyano group (CN)",
                "Sulfhydryl group (SH)",
                "Phosphoryl group (PO4H2)",
                "Acetyl group (COCH3)",
                "Benzoyl group (COC6H5)",
                "Trifluoromethyl group (CF3)",
                "Methoxy group (OCH3)",
                "Formyl group (CHO)",
                "Vinyl group (CH2=CH-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (COCH3)",
                "Aldehyde group (CHO)",
                "Amide group (R-CO-NH2)",
                "Amino group (NH2)",
                "Benzoyl group (COC6H5)",
                "Carboxyl group (COOH)",
                "Cyano group (CN)",
                "Ester group (R-COO-R')",
                "Ether group (R-O-R')",
                "Ethyl group (Et)",
                "Formyl group (CHO)",
                "Halogen (F, Cl, Br, I)",
                "Hydroxyl group (OH)",
                "Isopropyl group (iPr)",
                "Ketone group (C=O)",
                "Methoxy group (OCH3)",
                "Methyl group (Me)",
                "Nitro group (NO2)",
                "Phenyl group (Ph)",
                "Phosphoryl group (PO4H2)",
                "Sulfhydryl group (SH)",
                "Trifluoromethyl group (CF3)",
                "Vinyl group (CH2=CH-)",
                "tert-Butyl group (tBu)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl Group (OH)",
            "Carboxyl Group (COOH)",
            "Amino Group (NH2)",
            "Phosphate Group (PO4)",
            "Methyl Group (CH3)",
            "Ethyl Group (C2H5)",
            "Carbonyl Group (C=O)",
            "Aldehyde Group (CHO)",
            "Ketone Group (RCOR')",
            "Sulfhydryl Group (SH)",
            "Nitro Group (NO2)",
            "Amide Group (CONH2)",
            "Ester Group (COOR)",
            "Ether Group (ROR')",
            "Halogen Group (X)",
            "Thiol Group (RSH)",
            "Acetyl Group (COCH3)",
            "Vinyl Group (C2H3)",
            "Phenyl Group (C6H5)",
            "Cyano Group (CN)",
            "Isopropyl Group (C3H7)",
            "Benzyl Group (C6H5CH2)",
            "Allyl Group (C3H5)",
            "Isobutyl Group (C4H9)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl Group (OH)",
                "Carboxyl Group (COOH)",
                "Amino Group (NH2)",
                "Phosphate Group (PO4)",
                "Methyl Group (CH3)",
                "Ethyl Group (C2H5)",
                "Carbonyl Group (C=O)",
                "Aldehyde Group (CHO)",
                "Ketone Group (RCOR')",
                "Sulfhydryl Group (SH)",
                "Nitro Group (NO2)",
                "Amide Group (CONH2)",
                "Ester Group (COOR)",
                "Ether Group (ROR')",
                "Halogen Group (X)",
                "Thiol Group (RSH)",
                "Acetyl Group (COCH3)",
                "Vinyl Group (C2H3)",
                "Phenyl Group (C6H5)",
                "Cyano Group (CN)",
                "Isopropyl Group (C3H7)",
                "Benzyl Group (C6H5CH2)",
                "Allyl Group (C3H5)",
                "Isobutyl Group (C4H9)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl Group (COCH3)",
                "Aldehyde Group (CHO)",
                "Allyl Group (C3H5)",
                "Amide Group (CONH2)",
                "Amino Group (NH2)",
                "Benzyl Group (C6H5CH2)",
                "Carbonyl Group (C=O)",
                "Carboxyl Group (COOH)",
                "Cyano Group (CN)",
                "Ester Group (COOR)",
                "Ether Group (ROR')",
                "Ethyl Group (C2H5)",
                "Halogen Group (X)",
                "Hydroxyl Group (OH)",
                "Isobutyl Group (C4H9)",
                "Isopropyl Group (C3H7)",
                "Ketone Group (RCOR')",
                "Methyl Group (CH3)",
                "Nitro Group (NO2)",
                "Phenyl Group (C6H5)",
                "Phosphate Group (PO4)",
                "Sulfhydryl Group (SH)",
                "Thiol Group (RSH)",
                "Vinyl Group (C2H3)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (\u2212CH3)",
            "Ethyl group (\u2212C2H5)",
            "Propyl group (\u2212C3H7)",
            "Butyl group (\u2212C4H9)",
            "Isopropyl group (\u2212C3H7)",
            "Amino group (\u2212NH2)",
            "Hydroxyl group (\u2212OH)",
            "Carboxyl group (\u2212COOH)",
            "Nitro group (\u2212NO2)",
            "Allyl group (\u2212C3H5)",
            "Vinyl group (\u2212C2H3)",
            "Phenyl group (\u2212C6H5)",
            "Benzyl group (\u2212C7H7)",
            "Cyclopropyl group (\u2212C3H5)",
            "Cyclobutyl group (\u2212C4H7)",
            "Cyclopentyl group (\u2212C5H9)",
            "Cyclohexyl group (\u2212C6H11)",
            "Thioether group (\u2212S\u2212)",
            "Sulfhydryl group (\u2212SH)",
            "Phosphoryl group (\u2212PO4)",
            "Cyanide group (\u2212CN)",
            "Formyl group (\u2212CHO)",
            "Iodopropyl group (\u2212C3H7I)",
            "Fluoromethyl group (\u2212CH2F)",
            "Chloromethyl group (\u2212CH2Cl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (\u2212CH3)",
                "Ethyl group (\u2212C2H5)",
                "Propyl group (\u2212C3H7)",
                "Butyl group (\u2212C4H9)",
                "Isopropyl group (\u2212C3H7)",
                "Amino group (\u2212NH2)",
                "Hydroxyl group (\u2212OH)",
                "Carboxyl group (\u2212COOH)",
                "Nitro group (\u2212NO2)",
                "Allyl group (\u2212C3H5)",
                "Vinyl group (\u2212C2H3)",
                "Phenyl group (\u2212C6H5)",
                "Benzyl group (\u2212C7H7)",
                "Cyclopropyl group (\u2212C3H5)",
                "Cyclobutyl group (\u2212C4H7)",
                "Cyclopentyl group (\u2212C5H9)",
                "Cyclohexyl group (\u2212C6H11)",
                "Thioether group (\u2212S\u2212)",
                "Sulfhydryl group (\u2212SH)",
                "Phosphoryl group (\u2212PO4)",
                "Cyanide group (\u2212CN)",
                "Formyl group (\u2212CHO)",
                "Iodopropyl group (\u2212C3H7I)",
                "Fluoromethyl group (\u2212CH2F)"
            ],
            "mismatches": [
                "Chloromethyl group (\u2212CH2Cl)"
            ],
            "true_referents": [
                "Allyl group (\u2212C3H5)",
                "Amino group (\u2212NH2)",
                "Benzyl group (\u2212C7H7)",
                "Butyl group (\u2212C4H9)",
                "Carboxyl group (\u2212COOH)",
                "Cyanide group (\u2212CN)",
                "Cyclobutyl group (\u2212C4H7)",
                "Cyclohexyl group (\u2212C6H11)",
                "Cyclopentyl group (\u2212C5H9)",
                "Cyclopropyl group (\u2212C3H5)",
                "Ethyl group (\u2212C2H5)",
                "Fluoromethyl group (\u2212CH2F)",
                "Formyl group (\u2212CHO)",
                "Hydroxyl group (\u2212OH)",
                "Iodopropyl group (\u2212C3H7I)",
                "Isopropyl group (\u2212C3H7)",
                "Methyl group (\u2212CH3)",
                "Nitro group (\u2212NO2)",
                "Phenyl group (\u2212C6H5)",
                "Phosphoryl group (\u2212PO4)",
                "Propyl group (\u2212C3H7)",
                "Sulfhydryl group (\u2212SH)",
                "Thioether group (\u2212S\u2212)",
                "Vinyl group (\u2212C2H3)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (OH)",
            "Methyl group (CH3)",
            "Carboxyl group (COOH)",
            "Amino group (NH2)",
            "Phosphate group (PO4)",
            "Sulfhydryl group (SH)",
            "Aldehyde group (CHO)",
            "Ketone group (RCOR')",
            "Ester group (RCOO)",
            "Ether group (ROR')",
            "Aryl group (Ar)",
            "Vinyl group (C2H3)",
            "Acyl group (RCO)",
            "Alkyl group (R)",
            "Amide group (CONH2)",
            "Carbonyl group (C=O)",
            "Cyanide group (CN)",
            "Epoxide group (COC)",
            "Guanidinium group (C(NH2)3)",
            "Imine group (CN)",
            "Isocyanate group (NCO)",
            "Nitrate group (NO3)",
            "Nitro group (NO2)",
            "Sulfate group (SO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (OH)",
                "Methyl group (CH3)",
                "Carboxyl group (COOH)",
                "Amino group (NH2)",
                "Phosphate group (PO4)",
                "Sulfhydryl group (SH)",
                "Aldehyde group (CHO)",
                "Ketone group (RCOR')",
                "Ester group (RCOO)",
                "Ether group (ROR')",
                "Aryl group (Ar)",
                "Vinyl group (C2H3)",
                "Acyl group (RCO)",
                "Alkyl group (R)",
                "Amide group (CONH2)",
                "Carbonyl group (C=O)",
                "Cyanide group (CN)",
                "Epoxide group (COC)",
                "Guanidinium group (C(NH2)3)",
                "Imine group (CN)",
                "Isocyanate group (NCO)",
                "Nitrate group (NO3)",
                "Nitro group (NO2)",
                "Sulfate group (SO4)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl group (RCO)",
                "Aldehyde group (CHO)",
                "Alkyl group (R)",
                "Amide group (CONH2)",
                "Amino group (NH2)",
                "Aryl group (Ar)",
                "Carbonyl group (C=O)",
                "Carboxyl group (COOH)",
                "Cyanide group (CN)",
                "Epoxide group (COC)",
                "Ester group (RCOO)",
                "Ether group (ROR')",
                "Guanidinium group (C(NH2)3)",
                "Hydroxyl group (OH)",
                "Imine group (CN)",
                "Isocyanate group (NCO)",
                "Ketone group (RCOR')",
                "Methyl group (CH3)",
                "Nitrate group (NO3)",
                "Nitro group (NO2)",
                "Phosphate group (PO4)",
                "Sulfate group (SO4)",
                "Sulfhydryl group (SH)",
                "Vinyl group (C2H3)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (CH3)",
            "Ethyl group (C2H5)",
            "Propyl group (C3H7)",
            "Isopropyl group (C3H7)",
            "Butyl group (C4H9)",
            "Isobutyl group (C4H9)",
            "Pentyl group (C5H11)",
            "Hexyl group (C6H13)",
            "Heptyl group (C7H15)",
            "Octyl group (C8H17)",
            "Nonyl group (C9H19)",
            "Decyl group (C10H21)",
            "Phenyl group (C6H5)",
            "Benzyl group (C6H5CH2)",
            "Allyl group (C3H5)",
            "Vinyl group (CH2=CH)",
            "Acetyl group (CH3CO)",
            "Formyl group (CHO)",
            "Hydroxyl group (OH)",
            "Amino group (NH2)",
            "Carboxyl group (COOH)",
            "Sulfhydryl group (SH)",
            "Phosphate group (PO4)",
            "Methylamine group (CH3NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (CH3)",
                "Ethyl group (C2H5)",
                "Propyl group (C3H7)",
                "Isopropyl group (C3H7)",
                "Butyl group (C4H9)",
                "Isobutyl group (C4H9)",
                "Pentyl group (C5H11)",
                "Hexyl group (C6H13)",
                "Heptyl group (C7H15)",
                "Octyl group (C8H17)",
                "Nonyl group (C9H19)",
                "Decyl group (C10H21)",
                "Phenyl group (C6H5)",
                "Benzyl group (C6H5CH2)",
                "Allyl group (C3H5)",
                "Vinyl group (CH2=CH)",
                "Acetyl group (CH3CO)",
                "Formyl group (CHO)",
                "Hydroxyl group (OH)",
                "Amino group (NH2)",
                "Carboxyl group (COOH)",
                "Sulfhydryl group (SH)",
                "Phosphate group (PO4)",
                "Methylamine group (CH3NH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (CH3CO)",
                "Allyl group (C3H5)",
                "Amino group (NH2)",
                "Benzyl group (C6H5CH2)",
                "Butyl group (C4H9)",
                "Carboxyl group (COOH)",
                "Decyl group (C10H21)",
                "Ethyl group (C2H5)",
                "Formyl group (CHO)",
                "Heptyl group (C7H15)",
                "Hexyl group (C6H13)",
                "Hydroxyl group (OH)",
                "Isobutyl group (C4H9)",
                "Isopropyl group (C3H7)",
                "Methyl group (CH3)",
                "Methylamine group (CH3NH2)",
                "Nonyl group (C9H19)",
                "Octyl group (C8H17)",
                "Pentyl group (C5H11)",
                "Phenyl group (C6H5)",
                "Phosphate group (PO4)",
                "Propyl group (C3H7)",
                "Sulfhydryl group (SH)",
                "Vinyl group (CH2=CH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (\u2013OH)",
            "Carbonyl group (C=O)",
            "Carboxyl group (\u2013COOH)",
            "Amino group (\u2013NH\u2082)",
            "Methyl group (\u2013CH\u2083)",
            "Ethyl group (\u2013C\u2082H\u2085)",
            "Sulfhydryl group (\u2013SH)",
            "Phosphate group (\u2013PO\u2084\u00b2\u207b)",
            "Nitro group (\u2013NO\u2082)",
            "Alkene group (C=C)",
            "Alkyne group (C\u2261C)",
            "Aldehyde group (\u2013CHO)",
            "Ester group (\u2013COO\u2013)",
            "Ether group (\u2013O\u2013)",
            "Amide group (\u2013CONH\u2082)",
            "Phenyl group (\u2013C\u2086H\u2085)",
            "Vinyl group (\u2013CH=CH\u2082)",
            "Bromo group (\u2013Br)",
            "Chloro group (\u2013Cl)",
            "Iodo group (\u2013I)",
            "Fluoro group (\u2013F)",
            "Sulfonic acid group (\u2013SO\u2083H)",
            "Nitrile group (\u2013C\u2261N)",
            "Peroxide group (\u2013OOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (\u2013OH)",
                "Carbonyl group (C=O)",
                "Carboxyl group (\u2013COOH)",
                "Amino group (\u2013NH\u2082)",
                "Methyl group (\u2013CH\u2083)",
                "Ethyl group (\u2013C\u2082H\u2085)",
                "Sulfhydryl group (\u2013SH)",
                "Phosphate group (\u2013PO\u2084\u00b2\u207b)",
                "Nitro group (\u2013NO\u2082)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Aldehyde group (\u2013CHO)",
                "Ester group (\u2013COO\u2013)",
                "Ether group (\u2013O\u2013)",
                "Amide group (\u2013CONH\u2082)",
                "Phenyl group (\u2013C\u2086H\u2085)",
                "Vinyl group (\u2013CH=CH\u2082)",
                "Bromo group (\u2013Br)",
                "Chloro group (\u2013Cl)",
                "Iodo group (\u2013I)",
                "Fluoro group (\u2013F)",
                "Sulfonic acid group (\u2013SO\u2083H)",
                "Nitrile group (\u2013C\u2261N)",
                "Peroxide group (\u2013OOH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldehyde group (\u2013CHO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Amide group (\u2013CONH\u2082)",
                "Amino group (\u2013NH\u2082)",
                "Bromo group (\u2013Br)",
                "Carbonyl group (C=O)",
                "Carboxyl group (\u2013COOH)",
                "Chloro group (\u2013Cl)",
                "Ester group (\u2013COO\u2013)",
                "Ether group (\u2013O\u2013)",
                "Ethyl group (\u2013C\u2082H\u2085)",
                "Fluoro group (\u2013F)",
                "Hydroxyl group (\u2013OH)",
                "Iodo group (\u2013I)",
                "Methyl group (\u2013CH\u2083)",
                "Nitrile group (\u2013C\u2261N)",
                "Nitro group (\u2013NO\u2082)",
                "Peroxide group (\u2013OOH)",
                "Phenyl group (\u2013C\u2086H\u2085)",
                "Phosphate group (\u2013PO\u2084\u00b2\u207b)",
                "Sulfhydryl group (\u2013SH)",
                "Sulfonic acid group (\u2013SO\u2083H)",
                "Vinyl group (\u2013CH=CH\u2082)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (-OH)",
            "Carboxyl group (-COOH)",
            "Amino group (-NH2)",
            "Methyl group (-CH3)",
            "Carbonyl group (C=O)",
            "Aldehyde group (-CHO)",
            "Ketone group (-CO-)",
            "Ether group (-O-)",
            "Ester group (-COO-)",
            "Amide group (-CONH2)",
            "Thiol group (-SH)",
            "Halogen (F, Cl, Br, I)",
            "Nitro group (-NO2)",
            "Sulfonic acid group (-SO3H)",
            "Phosphate group (-PO4)",
            "Cyano group (-CN)",
            "Alkyl group (CnH2n+1-)",
            "Phenyl group (C6H5-)",
            "Benzyl group (C6H5CH2-)",
            "Vinyl group (-CH=CH2)",
            "Acetyl group (CH3CO-)",
            "Trifluoromethyl group (-CF3)",
            "Sulfonyl group (-SO2-)",
            "Isopropyl group (-CH(CH3)2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (-OH)",
                "Carboxyl group (-COOH)",
                "Amino group (-NH2)",
                "Methyl group (-CH3)",
                "Carbonyl group (C=O)",
                "Aldehyde group (-CHO)",
                "Ketone group (-CO-)",
                "Ether group (-O-)",
                "Ester group (-COO-)",
                "Amide group (-CONH2)",
                "Thiol group (-SH)",
                "Halogen (F, Cl, Br, I)",
                "Nitro group (-NO2)",
                "Sulfonic acid group (-SO3H)",
                "Phosphate group (-PO4)",
                "Cyano group (-CN)",
                "Alkyl group (CnH2n+1-)",
                "Phenyl group (C6H5-)",
                "Benzyl group (C6H5CH2-)",
                "Vinyl group (-CH=CH2)",
                "Acetyl group (CH3CO-)",
                "Trifluoromethyl group (-CF3)",
                "Sulfonyl group (-SO2-)",
                "Isopropyl group (-CH(CH3)2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (CH3CO-)",
                "Aldehyde group (-CHO)",
                "Alkyl group (CnH2n+1-)",
                "Amide group (-CONH2)",
                "Amino group (-NH2)",
                "Benzyl group (C6H5CH2-)",
                "Carbonyl group (C=O)",
                "Carboxyl group (-COOH)",
                "Cyano group (-CN)",
                "Ester group (-COO-)",
                "Ether group (-O-)",
                "Halogen (F, Cl, Br, I)",
                "Hydroxyl group (-OH)",
                "Isopropyl group (-CH(CH3)2)",
                "Ketone group (-CO-)",
                "Methyl group (-CH3)",
                "Nitro group (-NO2)",
                "Phenyl group (C6H5-)",
                "Phosphate group (-PO4)",
                "Sulfonic acid group (-SO3H)",
                "Sulfonyl group (-SO2-)",
                "Thiol group (-SH)",
                "Trifluoromethyl group (-CF3)",
                "Vinyl group (-CH=CH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (Me)",
            "Ethyl group (Et)",
            "Propyl group (Pr)",
            "Butyl group (Bu)",
            "Pentyl group",
            "Hexyl group",
            "Heptyl group",
            "Octyl group",
            "Nonyl group",
            "Decyl group",
            "Phenyl group (Ph)",
            "Benzyl group (Bn)",
            "Hydroxyl group (OH)",
            "Carboxyl group (COOH)",
            "Amino group (NH2)",
            "Cyano group (CN)",
            "Nitro group (NO2)",
            "Sulfhydryl group (SH)",
            "Phosphate group (PO4)",
            "Acetyl group (Ac)",
            "Formyl group (CHO)",
            "Amido group (CONH2)",
            "Ester group (COOR)",
            "Ether group (OR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (Me)",
                "Ethyl group (Et)",
                "Propyl group (Pr)",
                "Butyl group (Bu)",
                "Pentyl group",
                "Hexyl group",
                "Heptyl group",
                "Octyl group",
                "Nonyl group",
                "Decyl group",
                "Phenyl group (Ph)",
                "Benzyl group (Bn)",
                "Hydroxyl group (OH)",
                "Carboxyl group (COOH)",
                "Amino group (NH2)",
                "Cyano group (CN)",
                "Nitro group (NO2)",
                "Sulfhydryl group (SH)",
                "Phosphate group (PO4)",
                "Acetyl group (Ac)",
                "Formyl group (CHO)",
                "Amido group (CONH2)",
                "Ester group (COOR)",
                "Ether group (OR)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (Ac)",
                "Amido group (CONH2)",
                "Amino group (NH2)",
                "Benzyl group (Bn)",
                "Butyl group (Bu)",
                "Carboxyl group (COOH)",
                "Cyano group (CN)",
                "Decyl group",
                "Ester group (COOR)",
                "Ether group (OR)",
                "Ethyl group (Et)",
                "Formyl group (CHO)",
                "Heptyl group",
                "Hexyl group",
                "Hydroxyl group (OH)",
                "Methyl group (Me)",
                "Nitro group (NO2)",
                "Nonyl group",
                "Octyl group",
                "Pentyl group",
                "Phenyl group (Ph)",
                "Phosphate group (PO4)",
                "Propyl group (Pr)",
                "Sulfhydryl group (SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (CH3)",
            "Ethyl group (C2H5)",
            "Propyl group (C3H7)",
            "Butyl group (C4H9)",
            "Isopropyl group ((CH3)2CH)",
            "Tert-butyl group ((CH3)3C)",
            "Phenyl group (C6H5)",
            "Benzyl group (C6H5CH2)",
            "Vinyl group (CH2=CH)",
            "Allyl group (CH2=CHCH2)",
            "Hydroxyl group (OH)",
            "Amino group (NH2)",
            "Nitro group (NO2)",
            "Carboxyl group (COOH)",
            "Carbonyl group (C=O)",
            "Sulfhydryl group (SH)",
            "Phosphate group (PO4)",
            "Halogen (F, Cl, Br, I)",
            "Alkoxy group (OR)",
            "Ester group (COOR)",
            "Amide group (CONH2)",
            "Nitrile group (CN)",
            "Isocyanate group (NCO)",
            "Isothiocyanate group (NCS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (CH3)",
                "Ethyl group (C2H5)",
                "Propyl group (C3H7)",
                "Butyl group (C4H9)",
                "Isopropyl group ((CH3)2CH)",
                "Tert-butyl group ((CH3)3C)",
                "Phenyl group (C6H5)",
                "Benzyl group (C6H5CH2)",
                "Vinyl group (CH2=CH)",
                "Allyl group (CH2=CHCH2)",
                "Hydroxyl group (OH)",
                "Amino group (NH2)",
                "Nitro group (NO2)",
                "Carboxyl group (COOH)",
                "Carbonyl group (C=O)",
                "Sulfhydryl group (SH)",
                "Phosphate group (PO4)",
                "Halogen (F, Cl, Br, I)",
                "Alkoxy group (OR)",
                "Ester group (COOR)",
                "Amide group (CONH2)",
                "Nitrile group (CN)",
                "Isocyanate group (NCO)",
                "Isothiocyanate group (NCS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkoxy group (OR)",
                "Allyl group (CH2=CHCH2)",
                "Amide group (CONH2)",
                "Amino group (NH2)",
                "Benzyl group (C6H5CH2)",
                "Butyl group (C4H9)",
                "Carbonyl group (C=O)",
                "Carboxyl group (COOH)",
                "Ester group (COOR)",
                "Ethyl group (C2H5)",
                "Halogen (F, Cl, Br, I)",
                "Hydroxyl group (OH)",
                "Isocyanate group (NCO)",
                "Isopropyl group ((CH3)2CH)",
                "Isothiocyanate group (NCS)",
                "Methyl group (CH3)",
                "Nitrile group (CN)",
                "Nitro group (NO2)",
                "Phenyl group (C6H5)",
                "Phosphate group (PO4)",
                "Propyl group (C3H7)",
                "Sulfhydryl group (SH)",
                "Tert-butyl group ((CH3)3C)",
                "Vinyl group (CH2=CH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl (CH3)",
            "Ethyl (C2H5)",
            "Propyl (C3H7)",
            "Butyl (C4H9)",
            "Pentyl (C5H11)",
            "Hexyl (C6H13)",
            "Heptyl (C7H15)",
            "Octyl (C8H17)",
            "Nonyl (C9H19)",
            "Decyl (C10H21)",
            "Hydroxyl (OH)",
            "Amino (NH2)",
            "Carboxyl (COOH)",
            "Nitro (NO2)",
            "Sulfhydryl (SH)",
            "Cyano (CN)",
            "Halogen (F, Cl, Br, I)",
            "Alkoxy (OR)",
            "Acyl (COR)",
            "Phosphoryl (PO4)",
            "Sulfonyl (SO3H)",
            "Silyl (SiR3)",
            "Boronyl (BR2)",
            "Stannyl (SnR3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl (CH3)",
                "Ethyl (C2H5)",
                "Propyl (C3H7)",
                "Butyl (C4H9)",
                "Pentyl (C5H11)",
                "Hexyl (C6H13)",
                "Heptyl (C7H15)",
                "Octyl (C8H17)",
                "Nonyl (C9H19)",
                "Decyl (C10H21)",
                "Hydroxyl (OH)",
                "Amino (NH2)",
                "Carboxyl (COOH)",
                "Nitro (NO2)",
                "Sulfhydryl (SH)",
                "Cyano (CN)",
                "Halogen (F, Cl, Br, I)",
                "Alkoxy (OR)",
                "Acyl (COR)",
                "Phosphoryl (PO4)",
                "Sulfonyl (SO3H)",
                "Silyl (SiR3)",
                "Boronyl (BR2)",
                "Stannyl (SnR3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl (COR)",
                "Alkoxy (OR)",
                "Amino (NH2)",
                "Boronyl (BR2)",
                "Butyl (C4H9)",
                "Carboxyl (COOH)",
                "Cyano (CN)",
                "Decyl (C10H21)",
                "Ethyl (C2H5)",
                "Halogen (F, Cl, Br, I)",
                "Heptyl (C7H15)",
                "Hexyl (C6H13)",
                "Hydroxyl (OH)",
                "Methyl (CH3)",
                "Nitro (NO2)",
                "Nonyl (C9H19)",
                "Octyl (C8H17)",
                "Pentyl (C5H11)",
                "Phosphoryl (PO4)",
                "Propyl (C3H7)",
                "Silyl (SiR3)",
                "Stannyl (SnR3)",
                "Sulfhydryl (SH)",
                "Sulfonyl (SO3H)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Functional group (FG)",
            "Alkyl group (R)",
            "Alkenyl group (R)",
            "Alkynyl group (R)",
            "Hydroxyl group (OH)",
            "Methoxy group (OMe)",
            "Ethoxy group (OEt)",
            "Acetyl group (Ac)",
            "Carboxyl group (COOH)",
            "Amide group (CONH2)",
            "Phenyl group (Ph)",
            "Thiophenyl group (SPh)",
            "Thioalkyl group (SR)",
            "Aldehyde group (CHO)",
            "Ketone group (COR)",
            "Carbonyl group (CO)",
            "Hydroperoxy group (OOH)",
            "Epoxide group (O)",
            "Thiol group (SH)",
            "Amine group (RNH2)",
            "Quaternary ammonium group (R3N+)",
            "Phosphoryl group (PO3)",
            "Sulfonamide group (SO2NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Functional group (FG)",
                "Alkyl group (R)",
                "Alkenyl group (R)",
                "Alkynyl group (R)",
                "Hydroxyl group (OH)",
                "Methoxy group (OMe)",
                "Ethoxy group (OEt)",
                "Acetyl group (Ac)",
                "Carboxyl group (COOH)",
                "Amide group (CONH2)",
                "Phenyl group (Ph)",
                "Thiophenyl group (SPh)",
                "Thioalkyl group (SR)",
                "Aldehyde group (CHO)",
                "Ketone group (COR)",
                "Carbonyl group (CO)",
                "Hydroperoxy group (OOH)",
                "Epoxide group (O)",
                "Thiol group (SH)",
                "Amine group (RNH2)",
                "Quaternary ammonium group (R3N+)",
                "Phosphoryl group (PO3)",
                "Sulfonamide group (SO2NH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (Ac)",
                "Aldehyde group (CHO)",
                "Alkenyl group (R)",
                "Alkyl group (R)",
                "Alkynyl group (R)",
                "Amide group (CONH2)",
                "Amine group (RNH2)",
                "Carbonyl group (CO)",
                "Carboxyl group (COOH)",
                "Epoxide group (O)",
                "Ethoxy group (OEt)",
                "Functional group (FG)",
                "Hydroperoxy group (OOH)",
                "Hydroxyl group (OH)",
                "Ketone group (COR)",
                "Methoxy group (OMe)",
                "Phenyl group (Ph)",
                "Phosphoryl group (PO3)",
                "Quaternary ammonium group (R3N+)",
                "Sulfonamide group (SO2NH2)",
                "Thioalkyl group (SR)",
                "Thiol group (SH)",
                "Thiophenyl group (SPh)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Methyl group (CH3)",
            "Ethyl group (C2H5)",
            "Phenyl group (C6H5)",
            "Methoxy group (OCH3)",
            "Hydroxyl group (OH)",
            "Amino group (NH2)",
            "Carboxyl group (COOH)",
            "Cyano group (CN)",
            "Nitro group (NO2)",
            "Sulfo group (SO3H)",
            "Aldehyde group (CHO)",
            "Keto group (COR)",
            "Ester group (COOR)",
            "Amido group (CONH)",
            "Fluoro group (F)",
            "Chloro group (Cl)",
            "Bromo group (Br)",
            "Iodo group (I)",
            "Trifluoromethyl group (CF3)",
            "Triphenylmethyl group (C19H15)",
            "Tert-butyl group (C4H9)",
            "Cyclohexyl group (C6H11)",
            "Benzyl group (C7H7)",
            " Allyl group (C3H5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl group (CH3)",
                "Ethyl group (C2H5)",
                "Phenyl group (C6H5)",
                "Methoxy group (OCH3)",
                "Hydroxyl group (OH)",
                "Amino group (NH2)",
                "Carboxyl group (COOH)",
                "Cyano group (CN)",
                "Nitro group (NO2)",
                "Sulfo group (SO3H)",
                "Aldehyde group (CHO)",
                "Keto group (COR)",
                "Ester group (COOR)",
                "Amido group (CONH)",
                "Fluoro group (F)",
                "Chloro group (Cl)",
                "Bromo group (Br)",
                "Iodo group (I)",
                "Trifluoromethyl group (CF3)",
                "Triphenylmethyl group (C19H15)",
                "Tert-butyl group (C4H9)",
                "Cyclohexyl group (C6H11)",
                "Benzyl group (C7H7)",
                " Allyl group (C3H5)"
            ],
            "mismatches": [],
            "true_referents": [
                " Allyl group (C3H5)",
                "Aldehyde group (CHO)",
                "Amido group (CONH)",
                "Amino group (NH2)",
                "Benzyl group (C7H7)",
                "Bromo group (Br)",
                "Carboxyl group (COOH)",
                "Chloro group (Cl)",
                "Cyano group (CN)",
                "Cyclohexyl group (C6H11)",
                "Ester group (COOR)",
                "Ethyl group (C2H5)",
                "Fluoro group (F)",
                "Hydroxyl group (OH)",
                "Iodo group (I)",
                "Keto group (COR)",
                "Methoxy group (OCH3)",
                "Methyl group (CH3)",
                "Nitro group (NO2)",
                "Phenyl group (C6H5)",
                "Sulfo group (SO3H)",
                "Tert-butyl group (C4H9)",
                "Trifluoromethyl group (CF3)",
                "Triphenylmethyl group (C19H15)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Carbon",
                "Canonical Name": "Carbon",
                "Definition": [
                    "it is an atom or group of atoms",
                    "it acts as a unit",
                    "it has replaced a hydrogen atom in a hydrocarbon molecule",
                    "its presence imparts characteristic properties to the molecule"
                ]
            },
            {
                "Referent": "Oxygen",
                "Canonical Name": "Oxygen",
                "Definition": [
                    "it is an atom or group of atoms",
                    "it acts as a unit",
                    "it has replaced a hydrogen atom in a hydrocarbon molecule",
                    "its presence imparts characteristic properties to the molecule"
                ]
            },
            {
                "Referent": "Nitrogen",
                "Canonical Name": "Nitrogen",
                "Definition": [
                    "it is an atom or group of atoms",
                    "it acts as a unit",
                    "it has replaced a hydrogen atom in a hydrocarbon molecule",
                    "its presence imparts characteristic properties to the molecule"
                ]
            },
            {
                "Referent": "Phosphorus",
                "Canonical Name": "Phosphorus",
                "Definition": [
                    "it is an atom or group of atoms",
                    "it acts as a unit",
                    "it has replaced a hydrogen atom in a hydrocarbon molecule",
                    "its presence imparts characteristic properties to the molecule"
                ]
            },
            {
                "Referent": "Sulfur",
                "Canonical Name": "Sulfur",
                "Definition": [
                    "it is an atom or group of atoms",
                    "it acts as a unit",
                    "it has replaced a hydrogen atom in a hydrocarbon molecule",
                    "its presence imparts characteristic properties to the molecule"
                ]
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Carbon",
                "Oxygen",
                "Nitrogen",
                "Phosphorus",
                "Sulfur"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Carbon\", \"Canonical Name\": \"Carbon\", \"Definition\": [\"it is an atom or group of atoms\", \"it acts as a unit\", \"it has replaced a hydrogen atom in a hydrocarbon molecule\", \"its presence imparts characteristic properties to the molecule\"]}",
                "{\"Referent\": \"Nitrogen\", \"Canonical Name\": \"Nitrogen\", \"Definition\": [\"it is an atom or group of atoms\", \"it acts as a unit\", \"it has replaced a hydrogen atom in a hydrocarbon molecule\", \"its presence imparts characteristic properties to the molecule\"]}",
                "{\"Referent\": \"Oxygen\", \"Canonical Name\": \"Oxygen\", \"Definition\": [\"it is an atom or group of atoms\", \"it acts as a unit\", \"it has replaced a hydrogen atom in a hydrocarbon molecule\", \"its presence imparts characteristic properties to the molecule\"]}",
                "{\"Referent\": \"Phosphorus\", \"Canonical Name\": \"Phosphorus\", \"Definition\": [\"it is an atom or group of atoms\", \"it acts as a unit\", \"it has replaced a hydrogen atom in a hydrocarbon molecule\", \"its presence imparts characteristic properties to the molecule\"]}",
                "{\"Referent\": \"Sulfur\", \"Canonical Name\": \"Sulfur\", \"Definition\": [\"it is an atom or group of atoms\", \"it acts as a unit\", \"it has replaced a hydrogen atom in a hydrocarbon molecule\", \"its presence imparts characteristic properties to the molecule\"]}"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 0
        }
    }
]