[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Alcohol (\u2013OH)",
            "Amine (\u2013NH2)",
            "Carboxylic acid (\u2013COOH)",
            "Ester (\u2013COO\u2013)",
            "Ether (\u2013O\u2013)",
            "Aldehyde (\u2013CHO)",
            "Ketone (C=O)",
            "Amino acid (\u2013NH2 and \u2013COOH)",
            "Nitrile (\u2013CN)",
            "Phosphate (PO4^3-)",
            "Sulfate (SO4^2-)",
            "Thiol (\u2013SH)",
            "Amide (\u2013CONH2)",
            "Epoxy (\u2013O\u2013)",
            "Imine (C=NH)",
            "Hydroxyl (\u2013OH)",
            "Nitro (\u2013NO2)",
            "Phenol (\u2013OH attached to an aromatic ring)",
            "Sulfide (\u2013S\u2013)",
            "Sulfonic acid (\u2013SO3H)",
            "Thiocyanate (\u2013SCN)",
            "Alkene (C=C)",
            "Azide (\u2013N3)",
            "Isothiocyanate (\u2013N=C=S)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alcohol (\u2013OH)",
                "Amine (\u2013NH2)",
                "Carboxylic acid (\u2013COOH)",
                "Ester (\u2013COO\u2013)",
                "Ether (\u2013O\u2013)",
                "Aldehyde (\u2013CHO)",
                "Ketone (C=O)",
                "Amino acid (\u2013NH2 and \u2013COOH)",
                "Nitrile (\u2013CN)",
                "Phosphate (PO4^3-)",
                "Sulfate (SO4^2-)",
                "Thiol (\u2013SH)",
                "Amide (\u2013CONH2)",
                "Epoxy (\u2013O\u2013)",
                "Imine (C=NH)",
                "Hydroxyl (\u2013OH)",
                "Nitro (\u2013NO2)",
                "Phenol (\u2013OH attached to an aromatic ring)",
                "Sulfide (\u2013S\u2013)",
                "Sulfonic acid (\u2013SO3H)",
                "Thiocyanate (\u2013SCN)",
                "Alkene (C=C)",
                "Azide (\u2013N3)",
                "Isothiocyanate (\u2013N=C=S)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alcohol (\u2013OH)",
                "Aldehyde (\u2013CHO)",
                "Alkene (C=C)",
                "Amide (\u2013CONH2)",
                "Amine (\u2013NH2)",
                "Amino acid (\u2013NH2 and \u2013COOH)",
                "Azide (\u2013N3)",
                "Carboxylic acid (\u2013COOH)",
                "Epoxy (\u2013O\u2013)",
                "Ester (\u2013COO\u2013)",
                "Ether (\u2013O\u2013)",
                "Hydroxyl (\u2013OH)",
                "Imine (C=NH)",
                "Isothiocyanate (\u2013N=C=S)",
                "Ketone (C=O)",
                "Nitrile (\u2013CN)",
                "Nitro (\u2013NO2)",
                "Phenol (\u2013OH attached to an aromatic ring)",
                "Phosphate (PO4^3-)",
                "Sulfate (SO4^2-)",
                "Sulfide (\u2013S\u2013)",
                "Sulfonic acid (\u2013SO3H)",
                "Thiocyanate (\u2013SCN)",
                "Thiol (\u2013SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (-OH)",
            "Carbonyl group (>C=O)",
            "Carboxyl group (-COOH)",
            "Amino group (-NH2)",
            "Sulfhydryl group (-SH)",
            "Phosphate group (-PO4)",
            "Methyl group (-CH3)",
            "Ethyl group (-C2H5)",
            "Alkene group (C=C)",
            "Alkyne group (C\u2261C)",
            "Ester group (-COO-)",
            "Amide group (-CONH2)",
            "Ether group (R-O-R')",
            "Nitrile group (-C\u2261N)",
            "Aldehyde group (-CHO)",
            "Ketone group (RC(=O)R')",
            "Halide group (R-X, where X = F, Cl, Br, I)",
            "Nitro group (-NO2)",
            "Hydrazine group (-NH-NH2)",
            "Imine group (R1R2C=NR3)",
            "Thiol group (-SH)",
            "Phenyl group (C6H5-)",
            "Acetyl group (-COCH3)",
            "Guanidino group (-C(=NH2)2NH-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (-OH)",
                "Carbonyl group (>C=O)",
                "Carboxyl group (-COOH)",
                "Amino group (-NH2)",
                "Sulfhydryl group (-SH)",
                "Phosphate group (-PO4)",
                "Methyl group (-CH3)",
                "Ethyl group (-C2H5)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Ester group (-COO-)",
                "Amide group (-CONH2)",
                "Ether group (R-O-R')",
                "Nitrile group (-C\u2261N)",
                "Aldehyde group (-CHO)",
                "Ketone group (RC(=O)R')",
                "Halide group (R-X, where X = F, Cl, Br, I)",
                "Nitro group (-NO2)",
                "Hydrazine group (-NH-NH2)",
                "Imine group (R1R2C=NR3)",
                "Thiol group (-SH)",
                "Phenyl group (C6H5-)",
                "Acetyl group (-COCH3)",
                "Guanidino group (-C(=NH2)2NH-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl group (-COCH3)",
                "Aldehyde group (-CHO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Amide group (-CONH2)",
                "Amino group (-NH2)",
                "Carbonyl group (>C=O)",
                "Carboxyl group (-COOH)",
                "Ester group (-COO-)",
                "Ether group (R-O-R')",
                "Ethyl group (-C2H5)",
                "Guanidino group (-C(=NH2)2NH-)",
                "Halide group (R-X, where X = F, Cl, Br, I)",
                "Hydrazine group (-NH-NH2)",
                "Hydroxyl group (-OH)",
                "Imine group (R1R2C=NR3)",
                "Ketone group (RC(=O)R')",
                "Methyl group (-CH3)",
                "Nitrile group (-C\u2261N)",
                "Nitro group (-NO2)",
                "Phenyl group (C6H5-)",
                "Phosphate group (-PO4)",
                "Sulfhydryl group (-SH)",
                "Thiol group (-SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (\u2013OH)",
            "Carboxyl group (\u2013COOH)",
            "Amino group (\u2013NH2)",
            "Methyl group (\u2013CH3)",
            "Ethyl group (\u2013C2H5)",
            "Hydroperoxy group (\u2013OOH)",
            "Aldehyde group (\u2013CHO)",
            "Ketone group (\u2013C(=O)R)",
            "Ester group (\u2013COOR)",
            "Ether group (\u2013O\u2013R)",
            "Thiol group (\u2013SH)",
            "Sulfide group (\u2013S\u2013R)",
            "Sulfonyl group (\u2013SO2R)",
            "Nitro group (\u2013NO2)",
            "Cyano group (\u2013CN)",
            "Isocyano group (\u2013NC)",
            "Isothiocyano group (\u2013NCS)",
            "Azo group (\u2013N=N\u2013)",
            "Hydrazino group (\u2013NHNH2)",
            "Acyl group (\u2013C(=O)R)",
            "Amide group (\u2013CONH2)",
            "Imine group (\u2013C(=NH)R)",
            "Enamine group (\u2013C(=NR)R')",
            "Alkene group (\u2013C=C\u2013)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (\u2013OH)",
                "Carboxyl group (\u2013COOH)",
                "Amino group (\u2013NH2)",
                "Methyl group (\u2013CH3)",
                "Ethyl group (\u2013C2H5)",
                "Hydroperoxy group (\u2013OOH)",
                "Aldehyde group (\u2013CHO)",
                "Ketone group (\u2013C(=O)R)",
                "Ester group (\u2013COOR)",
                "Ether group (\u2013O\u2013R)",
                "Thiol group (\u2013SH)",
                "Sulfide group (\u2013S\u2013R)",
                "Sulfonyl group (\u2013SO2R)",
                "Nitro group (\u2013NO2)",
                "Cyano group (\u2013CN)",
                "Isocyano group (\u2013NC)",
                "Isothiocyano group (\u2013NCS)",
                "Azo group (\u2013N=N\u2013)",
                "Hydrazino group (\u2013NHNH2)",
                "Acyl group (\u2013C(=O)R)",
                "Amide group (\u2013CONH2)",
                "Imine group (\u2013C(=NH)R)",
                "Enamine group (\u2013C(=NR)R')",
                "Alkene group (\u2013C=C\u2013)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl group (\u2013C(=O)R)",
                "Aldehyde group (\u2013CHO)",
                "Alkene group (\u2013C=C\u2013)",
                "Amide group (\u2013CONH2)",
                "Amino group (\u2013NH2)",
                "Azo group (\u2013N=N\u2013)",
                "Carboxyl group (\u2013COOH)",
                "Cyano group (\u2013CN)",
                "Enamine group (\u2013C(=NR)R')",
                "Ester group (\u2013COOR)",
                "Ether group (\u2013O\u2013R)",
                "Ethyl group (\u2013C2H5)",
                "Hydrazino group (\u2013NHNH2)",
                "Hydroperoxy group (\u2013OOH)",
                "Hydroxyl group (\u2013OH)",
                "Imine group (\u2013C(=NH)R)",
                "Isocyano group (\u2013NC)",
                "Isothiocyano group (\u2013NCS)",
                "Ketone group (\u2013C(=O)R)",
                "Methyl group (\u2013CH3)",
                "Nitro group (\u2013NO2)",
                "Sulfide group (\u2013S\u2013R)",
                "Sulfonyl group (\u2013SO2R)",
                "Thiol group (\u2013SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl Group (OH)",
            "Methyl Group (CH3)",
            "Methylene Group (CH2)",
            "Carboxyl Group (COOH)",
            "Carbonyl Group (C=O)",
            "Aldehyde Group (R-CHO)",
            "Ketone Group (R-CO-R')",
            "Amino Group (NH2)",
            "Nitro Group (NO2)",
            "Halogen Group (X)",
            "Ether Group (R-O-R')",
            "Ester Group (R-COO-R')",
            "Amide Group (R-CO-NH2)",
            "Thiol Group (SH)",
            "Sulfhydryl Group (SH)",
            "Phosphoryl Group (PO4H2)",
            "Phosphate Group (PO4^3-)",
            "Cyano Group (CN)",
            "Isocyanato Group (NCO)",
            "Epoxide Group (C2H4O)",
            "Acyl Halide (R-COX)",
            "Alkynyl Group (C\u2261CH)",
            "Aryl Group (Ar)",
            "Alkyl Group (R)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl Group (OH)",
                "Methyl Group (CH3)",
                "Methylene Group (CH2)",
                "Carboxyl Group (COOH)",
                "Carbonyl Group (C=O)",
                "Aldehyde Group (R-CHO)",
                "Ketone Group (R-CO-R')",
                "Amino Group (NH2)",
                "Nitro Group (NO2)",
                "Halogen Group (X)",
                "Ether Group (R-O-R')",
                "Ester Group (R-COO-R')",
                "Amide Group (R-CO-NH2)",
                "Thiol Group (SH)",
                "Sulfhydryl Group (SH)",
                "Phosphoryl Group (PO4H2)",
                "Phosphate Group (PO4^3-)",
                "Cyano Group (CN)",
                "Isocyanato Group (NCO)",
                "Epoxide Group (C2H4O)",
                "Acyl Halide (R-COX)",
                "Alkynyl Group (C\u2261CH)",
                "Aryl Group (Ar)",
                "Alkyl Group (R)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl Halide (R-COX)",
                "Aldehyde Group (R-CHO)",
                "Alkyl Group (R)",
                "Alkynyl Group (C\u2261CH)",
                "Amide Group (R-CO-NH2)",
                "Amino Group (NH2)",
                "Aryl Group (Ar)",
                "Carbonyl Group (C=O)",
                "Carboxyl Group (COOH)",
                "Cyano Group (CN)",
                "Epoxide Group (C2H4O)",
                "Ester Group (R-COO-R')",
                "Ether Group (R-O-R')",
                "Halogen Group (X)",
                "Hydroxyl Group (OH)",
                "Isocyanato Group (NCO)",
                "Ketone Group (R-CO-R')",
                "Methyl Group (CH3)",
                "Methylene Group (CH2)",
                "Nitro Group (NO2)",
                "Phosphate Group (PO4^3-)",
                "Phosphoryl Group (PO4H2)",
                "Sulfhydryl Group (SH)",
                "Thiol Group (SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl (OH)",
            "Carbonyl (C=O)",
            "Carboxyl (COOH)",
            "Amino (NH2)",
            "Sulfhydryl (SH)",
            "Phosphate (PO4)",
            "Methyl (CH3)",
            "Ethyl (C2H5)",
            "Phenyl (C6H5)",
            "Aldehyde (CHO)",
            "Ketone (RCOR')",
            "Ester (COOR')",
            "Ether (ROR')",
            "Amide (CONH2)",
            "Nitrile (CN)",
            "Thiol (RSH)",
            "Imine (C=NH)",
            "Azide (N3)",
            "Acyl chloride (COCl)",
            "Anhydride (RCOOCOR')",
            "Isocyanate (NCO)",
            "Isothiocyanate (NCS)",
            "Nitro (NO2)",
            "Sulfonic acid (SO3H)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl (OH)",
                "Carbonyl (C=O)",
                "Carboxyl (COOH)",
                "Amino (NH2)",
                "Sulfhydryl (SH)",
                "Phosphate (PO4)",
                "Methyl (CH3)",
                "Ethyl (C2H5)",
                "Phenyl (C6H5)",
                "Aldehyde (CHO)",
                "Ketone (RCOR')",
                "Ester (COOR')",
                "Ether (ROR')",
                "Amide (CONH2)",
                "Nitrile (CN)",
                "Thiol (RSH)",
                "Imine (C=NH)",
                "Azide (N3)",
                "Acyl chloride (COCl)",
                "Anhydride (RCOOCOR')",
                "Isocyanate (NCO)",
                "Isothiocyanate (NCS)",
                "Nitro (NO2)",
                "Sulfonic acid (SO3H)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl chloride (COCl)",
                "Aldehyde (CHO)",
                "Amide (CONH2)",
                "Amino (NH2)",
                "Anhydride (RCOOCOR')",
                "Azide (N3)",
                "Carbonyl (C=O)",
                "Carboxyl (COOH)",
                "Ester (COOR')",
                "Ether (ROR')",
                "Ethyl (C2H5)",
                "Hydroxyl (OH)",
                "Imine (C=NH)",
                "Isocyanate (NCO)",
                "Isothiocyanate (NCS)",
                "Ketone (RCOR')",
                "Methyl (CH3)",
                "Nitrile (CN)",
                "Nitro (NO2)",
                "Phenyl (C6H5)",
                "Phosphate (PO4)",
                "Sulfhydryl (SH)",
                "Sulfonic acid (SO3H)",
                "Thiol (RSH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (\u2013OH)",
            "Carbonyl group (C=O)",
            "Carboxyl group (\u2013COOH)",
            "Amino group (\u2013NH2)",
            "Sulfhydryl group (\u2013SH)",
            "Phosphate group (\u2013PO4^2\u2212)",
            "Methyl group (\u2013CH3)",
            "Ethyl group (\u2013C2H5)",
            "Phenyl group (\u2013C6H5)",
            "Alkyl group (\u2013R)",
            "Alkenyl group (\u2013C=C\u2013)",
            "Alkynyl group (\u2013C\u2261C\u2013)",
            "Nitrile group (\u2013C\u2261N)",
            "Isocyanate group (\u2013N=C=O)",
            "Acyl group (\u2013C(=O)\u2013R)",
            "Ester group (\u2013COOR)",
            "Amide group (\u2013C(=O)NR2)",
            "Thioether group (\u2013S\u2013)",
            "Nitro group (\u2013NO2)",
            "Haloalkane group (\u2013X)",
            "Imines group (\u2013C=NR)",
            "Oxime group (\u2013C=N\u2013OH)",
            "Hydrazone group (\u2013C=N\u2013NH2)",
            "Sulfone group (\u2013SO2\u2013)",
            "Quaternary ammonium group (NR4+)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (\u2013OH)",
                "Carbonyl group (C=O)",
                "Carboxyl group (\u2013COOH)",
                "Amino group (\u2013NH2)",
                "Sulfhydryl group (\u2013SH)",
                "Phosphate group (\u2013PO4^2\u2212)",
                "Methyl group (\u2013CH3)",
                "Ethyl group (\u2013C2H5)",
                "Phenyl group (\u2013C6H5)",
                "Alkyl group (\u2013R)",
                "Alkenyl group (\u2013C=C\u2013)",
                "Alkynyl group (\u2013C\u2261C\u2013)",
                "Nitrile group (\u2013C\u2261N)",
                "Isocyanate group (\u2013N=C=O)",
                "Acyl group (\u2013C(=O)\u2013R)",
                "Ester group (\u2013COOR)",
                "Amide group (\u2013C(=O)NR2)",
                "Thioether group (\u2013S\u2013)",
                "Nitro group (\u2013NO2)",
                "Haloalkane group (\u2013X)",
                "Imines group (\u2013C=NR)",
                "Oxime group (\u2013C=N\u2013OH)",
                "Hydrazone group (\u2013C=N\u2013NH2)",
                "Sulfone group (\u2013SO2\u2013)"
            ],
            "mismatches": [
                "Quaternary ammonium group (NR4+)"
            ],
            "true_referents": [
                "Acyl group (\u2013C(=O)\u2013R)",
                "Alkenyl group (\u2013C=C\u2013)",
                "Alkyl group (\u2013R)",
                "Alkynyl group (\u2013C\u2261C\u2013)",
                "Amide group (\u2013C(=O)NR2)",
                "Amino group (\u2013NH2)",
                "Carbonyl group (C=O)",
                "Carboxyl group (\u2013COOH)",
                "Ester group (\u2013COOR)",
                "Ethyl group (\u2013C2H5)",
                "Haloalkane group (\u2013X)",
                "Hydrazone group (\u2013C=N\u2013NH2)",
                "Hydroxyl group (\u2013OH)",
                "Imines group (\u2013C=NR)",
                "Isocyanate group (\u2013N=C=O)",
                "Methyl group (\u2013CH3)",
                "Nitrile group (\u2013C\u2261N)",
                "Nitro group (\u2013NO2)",
                "Oxime group (\u2013C=N\u2013OH)",
                "Phenyl group (\u2013C6H5)",
                "Phosphate group (\u2013PO4^2\u2212)",
                "Sulfhydryl group (\u2013SH)",
                "Sulfone group (\u2013SO2\u2013)",
                "Thioether group (\u2013S\u2013)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (OH)",
            "Methyl group (CH3)",
            "Carboxyl group (COOH)",
            "Amino group (NH2)",
            "Phosphate group (PO4)",
            "Sulhydryl group (SH)",
            "Aldehyde group (CHO)",
            "Ketone group (RCOR')",
            "Ester group (RCOOR')",
            "Ether group (ROR')",
            "Amide group (RCONR2)",
            "Phenyl group (C6H5)",
            "Acyl group (RCO)",
            "Alkene group (C=C)",
            "Alkyne group (C\u2261C)",
            "Aryl group (Ar)",
            "Azide group (N3)",
            "Isocyanate group (NCO)",
            "Nitro group (NO2)",
            "Sulfate group (SO4)",
            "Thiol group (RSH)",
            "Benzyl group (C6H5CH2)",
            "Vinyl group (CH=CH2)",
            "Cyano group (CN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (OH)",
                "Methyl group (CH3)",
                "Carboxyl group (COOH)",
                "Amino group (NH2)",
                "Phosphate group (PO4)",
                "Sulhydryl group (SH)",
                "Aldehyde group (CHO)",
                "Ketone group (RCOR')",
                "Ester group (RCOOR')",
                "Ether group (ROR')",
                "Amide group (RCONR2)",
                "Phenyl group (C6H5)",
                "Acyl group (RCO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Aryl group (Ar)",
                "Azide group (N3)",
                "Isocyanate group (NCO)",
                "Nitro group (NO2)",
                "Sulfate group (SO4)",
                "Thiol group (RSH)",
                "Benzyl group (C6H5CH2)",
                "Vinyl group (CH=CH2)",
                "Cyano group (CN)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl group (RCO)",
                "Aldehyde group (CHO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Amide group (RCONR2)",
                "Amino group (NH2)",
                "Aryl group (Ar)",
                "Azide group (N3)",
                "Benzyl group (C6H5CH2)",
                "Carboxyl group (COOH)",
                "Cyano group (CN)",
                "Ester group (RCOOR')",
                "Ether group (ROR')",
                "Hydroxyl group (OH)",
                "Isocyanate group (NCO)",
                "Ketone group (RCOR')",
                "Methyl group (CH3)",
                "Nitro group (NO2)",
                "Phenyl group (C6H5)",
                "Phosphate group (PO4)",
                "Sulfate group (SO4)",
                "Sulhydryl group (SH)",
                "Thiol group (RSH)",
                "Vinyl group (CH=CH2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (OH)",
            "Carbonyl group (C=O)",
            "Amino group (NH2)",
            "Carboxyl group (COOH)",
            "Sulfhydryl group (SH)",
            "Phosphate group (PO4)",
            "Methyl group (CH3)",
            "Aldehyde group (CHO)",
            "Ester group (COOC)",
            "Ether group (C-O-C)",
            "Amide group (CONH2)",
            "Ketone group (RCOR')",
            "Sulfate group (SO4)",
            "Nitrile group (CN)",
            "Halogen group (F, Cl, Br, I)",
            "Alcohol group (R-OH)",
            "Thiol group (R-SH)",
            "Alkene group (C=C)",
            "Alkyne group (C\u2261C)",
            "Aryl group (C6H5-)",
            "Phenol group (C6H5OH)",
            "Epoxy group (C-O-C)",
            "Imine group (C=N)",
            "Thioether group (C-S-C)",
            "Acetyl group (COCH3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (OH)",
                "Carbonyl group (C=O)",
                "Amino group (NH2)",
                "Carboxyl group (COOH)",
                "Sulfhydryl group (SH)",
                "Phosphate group (PO4)",
                "Methyl group (CH3)",
                "Aldehyde group (CHO)",
                "Ester group (COOC)",
                "Ether group (C-O-C)",
                "Amide group (CONH2)",
                "Ketone group (RCOR')",
                "Sulfate group (SO4)",
                "Nitrile group (CN)",
                "Halogen group (F, Cl, Br, I)",
                "Alcohol group (R-OH)",
                "Thiol group (R-SH)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Aryl group (C6H5-)",
                "Phenol group (C6H5OH)",
                "Epoxy group (C-O-C)",
                "Imine group (C=N)",
                "Thioether group (C-S-C)"
            ],
            "mismatches": [
                "Acetyl group (COCH3)"
            ],
            "true_referents": [
                "Alcohol group (R-OH)",
                "Aldehyde group (CHO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Amide group (CONH2)",
                "Amino group (NH2)",
                "Aryl group (C6H5-)",
                "Carbonyl group (C=O)",
                "Carboxyl group (COOH)",
                "Epoxy group (C-O-C)",
                "Ester group (COOC)",
                "Ether group (C-O-C)",
                "Halogen group (F, Cl, Br, I)",
                "Hydroxyl group (OH)",
                "Imine group (C=N)",
                "Ketone group (RCOR')",
                "Methyl group (CH3)",
                "Nitrile group (CN)",
                "Phenol group (C6H5OH)",
                "Phosphate group (PO4)",
                "Sulfate group (SO4)",
                "Sulfhydryl group (SH)",
                "Thioether group (C-S-C)",
                "Thiol group (R-SH)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (\u2013OH)",
            "Carbonyl group (C=O)",
            "Carboxyl group (\u2013COOH)",
            "Amino group (\u2013NH\u2082)",
            "Sulfhydryl group (\u2013SH)",
            "Phosphate group (\u2013PO\u2084\u00b3\u207b)",
            "Methyl group (\u2013CH\u2083)",
            "Ethyl group (\u2013C\u2082H\u2085)",
            "Aldehyde group (\u2013CHO)",
            "Ketone group (C=O in ketones)",
            "Ester group (\u2013COO\u2013)",
            "Ether group (R\u2013O\u2013R')",
            "Nitro group (\u2013NO\u2082)",
            "Halogen groups (\u2013F, \u2013Cl, \u2013Br, \u2013I)",
            "Imine group (C=N)",
            "Alkene group (C=C)",
            "Alkyne group (C\u2261C)",
            "Phenyl group (\u2013C\u2086H\u2085)",
            "Vinyl group (\u2013CH=CH\u2082)",
            "Benzyl group (\u2013CH\u2082\u2013C\u2086H\u2085)",
            "Nitrate group (\u2013ONO\u2082)",
            "Sulfonic acid group (\u2013SO\u2083H)",
            "Amide group (\u2013CONH\u2082)",
            "Hydrazine group (\u2013NH\u2013NH\u2082)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (\u2013OH)",
                "Carbonyl group (C=O)",
                "Carboxyl group (\u2013COOH)",
                "Amino group (\u2013NH\u2082)",
                "Sulfhydryl group (\u2013SH)",
                "Phosphate group (\u2013PO\u2084\u00b3\u207b)",
                "Methyl group (\u2013CH\u2083)",
                "Ethyl group (\u2013C\u2082H\u2085)",
                "Aldehyde group (\u2013CHO)",
                "Ketone group (C=O in ketones)",
                "Ester group (\u2013COO\u2013)",
                "Ether group (R\u2013O\u2013R')",
                "Nitro group (\u2013NO\u2082)",
                "Halogen groups (\u2013F, \u2013Cl, \u2013Br, \u2013I)",
                "Imine group (C=N)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Phenyl group (\u2013C\u2086H\u2085)",
                "Vinyl group (\u2013CH=CH\u2082)",
                "Benzyl group (\u2013CH\u2082\u2013C\u2086H\u2085)",
                "Nitrate group (\u2013ONO\u2082)",
                "Sulfonic acid group (\u2013SO\u2083H)",
                "Amide group (\u2013CONH\u2082)",
                "Hydrazine group (\u2013NH\u2013NH\u2082)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldehyde group (\u2013CHO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Amide group (\u2013CONH\u2082)",
                "Amino group (\u2013NH\u2082)",
                "Benzyl group (\u2013CH\u2082\u2013C\u2086H\u2085)",
                "Carbonyl group (C=O)",
                "Carboxyl group (\u2013COOH)",
                "Ester group (\u2013COO\u2013)",
                "Ether group (R\u2013O\u2013R')",
                "Ethyl group (\u2013C\u2082H\u2085)",
                "Halogen groups (\u2013F, \u2013Cl, \u2013Br, \u2013I)",
                "Hydrazine group (\u2013NH\u2013NH\u2082)",
                "Hydroxyl group (\u2013OH)",
                "Imine group (C=N)",
                "Ketone group (C=O in ketones)",
                "Methyl group (\u2013CH\u2083)",
                "Nitrate group (\u2013ONO\u2082)",
                "Nitro group (\u2013NO\u2082)",
                "Phenyl group (\u2013C\u2086H\u2085)",
                "Phosphate group (\u2013PO\u2084\u00b3\u207b)",
                "Sulfhydryl group (\u2013SH)",
                "Sulfonic acid group (\u2013SO\u2083H)",
                "Vinyl group (\u2013CH=CH\u2082)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (-OH)",
            "Carbonyl group (C=O)",
            "Carboxyl group (-COOH)",
            "Amino group (-NH2)",
            "Thiol group (-SH)",
            "Methyl group (-CH3)",
            "Aldehyde group (-CHO)",
            "Ketone group (-C(=O)-)",
            "Ether group (-O-)",
            "Ester group (-COO-)",
            "Amide group (-CONH2)",
            "Phosphate group (-PO4)",
            "Sulfate group (-SO4)",
            "Nitro group (-NO2)",
            "Alkene group (C=C)",
            "Alkyne group (C\u2261C)",
            "Halide group (-X, where X is F, Cl, Br, or I)",
            "Nitrile group (-C\u2261N)",
            "Isocyanate group (-N=C=O)",
            "Azide group (-N3)",
            "Sulfoxide group (S=O)",
            "Sulfonyl group (-SO2-)",
            "Phosphine group (-PH2)",
            "Imine group (C=N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (-OH)",
                "Carbonyl group (C=O)",
                "Carboxyl group (-COOH)",
                "Amino group (-NH2)",
                "Thiol group (-SH)",
                "Methyl group (-CH3)",
                "Aldehyde group (-CHO)",
                "Ketone group (-C(=O)-)",
                "Ether group (-O-)",
                "Ester group (-COO-)",
                "Amide group (-CONH2)",
                "Phosphate group (-PO4)",
                "Sulfate group (-SO4)",
                "Nitro group (-NO2)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Halide group (-X, where X is F, Cl, Br, or I)",
                "Nitrile group (-C\u2261N)",
                "Isocyanate group (-N=C=O)",
                "Azide group (-N3)",
                "Sulfoxide group (S=O)",
                "Sulfonyl group (-SO2-)",
                "Phosphine group (-PH2)",
                "Imine group (C=N)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldehyde group (-CHO)",
                "Alkene group (C=C)",
                "Alkyne group (C\u2261C)",
                "Amide group (-CONH2)",
                "Amino group (-NH2)",
                "Azide group (-N3)",
                "Carbonyl group (C=O)",
                "Carboxyl group (-COOH)",
                "Ester group (-COO-)",
                "Ether group (-O-)",
                "Halide group (-X, where X is F, Cl, Br, or I)",
                "Hydroxyl group (-OH)",
                "Imine group (C=N)",
                "Isocyanate group (-N=C=O)",
                "Ketone group (-C(=O)-)",
                "Methyl group (-CH3)",
                "Nitrile group (-C\u2261N)",
                "Nitro group (-NO2)",
                "Phosphate group (-PO4)",
                "Phosphine group (-PH2)",
                "Sulfate group (-SO4)",
                "Sulfonyl group (-SO2-)",
                "Sulfoxide group (S=O)",
                "Thiol group (-SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl (OH)",
            "Carboxyl (COOH)",
            "Carbonyl (C=O)",
            "Amino (NH2)",
            "Thiol (SH)",
            "Phosphate (PO4)",
            "Sulfhydryl (SH)",
            "Ester (COOR)",
            "Amide (CONH2)",
            "Ether (R-O-R)",
            "Nitrile (CN)",
            "Alkene (C=C)",
            "Alkyne (C\u2261C)",
            "Haloalkane (R-X)",
            "Sulfoxide (S=O)",
            "Sulfone (SO2)",
            "Azide (N3)",
            "Nitro (NO2)",
            "Isocyanate (NCO)",
            "Isothiocyanate (NCS)",
            "Epoxide (Oxirane)",
            "Azo (R-N=N-R)",
            "Peroxide (ROOR)",
            "Imine (C=N)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl (OH)",
                "Carboxyl (COOH)",
                "Carbonyl (C=O)",
                "Amino (NH2)",
                "Thiol (SH)",
                "Phosphate (PO4)",
                "Sulfhydryl (SH)",
                "Ester (COOR)",
                "Amide (CONH2)",
                "Ether (R-O-R)",
                "Nitrile (CN)",
                "Alkene (C=C)",
                "Alkyne (C\u2261C)",
                "Haloalkane (R-X)",
                "Sulfoxide (S=O)",
                "Sulfone (SO2)",
                "Azide (N3)",
                "Nitro (NO2)",
                "Isocyanate (NCO)",
                "Isothiocyanate (NCS)",
                "Epoxide (Oxirane)",
                "Azo (R-N=N-R)",
                "Peroxide (ROOR)",
                "Imine (C=N)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkene (C=C)",
                "Alkyne (C\u2261C)",
                "Amide (CONH2)",
                "Amino (NH2)",
                "Azide (N3)",
                "Azo (R-N=N-R)",
                "Carbonyl (C=O)",
                "Carboxyl (COOH)",
                "Epoxide (Oxirane)",
                "Ester (COOR)",
                "Ether (R-O-R)",
                "Haloalkane (R-X)",
                "Hydroxyl (OH)",
                "Imine (C=N)",
                "Isocyanate (NCO)",
                "Isothiocyanate (NCS)",
                "Nitrile (CN)",
                "Nitro (NO2)",
                "Peroxide (ROOR)",
                "Phosphate (PO4)",
                "Sulfhydryl (SH)",
                "Sulfone (SO2)",
                "Sulfoxide (S=O)",
                "Thiol (SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (\u2013OH)",
            "Carbonyl group (\u2013C=O)",
            "Carboxyl group (\u2013COOH)",
            "Amino group (\u2013NH2)",
            "Thiol group (\u2013SH)",
            "Ether group (\u2013O\u2013)",
            "Ester group (\u2013COO\u2013)",
            "Amide group (\u2013CONH\u2013)",
            "Phosphate group (\u2013OPO3H\u2013)",
            "Sulfonate group (\u2013SO3H)",
            "Nitro group (\u2013NO2)",
            "Nitrile group (\u2013C\u2261N)",
            "Alkene group (\u2013C=C\u2013)",
            "Alkyne group (\u2013C\u2261C\u2013)",
            "Aromatic ring",
            "Halide group (\u2013X, where X = F, Cl, Br, I)",
            "Aldehyde group (\u2013CHO)",
            "Ketone group (\u2013C(=O)\u2013)",
            "Amine group (\u2013NR2, where R = alkyl or aryl)",
            "Sulfide group (\u2013S\u2013)",
            "Disulfide group (\u2013S\u2013S\u2013)",
            "Epoxide group",
            "Isocyanate group (\u2013N=C=O)",
            "Isothiocyanate group (\u2013N=C=S)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (\u2013OH)",
                "Carbonyl group (\u2013C=O)",
                "Carboxyl group (\u2013COOH)",
                "Amino group (\u2013NH2)",
                "Thiol group (\u2013SH)",
                "Ether group (\u2013O\u2013)",
                "Ester group (\u2013COO\u2013)",
                "Amide group (\u2013CONH\u2013)",
                "Phosphate group (\u2013OPO3H\u2013)",
                "Sulfonate group (\u2013SO3H)",
                "Nitro group (\u2013NO2)",
                "Nitrile group (\u2013C\u2261N)",
                "Alkene group (\u2013C=C\u2013)",
                "Alkyne group (\u2013C\u2261C\u2013)",
                "Aromatic ring",
                "Halide group (\u2013X, where X = F, Cl, Br, I)",
                "Aldehyde group (\u2013CHO)",
                "Ketone group (\u2013C(=O)\u2013)",
                "Amine group (\u2013NR2, where R = alkyl or aryl)",
                "Sulfide group (\u2013S\u2013)",
                "Disulfide group (\u2013S\u2013S\u2013)",
                "Epoxide group",
                "Isocyanate group (\u2013N=C=O)",
                "Isothiocyanate group (\u2013N=C=S)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldehyde group (\u2013CHO)",
                "Alkene group (\u2013C=C\u2013)",
                "Alkyne group (\u2013C\u2261C\u2013)",
                "Amide group (\u2013CONH\u2013)",
                "Amine group (\u2013NR2, where R = alkyl or aryl)",
                "Amino group (\u2013NH2)",
                "Aromatic ring",
                "Carbonyl group (\u2013C=O)",
                "Carboxyl group (\u2013COOH)",
                "Disulfide group (\u2013S\u2013S\u2013)",
                "Epoxide group",
                "Ester group (\u2013COO\u2013)",
                "Ether group (\u2013O\u2013)",
                "Halide group (\u2013X, where X = F, Cl, Br, I)",
                "Hydroxyl group (\u2013OH)",
                "Isocyanate group (\u2013N=C=O)",
                "Isothiocyanate group (\u2013N=C=S)",
                "Ketone group (\u2013C(=O)\u2013)",
                "Nitrile group (\u2013C\u2261N)",
                "Nitro group (\u2013NO2)",
                "Phosphate group (\u2013OPO3H\u2013)",
                "Sulfide group (\u2013S\u2013)",
                "Sulfonate group (\u2013SO3H)",
                "Thiol group (\u2013SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl Group (-OH)",
            "Carboxyl Group (-COOH)",
            "Amino Group (-NH2)",
            "Carbonyl Group (C=O)",
            "Sulfhydryl Group (-SH)",
            "Alkyl Group (-R)",
            "Ether Group (-O-)",
            "Ester Group (-COO-)",
            "Nitro Group (-NO2)",
            "Halogen Group (-X, where X = F, Cl, Br, I)",
            "Phosphate Group (-PO4)",
            "Cyano Group (-CN)",
            "Aldehyde Group (-CHO)",
            "Ketone Group (C=O)",
            "Amide Group (-CONH2)",
            "Thioether Group (-S-)",
            "Sulfonyl Group (-SO2-)",
            "Phosphonate Group (-PO3H2)",
            "Epoxy Group (C-O-C)",
            "Acyl Halide Group (-COX, where X = F, Cl, Br, I)",
            "Isocyanate Group (-N=C=O)",
            "Isothiocyanate Group (-N=C=S)",
            "Diazonium Group (-N\u2261N+)",
            "Hydrazine Group (-NH-NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl Group (-OH)",
                "Carboxyl Group (-COOH)",
                "Amino Group (-NH2)",
                "Carbonyl Group (C=O)",
                "Sulfhydryl Group (-SH)",
                "Alkyl Group (-R)",
                "Ether Group (-O-)",
                "Ester Group (-COO-)",
                "Nitro Group (-NO2)",
                "Halogen Group (-X, where X = F, Cl, Br, I)",
                "Phosphate Group (-PO4)",
                "Cyano Group (-CN)",
                "Aldehyde Group (-CHO)",
                "Ketone Group (C=O)",
                "Amide Group (-CONH2)",
                "Thioether Group (-S-)",
                "Sulfonyl Group (-SO2-)",
                "Phosphonate Group (-PO3H2)",
                "Epoxy Group (C-O-C)",
                "Acyl Halide Group (-COX, where X = F, Cl, Br, I)",
                "Isocyanate Group (-N=C=O)",
                "Isothiocyanate Group (-N=C=S)",
                "Diazonium Group (-N\u2261N+)",
                "Hydrazine Group (-NH-NH2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl Halide Group (-COX, where X = F, Cl, Br, I)",
                "Aldehyde Group (-CHO)",
                "Alkyl Group (-R)",
                "Amide Group (-CONH2)",
                "Amino Group (-NH2)",
                "Carbonyl Group (C=O)",
                "Carboxyl Group (-COOH)",
                "Cyano Group (-CN)",
                "Diazonium Group (-N\u2261N+)",
                "Epoxy Group (C-O-C)",
                "Ester Group (-COO-)",
                "Ether Group (-O-)",
                "Halogen Group (-X, where X = F, Cl, Br, I)",
                "Hydrazine Group (-NH-NH2)",
                "Hydroxyl Group (-OH)",
                "Isocyanate Group (-N=C=O)",
                "Isothiocyanate Group (-N=C=S)",
                "Ketone Group (C=O)",
                "Nitro Group (-NO2)",
                "Phosphate Group (-PO4)",
                "Phosphonate Group (-PO3H2)",
                "Sulfhydryl Group (-SH)",
                "Sulfonyl Group (-SO2-)",
                "Thioether Group (-S-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Alkyl group (-CH3, -CH2CH3, etc.) (R)",
            "Alkenyl group (-CH=CH2, -CH=CHCH3, etc.) (R)",
            "Alkynyl group (-C\u2261CH, -C\u2261CCH3, etc.) (R)",
            "Amino group (-NH2)",
            "Carbonyl group (C=O)",
            "Carboxyl group (-COOH)",
            "Carboxamide group (-CO-NH2)",
            "Ester group (-COO-R)",
            "Ether group (-O-R)",
            "Halogen group (F, Cl, Br, I)",
            "Hydroxyl group (-OH)",
            "Imine group (-CH=N-R)",
            "Isocyanate group (-N=C=O)",
            "Ketone group (C=O)",
            "Methoxy group (-O-CH3)",
            "Nitrile group (-CN)",
            "Nitro group (-NO2)",
            "Phenyl group (-C6H5)",
            "Phosphoryl group (-PO3H2)",
            "Sulfate group (-SO3H)",
            "Sulfhydryl group (-SH)",
            "Sulfonamide group (-SO2-NH2)",
            "Sulfonyl group (-SO2-R)",
            "Thiol group (-SH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alkyl group (-CH3, -CH2CH3, etc.) (R)",
                "Alkenyl group (-CH=CH2, -CH=CHCH3, etc.) (R)",
                "Alkynyl group (-C\u2261CH, -C\u2261CCH3, etc.) (R)",
                "Amino group (-NH2)",
                "Carbonyl group (C=O)",
                "Carboxyl group (-COOH)",
                "Carboxamide group (-CO-NH2)",
                "Ester group (-COO-R)",
                "Ether group (-O-R)",
                "Halogen group (F, Cl, Br, I)",
                "Hydroxyl group (-OH)",
                "Imine group (-CH=N-R)",
                "Isocyanate group (-N=C=O)",
                "Ketone group (C=O)",
                "Methoxy group (-O-CH3)",
                "Nitrile group (-CN)",
                "Nitro group (-NO2)",
                "Phenyl group (-C6H5)",
                "Phosphoryl group (-PO3H2)",
                "Sulfate group (-SO3H)",
                "Sulfhydryl group (-SH)",
                "Sulfonamide group (-SO2-NH2)",
                "Sulfonyl group (-SO2-R)",
                "Thiol group (-SH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkenyl group (-CH=CH2, -CH=CHCH3, etc.) (R)",
                "Alkyl group (-CH3, -CH2CH3, etc.) (R)",
                "Alkynyl group (-C\u2261CH, -C\u2261CCH3, etc.) (R)",
                "Amino group (-NH2)",
                "Carbonyl group (C=O)",
                "Carboxamide group (-CO-NH2)",
                "Carboxyl group (-COOH)",
                "Ester group (-COO-R)",
                "Ether group (-O-R)",
                "Halogen group (F, Cl, Br, I)",
                "Hydroxyl group (-OH)",
                "Imine group (-CH=N-R)",
                "Isocyanate group (-N=C=O)",
                "Ketone group (C=O)",
                "Methoxy group (-O-CH3)",
                "Nitrile group (-CN)",
                "Nitro group (-NO2)",
                "Phenyl group (-C6H5)",
                "Phosphoryl group (-PO3H2)",
                "Sulfate group (-SO3H)",
                "Sulfhydryl group (-SH)",
                "Sulfonamide group (-SO2-NH2)",
                "Sulfonyl group (-SO2-R)",
                "Thiol group (-SH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Hydroxyl group (OH)",
            "Carbonyl group (CO)",
            "Carboxyl group (COOH)",
            "Amino group (NH2)",
            "Methyl group (CH3)",
            "Methylene group (CH2)",
            "Methoxy group (OCH3)",
            "Epoxy group",
            "Aldehyde group (CHO)",
            "Ketone group (RC(=O)R')",
            "Ester group (RC(=O)OR')",
            "Ether group (R-O-R')",
            "Amide group (RCONR')",
            "Nitrile group (CN)",
            "Isocyanate group (NCO)",
            "Cyano group (CN)",
            "Alkyl group (R)",
            "Aryl group (Ar)",
            "Vinyl group",
            "Allyl group",
            "Acyl group (RC(=O)-)",
            "Sulfhydryl group (SH)",
            "Phosphoryl group (PO4)",
            "Thiol group (RSH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxyl group (OH)",
                "Carbonyl group (CO)",
                "Carboxyl group (COOH)",
                "Amino group (NH2)",
                "Methyl group (CH3)",
                "Methylene group (CH2)",
                "Methoxy group (OCH3)",
                "Epoxy group",
                "Aldehyde group (CHO)",
                "Ketone group (RC(=O)R')",
                "Ester group (RC(=O)OR')",
                "Ether group (R-O-R')",
                "Amide group (RCONR')",
                "Nitrile group (CN)",
                "Isocyanate group (NCO)",
                "Cyano group (CN)",
                "Alkyl group (R)",
                "Aryl group (Ar)",
                "Vinyl group",
                "Allyl group",
                "Acyl group (RC(=O)-)",
                "Sulfhydryl group (SH)",
                "Phosphoryl group (PO4)",
                "Thiol group (RSH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acyl group (RC(=O)-)",
                "Aldehyde group (CHO)",
                "Alkyl group (R)",
                "Allyl group",
                "Amide group (RCONR')",
                "Amino group (NH2)",
                "Aryl group (Ar)",
                "Carbonyl group (CO)",
                "Carboxyl group (COOH)",
                "Cyano group (CN)",
                "Epoxy group",
                "Ester group (RC(=O)OR')",
                "Ether group (R-O-R')",
                "Hydroxyl group (OH)",
                "Isocyanate group (NCO)",
                "Ketone group (RC(=O)R')",
                "Methoxy group (OCH3)",
                "Methyl group (CH3)",
                "Methylene group (CH2)",
                "Nitrile group (CN)",
                "Phosphoryl group (PO4)",
                "Sulfhydryl group (SH)",
                "Thiol group (RSH)",
                "Vinyl group"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "functional group",
        "domain": "chemistry",
        "response": [
            "Acetyl group",
            "Alkenyl group",
            "Alkyl group",
            "Aldehyde group",
            "Amide group",
            "Aromatic group",
            "Carboxylic acid group",
            "Ether group",
            "Halogenoalkane group",
            "Hydroxyl group",
            "Iminium ion",
            "Isocyanate group",
            "Isothiocyanate group",
            "Isothiocyanate group",
            "Ketone group",
            "Methyl group",
            "Nitrile group",
            "Phenol group",
            "Primary amine group",
            "Secondary amine group",
            "Sulfonyl group",
            "Sulfonyl group",
            "Thiol group",
            "Thioether group",
            "Thiol group",
            "Trifluoromethanesulfonyl group"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl group",
                "Alkenyl group",
                "Alkyl group",
                "Aldehyde group",
                "Amide group",
                "Aromatic group",
                "Carboxylic acid group",
                "Ether group",
                "Halogenoalkane group",
                "Hydroxyl group",
                "Iminium ion",
                "Isocyanate group",
                "Isothiocyanate group",
                "Ketone group",
                "Methyl group",
                "Nitrile group",
                "Phenol group",
                "Primary amine group",
                "Secondary amine group",
                "Sulfonyl group",
                "Thiol group",
                "Thioether group"
            ],
            "mismatches": [
                "Trifluoromethanesulfonyl group"
            ],
            "true_referents": [
                "Acetyl group",
                "Aldehyde group",
                "Alkenyl group",
                "Alkyl group",
                "Amide group",
                "Aromatic group",
                "Carboxylic acid group",
                "Ether group",
                "Halogenoalkane group",
                "Hydroxyl group",
                "Iminium ion",
                "Isocyanate group",
                "Isothiocyanate group",
                "Ketone group",
                "Methyl group",
                "Nitrile group",
                "Phenol group",
                "Primary amine group",
                "Secondary amine group",
                "Sulfonyl group",
                "Thioether group",
                "Thiol group"
            ],
            "TP": 22,
            "FP": 1,
            "FN": 0
        }
    }
]