[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane chloride (CH3Cl)",
            "Ethane chloride (C2H5Cl)",
            "Bromoethane (C2H5Br)",
            "1,2-Dibromoethane (C2H4Br2)",
            "Tetrachloromethane (CCl4)",
            "Trichloromethane (CHCl3)",
            "Bromochloromethane (CH2BrCl)",
            "Chloroform (CHCl3)",
            "Bromomethane (CH3Br)",
            "1,1-Dichloroethane (C2H4Cl2)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "1,1,2-Trichloroethane (C2H3Cl3)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "Bromochlorodifluoromethane (CF2ClBr)",
            "1,2-Dibromo-1-chloroethane (C2H3Br2Cl)",
            "1,1-Dibromo-2-chloroethane (C2H3Br2Cl)",
            "1,2-Dichloro-1-fluoroethane (C2H4Cl2F)",
            "1,1-Dichloro-2-fluoroethane (C2H4Cl2F)",
            "1,1-Dichloro-1-fluoroethane (C2H4Cl2F)",
            "1,1,1-Trichloro-2-fluoroethane (C2H2Cl3F)",
            "1,1,2-Trichloro-1-fluoroethane (C2H2Cl3F)",
            "1,1,1-Trifluoro-2-chloroethane (C2H2F3Cl)",
            "1,1,2-Trifluoro-1-chloroethane (C2H2F3Cl)",
            "1,1-Difluoro-2-chloroethane (C2H4F2Cl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "1,1,2-Trichloroethane (C2H3Cl3)"
            ],
            "mismatches": [
                "Methane chloride (CH3Cl)",
                "Ethane chloride (C2H5Cl)",
                "Bromoethane (C2H5Br)",
                "1,2-Dibromoethane (C2H4Br2)",
                "Tetrachloromethane (CCl4)",
                "Bromochloromethane (CH2BrCl)",
                "Bromomethane (CH3Br)",
                "1,1-Dichloroethane (C2H4Cl2)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "Bromochlorodifluoromethane (CF2ClBr)",
                "1,2-Dibromo-1-chloroethane (C2H3Br2Cl)",
                "1,1-Dibromo-2-chloroethane (C2H3Br2Cl)",
                "1,2-Dichloro-1-fluoroethane (C2H4Cl2F)",
                "1,1-Dichloro-2-fluoroethane (C2H4Cl2F)",
                "1,1-Dichloro-1-fluoroethane (C2H4Cl2F)",
                "1,1,1-Trichloro-2-fluoroethane (C2H2Cl3F)",
                "1,1,2-Trichloro-1-fluoroethane (C2H2Cl3F)",
                "1,1,1-Trifluoro-2-chloroethane (C2H2F3Cl)",
                "1,1,2-Trifluoro-1-chloroethane (C2H2F3Cl)",
                "1,1-Difluoro-2-chloroethane (C2H4F2Cl)"
            ],
            "true_referents": [
                "Bromochlorofluorocarbons",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Trihalomethanes"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Bromomethane (CH3Br)",
            "Dichloromethane (CH2Cl2)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "1-Bromo-2-chloroethane (C2H4BrCl)",
            "1,2-Dibromoethane (C2H4Br2)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "Tetrachloroethylene (C2Cl4)",
            "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
            "Chloroform (CHCl3)",
            "Bromochloromethane (CH2BrCl)",
            "1,1,2-Trichloroethane (C2H3Cl3)",
            "Trichlorofluoromethane (CCl3F)",
            "1-Chloropropane (C3H7Cl)",
            "1-Bromopropane (C3H7Br)",
            "2-Chloro-2-methylpropane (C4H9Cl)",
            "1,1-Dichloroethane (C2H4Cl2)",
            "1,1,2-Trichloro-1,2,2-trifluoroethane (C2Cl3F3)",
            "1,2-Dibromopropane (C3H6Br2)",
            "1,2-Dichloropropane (C3H6Cl2)",
            "1-Bromo-2-chloro-2-fluoroethane (C2H3BrClF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Tetrachloroethylene (C2Cl4)"
            ],
            "mismatches": [
                "Bromomethane (CH3Br)",
                "Dichloromethane (CH2Cl2)",
                "Chlorobenzene (C6H5Cl)",
                "Bromobenzene (C6H5Br)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "1-Bromo-2-chloroethane (C2H4BrCl)",
                "1,2-Dibromoethane (C2H4Br2)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
                "Bromochloromethane (CH2BrCl)",
                "1,1,2-Trichloroethane (C2H3Cl3)",
                "Trichlorofluoromethane (CCl3F)",
                "1-Chloropropane (C3H7Cl)",
                "1-Bromopropane (C3H7Br)",
                "2-Chloro-2-methylpropane (C4H9Cl)",
                "1,1-Dichloroethane (C2H4Cl2)",
                "1,1,2-Trichloro-1,2,2-trifluoroethane (C2Cl3F3)",
                "1,2-Dibromopropane (C3H6Br2)",
                "1,2-Dichloropropane (C3H6Cl2)",
                "1-Bromo-2-chloro-2-fluoroethane (C2H3BrClF)"
            ],
            "true_referents": [
                "Bromobenzenes",
                "Bromochlorofluorocarbons",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hydrocarbons, Brominated",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Trihalomethanes"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroethane (Ethyl chloride)",
            "Bromomethane (Methyl bromide)",
            "Iodoethane (Ethyl iodide)",
            "Chloroform (Trichloromethane)",
            "Carbon tetrachloride (Tetrachloromethane)",
            "Dichloromethane (Methylene chloride)",
            "Tetrafluoroethane (HFC-134a)",
            "1,2-Dichloroethane",
            "1,1,1-Trichloroethane",
            "1,2-Dibromoethane",
            "Chlorobenzene",
            "Bromobenzene",
            "Iodobenzene",
            "1,1-Dichloroethene",
            "1,2-Dichloroethene",
            "Vinyl chloride (Chloroethene)",
            "Trifluoroacetic acid (TFA)",
            "Hexachlorobutadiene",
            "1,1,2,2-Tetrachloroethane",
            "1,2,3-Trichloropropane",
            "1,1,2-Trichloro-1,2,2-trifluoroethane (CFC-113)",
            "1,2-Dichloropropane",
            "1,3-Dichloropropene",
            "1,1-Dichloroethylene"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (Trichloromethane)",
                "Carbon tetrachloride (Tetrachloromethane)",
                "Dichloromethane (Methylene chloride)",
                "1,2-Dibromoethane",
                "Chlorobenzene",
                "Bromobenzene",
                "Iodobenzene",
                "Vinyl chloride (Chloroethene)",
                "Trifluoroacetic acid (TFA)"
            ],
            "mismatches": [
                "Chloroethane (Ethyl chloride)",
                "Bromomethane (Methyl bromide)",
                "Iodoethane (Ethyl iodide)",
                "Tetrafluoroethane (HFC-134a)",
                "1,2-Dichloroethane",
                "1,1,1-Trichloroethane",
                "1,1-Dichloroethene",
                "1,2-Dichloroethene",
                "Hexachlorobutadiene",
                "1,1,2,2-Tetrachloroethane",
                "1,2,3-Trichloropropane",
                "1,1,2-Trichloro-1,2,2-trifluoroethane (CFC-113)",
                "1,2-Dichloropropane",
                "1,3-Dichloropropene",
                "1,1-Dichloroethylene"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Dichloroethylenes",
                "Dinitrochlorobenzene",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluoroacetates",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Heptachlor",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iophendylate",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Bromoethane (C2H5Br)",
            "Iodoethane (C2H5I)",
            "Dichloromethane (CH2Cl2)",
            "Trichloromethane (CHCl3) - Chloroform",
            "Tetrachloromethane (CCl4) - Carbon Tetrachloride",
            "1-Bromopropane (C3H7Br)",
            "2-Chloropropane (C3H7Cl)",
            "1,2-Dibromoethane (C2H4Br2)",
            "1-Chlorobutane (C4H9Cl)",
            "2-Chlorobutane (C4H9Cl)",
            "Pentafluoroethane (C2HF5)",
            "Trifluoromethane (CHF3)",
            "Hexafluoroethane (C2F6)",
            "Vinyl Chloride (C2H3Cl)",
            "Allyl Chloride (C3H5Cl)",
            "2,2-Dichloropropane (C3H6Cl2)",
            "1-Bromo-2-chloroethane (C2H4BrCl)",
            "1,1,2-Trichloroethane (C2H3Cl3)",
            "1,1,1-Trifluoroethane (C2H3F3)",
            "Difluorobromomethane (CHBrF2)",
            "Chlorofluoromethane (CH2ClF)",
            "1-Chloropropane (C3H7Cl)",
            "2-Bromopropane (C3H7Br)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Carbon Tetrachloride",
                "Ethylene Dibromide",
                "Vinyl Chloride"
            ],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Bromoethane (C2H5Br)",
                "Iodoethane (C2H5I)",
                "Dichloromethane (CH2Cl2)",
                "Trichloromethane (CHCl3) - Chloroform",
                "1-Bromopropane (C3H7Br)",
                "2-Chloropropane (C3H7Cl)",
                "1-Chlorobutane (C4H9Cl)",
                "2-Chlorobutane (C4H9Cl)",
                "Pentafluoroethane (C2HF5)",
                "Trifluoromethane (CHF3)",
                "Hexafluoroethane (C2F6)",
                "Allyl Chloride (C3H5Cl)",
                "2,2-Dichloropropane (C3H6Cl2)",
                "1-Bromo-2-chloroethane (C2H4BrCl)",
                "1,1,2-Trichloroethane (C2H3Cl3)",
                "1,1,1-Trifluoroethane (C2H3F3)",
                "Difluorobromomethane (CHBrF2)",
                "Chlorofluoromethane (CH2ClF)",
                "1-Chloropropane (C3H7Cl)",
                "2-Bromopropane (C3H7Br)"
            ],
            "true_referents": [
                "Bromochlorofluorocarbons",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluorocarbons",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Trihalomethanes",
                "Vinyl Chloride"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Bromomethane (CH3Br)",
            "Dichloromethane (CH2Cl2)",
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Chloroethane (C2H5Cl)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "Tetrachloroethene (C2Cl4)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "Fluorobenzene (C6H5F)",
            "1,2-Dibromoethane (C2H4Br2)",
            "1,1-Dichloroethene (C2H2Cl2)",
            "Vinyl chloride (C2H3Cl)",
            "1,2-Difluoroethane (C2H4F2)",
            "1-Bromo-2-chloroethane (C2H4BrCl)",
            "1-Chloropropane (C3H7Cl)",
            "1-Bromopropane (C3H7Br)",
            "1-Iodopropane (C3H7I)",
            "1-Fluoropropane (C3H7F)",
            "1-Chlorobutane (C4H9Cl)",
            "1-Bromobutane (C4H9Br)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)",
                "Fluorobenzene (C6H5F)",
                "Vinyl chloride (C2H3Cl)"
            ],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Bromomethane (CH3Br)",
                "Dichloromethane (CH2Cl2)",
                "Chloroethane (C2H5Cl)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "Tetrachloroethene (C2Cl4)",
                "Chlorobenzene (C6H5Cl)",
                "1,2-Dibromoethane (C2H4Br2)",
                "1,1-Dichloroethene (C2H2Cl2)",
                "1,2-Difluoroethane (C2H4F2)",
                "1-Bromo-2-chloroethane (C2H4BrCl)",
                "1-Chloropropane (C3H7Cl)",
                "1-Bromopropane (C3H7Br)",
                "1-Iodopropane (C3H7I)",
                "1-Fluoropropane (C3H7F)",
                "1-Chlorobutane (C4H9Cl)",
                "1-Bromobutane (C4H9Br)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Bromoethane (C2H5Br)",
            "Iodoethane (C2H5I)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "1-Bromo-2-methylpropane (C4H9Br)",
            "Chloroacetic acid (C2HClO2)",
            "1,1-Dichloroethane (C2H4Cl2)",
            "1,2-Dichloropropane (C3H6Cl2)",
            "Bromobenzene (C6H5Br)",
            "1-Chlorobutane (C4H9Cl)",
            "2-Chloropropane (C3H7Cl)",
            "Bromochloromethane (CH2BrCl)",
            "1-Bromo-1-methylcyclopropane (C4H7Br)",
            "1,3-Dichlorobenzene (C6H4Cl2)",
            "1-Chloro-3-methylbutane (C5H11Cl)",
            "1-Iodobutane (C4H9I)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "Bromodichloromethane (CHBrCl2)",
            "1-Bromo-3-chloropropane (C3H6BrCl)",
            "2-Bromobutane (C4H9Br)",
            "Chlorodifluoromethane (CHClF2)",
            "1-Chloro-2-methylpropane (C4H9Cl)",
            "Perfluorooctane (C8F18)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Bromobenzene (C6H5Br)",
                "1,1,1-Trichloroethane (C2H3Cl3)"
            ],
            "mismatches": [
                "Bromoethane (C2H5Br)",
                "Iodoethane (C2H5I)",
                "Dichloromethane (CH2Cl2)",
                "1-Bromo-2-methylpropane (C4H9Br)",
                "Chloroacetic acid (C2HClO2)",
                "1,1-Dichloroethane (C2H4Cl2)",
                "1,2-Dichloropropane (C3H6Cl2)",
                "1-Chlorobutane (C4H9Cl)",
                "2-Chloropropane (C3H7Cl)",
                "Bromochloromethane (CH2BrCl)",
                "1-Bromo-1-methylcyclopropane (C4H7Br)",
                "1,3-Dichlorobenzene (C6H4Cl2)",
                "1-Chloro-3-methylbutane (C5H11Cl)",
                "1-Iodobutane (C4H9I)",
                "Bromodichloromethane (CHBrCl2)",
                "1-Bromo-3-chloropropane (C3H6BrCl)",
                "2-Bromobutane (C4H9Br)",
                "Chlorodifluoromethane (CHClF2)",
                "1-Chloro-2-methylpropane (C4H9Cl)",
                "Perfluorooctane (C8F18)"
            ],
            "true_referents": [
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chloroacetates",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chloroform",
                "Dichloroacetic Acid",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroethanes",
                "Trichloroethylene"
            ],
            "TP": 5,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Bromomethane (CH3Br)",
            "Iodomethane (CH3I)",
            "Fluoromethane (CH3F)",
            "Dichloromethane (CH2Cl2)",
            "Dibromomethane (CH2Br2)",
            "Diiodomethane (CH2I2)",
            "Difluoromethane (CH2F2)",
            "Trichloromethane (CHCl3)",
            "Tribromomethane (CHBr3)",
            "Triiodomethane (CHI3)",
            "Trifluoromethane (CHF3)",
            "Tetrachloromethane (CCl4)",
            "Tetrabromomethane (CBr4)",
            "Tetraiodomethane (CI4)",
            "Tetrafluoromethane (CF4)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "1,2-Dibromoethane (C2H4Br2)",
            "1,2-Diiodoethane (C2H4I2)",
            "1,2-Difluoroethane (C2H4F2)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "1,1,1-Tribromoethane (C2H3Br3)",
            "1,1,1-Triiodoethane (C2H3I3)",
            "1,1,1-Trifluoroethane (C2H3F3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloromethane (CH3Cl)",
                "Tetrachloromethane (CCl4)",
                "1,2-Dibromoethane (C2H4Br2)",
                "1,1,1-Trichloroethane (C2H3Cl3)"
            ],
            "mismatches": [
                "Bromomethane (CH3Br)",
                "Iodomethane (CH3I)",
                "Fluoromethane (CH3F)",
                "Dichloromethane (CH2Cl2)",
                "Dibromomethane (CH2Br2)",
                "Diiodomethane (CH2I2)",
                "Difluoromethane (CH2F2)",
                "Trichloromethane (CHCl3)",
                "Tribromomethane (CHBr3)",
                "Triiodomethane (CHI3)",
                "Trifluoromethane (CHF3)",
                "Tetrabromomethane (CBr4)",
                "Tetraiodomethane (CI4)",
                "Tetrafluoromethane (CF4)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "1,2-Diiodoethane (C2H4I2)",
                "1,2-Difluoroethane (C2H4F2)",
                "1,1,1-Tribromoethane (C2H3Br3)",
                "1,1,1-Triiodoethane (C2H3I3)",
                "1,1,1-Trifluoroethane (C2H3F3)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorofluorocarbons, Ethane",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Fluorocarbons",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetamide",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Trihalomethanes"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Bromomethane (CH3Br)",
            "Iodoethane (C2H5I)",
            "Fluorobenzene (C6H5F)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "Chloroethane (C2H5Cl)",
            "Bromoethane (C2H5Br)",
            "Iodoethane (C2H5I)",
            "Chloromethane (CH3Cl)",
            "Bromomethane (CH3Br)",
            "Iodomethane (CH3I)",
            "Chloroethene (C2H3Cl)",
            "Bromoethene (C2H3Br)",
            "Iodoethene (C2H3I)",
            "Chloroethyne (C2HCl)",
            "Bromoethyne (C2HBr)",
            "Iodoethyne (C2HI)",
            "Fluoromethane (CH3F)",
            "Fluoroethane (C2H5F)",
            "Fluoropropane (C3H7F)",
            "Fluorobutane (C4H9F)",
            "Fluoropentane (C5H11F)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Chlorobenzene (C6H5Cl)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)",
                "Chloromethane (CH3Cl)",
                "Fluorobenzene (C6H5F)"
            ],
            "mismatches": [
                "Bromomethane (CH3Br)",
                "Iodoethane (C2H5I)",
                "Chloroethane (C2H5Cl)",
                "Bromoethane (C2H5Br)",
                "Iodomethane (CH3I)",
                "Chloroethene (C2H3Cl)",
                "Bromoethene (C2H3Br)",
                "Iodoethene (C2H3I)",
                "Chloroethyne (C2HCl)",
                "Bromoethyne (C2HBr)",
                "Iodoethyne (C2HI)",
                "Fluoromethane (CH3F)",
                "Fluoroethane (C2H5F)",
                "Fluoropropane (C3H7F)",
                "Fluorobutane (C4H9F)",
                "Fluoropentane (C5H11F)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iophendylate",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethylene",
                "Trifluoroacetic Acid"
            ],
            "TP": 6,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH\u2083Cl)",
            "Dichloromethane (CH\u2082Cl\u2082)",
            "Chloroethane (C\u2082H\u2085Cl)",
            "1,2-Dichloroethane (C\u2082H\u2084Cl\u2082)",
            "Trichloroethane (C\u2082H\u2083Cl\u2083)",
            "Tetrachloroethane (C\u2082H\u2082Cl\u2084)",
            "Fluoromethane (CH\u2083F)",
            "Bromomethane (CH\u2083Br)",
            "Iodomethane (CH\u2083I)",
            "Chloropropane (C\u2083H\u2087Cl)",
            "1,2-Dichloropropane (C\u2083H\u2086Cl\u2082)",
            "Trichloropropane (C\u2083H\u2085Cl\u2083)",
            "Tetrachloropropane (C\u2083H\u2084Cl\u2084)",
            "Fluoropropane (C\u2083H\u2087F)",
            "Bromopropane (C\u2083H\u2087Br)",
            "Iodopropane (C\u2083H\u2087I)",
            "Chlorobenzene (C\u2086H\u2085Cl)",
            "Dichlorobenzene (C\u2086H\u2084Cl\u2082)",
            "Trichlorobenzene (C\u2086H\u2083Cl\u2083)",
            "Tetrachlorobenzene (C\u2086H\u2082Cl\u2084)",
            "Fluorobenzene (C\u2086H\u2085F)",
            "Bromobenzene (C\u2086H\u2085Br)",
            "Iodobenzene (C\u2086H\u2085I)",
            "Carbon Tetrachloride (CCl\u2084)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chlorobenzene (C\u2086H\u2085Cl)",
                "Fluorobenzene (C\u2086H\u2085F)",
                "Bromobenzene (C\u2086H\u2085Br)",
                "Iodobenzene (C\u2086H\u2085I)",
                "Carbon Tetrachloride (CCl\u2084)"
            ],
            "mismatches": [
                "Chloromethane (CH\u2083Cl)",
                "Dichloromethane (CH\u2082Cl\u2082)",
                "Chloroethane (C\u2082H\u2085Cl)",
                "1,2-Dichloroethane (C\u2082H\u2084Cl\u2082)",
                "Trichloroethane (C\u2082H\u2083Cl\u2083)",
                "Tetrachloroethane (C\u2082H\u2082Cl\u2084)",
                "Fluoromethane (CH\u2083F)",
                "Bromomethane (CH\u2083Br)",
                "Iodomethane (CH\u2083I)",
                "Chloropropane (C\u2083H\u2087Cl)",
                "1,2-Dichloropropane (C\u2083H\u2086Cl\u2082)",
                "Trichloropropane (C\u2083H\u2085Cl\u2083)",
                "Tetrachloropropane (C\u2083H\u2084Cl\u2084)",
                "Fluoropropane (C\u2083H\u2087F)",
                "Bromopropane (C\u2083H\u2087Br)",
                "Iodopropane (C\u2083H\u2087I)",
                "Dichlorobenzene (C\u2086H\u2084Cl\u2082)",
                "Trichlorobenzene (C\u2086H\u2083Cl\u2083)",
                "Tetrachlorobenzene (C\u2086H\u2082Cl\u2084)"
            ],
            "true_referents": [
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iopanoic Acid",
                "Iophendylate",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Dichloromethane (CH2Cl2)",
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Fluoromethane (CH3F)",
            "Difluoromethane (CH2F2)",
            "Trifluoromethane (CHF3)",
            "Tetrafluoromethane (CF4)",
            "Bromomethane (CH3Br)",
            "Iodomethane (CH3I)",
            "Chloroethane (C2H5Cl)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Vinyl chloride (C2H3Cl)",
            "1-Chloropropane (C3H7Cl)",
            "2-Chloropropane (C3H7Cl)",
            "1-Bromopropane (C3H7Br)",
            "2-Bromopropane (C3H7Br)",
            "1-Iodopropane (C3H7I)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "Fluorobenzene (C6H5F)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Vinyl chloride (C2H3Cl)",
                "Chlorobenzene (C6H5Cl)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)"
            ],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Dichloromethane (CH2Cl2)",
                "Fluoromethane (CH3F)",
                "Difluoromethane (CH2F2)",
                "Trifluoromethane (CHF3)",
                "Tetrafluoromethane (CF4)",
                "Bromomethane (CH3Br)",
                "Iodomethane (CH3I)",
                "Chloroethane (C2H5Cl)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "1-Chloropropane (C3H7Cl)",
                "2-Chloropropane (C3H7Cl)",
                "1-Bromopropane (C3H7Br)",
                "2-Bromopropane (C3H7Br)",
                "1-Iodopropane (C3H7I)",
                "Fluorobenzene (C6H5F)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Bromomethane (CH3Br)",
            "Iodomethane (CH3I)",
            "Dichloromethane (CH2Cl2)",
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Vinyl chloride (C2H3Cl)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "1,2-Dichlorobenzene (C6H4Cl2)",
            "1,3-Dichlorobenzene (C6H4Cl2)",
            "1,4-Dichlorobenzene (C6H4Cl2)",
            "1,2,3-Trichlorobenzene (C6H3Cl3)",
            "1,2,4-Trichlorobenzene (C6H3Cl3)",
            "1,3,5-Trichlorobenzene (C6H3Cl3)",
            "1,2,3,4-Tetrachlorobenzene (C6H2Cl4)",
            "1,2,3,5-Tetrachlorobenzene (C6H2Cl4)",
            "1,2,4,5-Tetrachlorobenzene (C6H2Cl4)",
            "Pentachlorobenzene (C6HCl5)",
            "Hexachlorobenzene (C6Cl6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Vinyl chloride (C2H3Cl)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)",
                "Hexachlorobenzene (C6Cl6)"
            ],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Bromomethane (CH3Br)",
                "Iodomethane (CH3I)",
                "Dichloromethane (CH2Cl2)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "Chlorobenzene (C6H5Cl)",
                "1,2-Dichlorobenzene (C6H4Cl2)",
                "1,3-Dichlorobenzene (C6H4Cl2)",
                "1,4-Dichlorobenzene (C6H4Cl2)",
                "1,2,3-Trichlorobenzene (C6H3Cl3)",
                "1,2,4-Trichlorobenzene (C6H3Cl3)",
                "1,3,5-Trichlorobenzene (C6H3Cl3)",
                "1,2,3,4-Tetrachlorobenzene (C6H2Cl4)",
                "1,2,3,5-Tetrachlorobenzene (C6H2Cl4)",
                "1,2,4,5-Tetrachlorobenzene (C6H2Cl4)",
                "Pentachlorobenzene (C6HCl5)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Vinyl Chloride"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Bromomethane (CH3Br)",
            "Iodomethane (CH3I)",
            "Fluoromethane (CH3F)",
            "Chloroethane (C2H5Cl)",
            "Bromoethane (C2H5Br)",
            "Iodoethane (C2H5I)",
            "Fluoroethane (C2H5F)",
            "1,1-Dichloroethane (CH3CHCl2)",
            "1,2-Dichloroethane (CH2ClCH2Cl)",
            "1,1,1-Trichloroethane (CH3CCl3)",
            "1,1,2-Trichloroethane (CH2ClCHCl2)",
            "1,1,1,2-Tetrachloroethane (CHCl2CHCl2)",
            "Chloroform (CHCl3)",
            "Bromoform (CHBr3)",
            "Iodoform (CHI3)",
            "Chlorofluoromethane (CH2ClF)",
            "Dichlorodifluoromethane (CCl2F2)",
            "Trichlorofluoromethane (CCl3F)",
            "Tetrachlorofluoroethane (C2Cl4F2)",
            "Vinyl chloride (C2H3Cl)",
            "Vinylidene chloride (C2H2Cl2)",
            "Trichloroethylene (C2HCl3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "1,1,1-Trichloroethane (CH3CCl3)",
                "1,1,2-Trichloroethane (CH2ClCHCl2)",
                "Trichloroethylene (C2HCl3)",
                "Vinyl chloride (C2H3Cl)"
            ],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Bromomethane (CH3Br)",
                "Iodomethane (CH3I)",
                "Fluoromethane (CH3F)",
                "Chloroethane (C2H5Cl)",
                "Bromoethane (C2H5Br)",
                "Iodoethane (C2H5I)",
                "Fluoroethane (C2H5F)",
                "1,1-Dichloroethane (CH3CHCl2)",
                "1,2-Dichloroethane (CH2ClCH2Cl)",
                "1,1,1,2-Tetrachloroethane (CHCl2CHCl2)",
                "Bromoform (CHBr3)",
                "Iodoform (CHI3)",
                "Chlorofluoromethane (CH2ClF)",
                "Dichlorodifluoromethane (CCl2F2)",
                "Trichlorofluoromethane (CCl3F)",
                "Tetrachlorofluoroethane (C2Cl4F2)",
                "Vinylidene chloride (C2H2Cl2)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluorocarbons",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Trihalomethanes",
                "Vinyl Chloride"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Bromoform (CHBr3)",
            "Iodoform (CHI3)",
            "Carbon tetrachloride (CCl4)",
            "Methylene chloride (CH2Cl2)",
            "Ethyl bromide (CH3CH2Br)",
            "Propyl iodide (CH3CH2CH2I)",
            "Butyl fluoride (CH3CH2CH2CH2F)",
            "Pentyl chloride (CH3CH2CH2CH2CH2Cl)",
            "Hexyl bromide (CH3CH2CH2CH2CH2CH2Br)",
            "Ethylene dichloride (CH2ClCH2Cl)",
            "Vinyl bromide (CH2=CHBr)",
            "Allyl iodide (CH2=CHCH2I)",
            "Propargyl fluoride (HC\u2261CCH2F)",
            "Benzyl chloride (C6H5CH2Cl)",
            "Benzal chloride (C6H5CHCl2)",
            "Benzotrichloride (C6H5CCl3)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "Fluorobenzene (C6H5F)",
            "Dichlorobenzene (C6H4Cl2)",
            "Tribromobenzene (C6H3Br3)",
            "Tetrafluorobenzene (C6H2F4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Methylene chloride (CH2Cl2)",
                "Ethylene dichloride (CH2ClCH2Cl)",
                "Chlorobenzene (C6H5Cl)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)",
                "Fluorobenzene (C6H5F)"
            ],
            "mismatches": [
                "Bromoform (CHBr3)",
                "Iodoform (CHI3)",
                "Ethyl bromide (CH3CH2Br)",
                "Propyl iodide (CH3CH2CH2I)",
                "Butyl fluoride (CH3CH2CH2CH2F)",
                "Pentyl chloride (CH3CH2CH2CH2CH2Cl)",
                "Hexyl bromide (CH3CH2CH2CH2CH2CH2Br)",
                "Vinyl bromide (CH2=CHBr)",
                "Allyl iodide (CH2=CHCH2I)",
                "Propargyl fluoride (HC\u2261CCH2F)",
                "Benzyl chloride (C6H5CH2Cl)",
                "Benzal chloride (C6H5CHCl2)",
                "Benzotrichloride (C6H5CCl3)",
                "Dichlorobenzene (C6H4Cl2)",
                "Tribromobenzene (C6H3Br3)",
                "Tetrafluorobenzene (C6H2F4)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Ethylene Dichlorides",
                "Fluoroacetates",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Bromomethane (CH3Br)",
            "Chloroethane (CH3CH2Cl)",
            "Bromoethane (CH3CH2Br)",
            "Chloropropane (CH3CH2CH2Cl)",
            "Bromopropane (CH3CH2CH2Br)",
            "Chlorobutane (CH3CH2CH2CH2Cl)",
            "Bromobutane (CH3CH2CH2CH2Br)",
            "Chloropentane (CH3CH2CH2CH2CH2Cl)",
            "Bromopentane (CH3CH2CH2CH2CH2Br)",
            "Chlorohexane (CH3CH2CH2CH2CH2CH2Cl)",
            "Bromohexane (CH3CH2CH2CH2CH2CH2Br)",
            "Chloroheptane (CH3CH2CH2CH2CH2CH2CH2Cl)",
            "Bromohexane (CH3CH2CH2CH2CH2CH2CH2Br)",
            "Chlorooctane (CH3CH2CH2CH2CH2CH2CH2CH2Cl)",
            "Bromooctane (CH3CH2CH2CH2CH2CH2CH2CH2Br)",
            "Chlorodecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
            "Bromodecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2Br)",
            "Chlorododecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
            "Bromododecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)",
            "Chlorotetradecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
            "Bromotetradecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)",
            "Chlorohexadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
            "Bromohexadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)",
            "Chlorooctadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
            "Bromooctadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Bromomethane (CH3Br)",
                "Chloroethane (CH3CH2Cl)",
                "Bromoethane (CH3CH2Br)",
                "Chloropropane (CH3CH2CH2Cl)",
                "Bromopropane (CH3CH2CH2Br)",
                "Chlorobutane (CH3CH2CH2CH2Cl)",
                "Bromobutane (CH3CH2CH2CH2Br)",
                "Chloropentane (CH3CH2CH2CH2CH2Cl)",
                "Bromopentane (CH3CH2CH2CH2CH2Br)",
                "Chlorohexane (CH3CH2CH2CH2CH2CH2Cl)",
                "Bromohexane (CH3CH2CH2CH2CH2CH2Br)",
                "Chloroheptane (CH3CH2CH2CH2CH2CH2CH2Cl)",
                "Bromohexane (CH3CH2CH2CH2CH2CH2CH2Br)",
                "Chlorooctane (CH3CH2CH2CH2CH2CH2CH2CH2Cl)",
                "Bromooctane (CH3CH2CH2CH2CH2CH2CH2CH2Br)",
                "Chlorodecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
                "Bromodecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2Br)",
                "Chlorododecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
                "Bromododecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)",
                "Chlorotetradecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
                "Bromotetradecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)",
                "Chlorohexadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
                "Bromohexadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)",
                "Chlorooctadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Cl)",
                "Bromooctadecane (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2Br)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Dichloroacetic Acid",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Brominated",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene"
            ],
            "TP": 0,
            "FP": 26,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Methyl iodide (CH3I)",
            "Bromoform (CHBr3)",
            "Iodoform (CHI3)",
            "1,1,1-Trichloroethane (CH3CHCl3)",
            "1,1,2-Trichloroethane (CHCl2CH2Cl)",
            "1,1-Dichloroethane (CH3CHCl2)",
            "1,2-Dichloroethane (CH2ClCH2Cl)",
            "Vinyl chloride (CH2=CHCl)",
            "Trichloroethylene (ClCH=CCl2)",
            "Tetrachloroethylene (Cl2C=CCl2)",
            "1,1,1,2-Tetrachloroethane (CHCl2CHCl2)",
            "Dichloromethane (CH2Cl2)",
            "Chlorobenzene (C6H5Cl)",
            "1,2-Dichlorobenzene (C6H4Cl2)",
            "1,4-Dichlorobenzene (C6H4Cl2)",
            "Hexachlorobenzene (C6Cl6)",
            "Pentachlorobenzene (C6HCl5)",
            "1,2,4-Trichlorobenzene (C6H3Cl3)",
            "1,2,3-Trichlorobenzene (C6H3Cl3)",
            "2,4,6-Trichlorophenol (C6H2Cl3O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Vinyl chloride (CH2=CHCl)",
                "Trichloroethylene (ClCH=CCl2)",
                "Tetrachloroethylene (Cl2C=CCl2)",
                "Dichloromethane (CH2Cl2)",
                "Chlorobenzene (C6H5Cl)",
                "Hexachlorobenzene (C6Cl6)"
            ],
            "mismatches": [
                "Methyl iodide (CH3I)",
                "Bromoform (CHBr3)",
                "Iodoform (CHI3)",
                "1,1,1-Trichloroethane (CH3CHCl3)",
                "1,1,2-Trichloroethane (CHCl2CH2Cl)",
                "1,1-Dichloroethane (CH3CHCl2)",
                "1,2-Dichloroethane (CH2ClCH2Cl)",
                "1,1,1,2-Tetrachloroethane (CHCl2CHCl2)",
                "1,2-Dichlorobenzene (C6H4Cl2)",
                "1,4-Dichlorobenzene (C6H4Cl2)",
                "Pentachlorobenzene (C6HCl5)",
                "1,2,4-Trichlorobenzene (C6H3Cl3)",
                "1,2,3-Trichlorobenzene (C6H3Cl3)",
                "2,4,6-Trichlorophenol (C6H2Cl3O)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Iodinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Vinyl Chloride"
            ],
            "TP": 8,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            [
                "Canonical name",
                "Ethyl chloride"
            ],
            [
                "Canonical name",
                "Chloroethane"
            ],
            [
                "Canonical name",
                "Dichloroethane"
            ],
            [
                "Canonical name",
                "Trichloroethane"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ethyl chloride"
            ],
            "mismatches": [
                "Chloroethane",
                "Dichloroethane",
                "Trichloroethane"
            ],
            "true_referents": [
                "Dichlorodiphenyl Dichloroethylene",
                "Ethyl Chloride",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene"
            ],
            "TP": 1,
            "FP": 3,
            "FN": 0
        }
    }
]