[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Bromoform (CHBr3)",
            "Carbon tetrachloride (CCl4)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Methylene chloride (CH2Cl2)",
            "Dibromomethane (CH2Br2)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "Hexachlorobenzene (C6Cl6)",
            "Perchloroethylene (C2Cl4)",
            "1,2-Dibromoethane (C2H4Br2)",
            "Hexachlorocyclohexane (C6H6Cl6)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "1,1-Dichloroethane (C2H4Cl2)",
            "1,1,2-Trichloroethane (C2H3Cl3)",
            "1,2-Dichloropropane (C3H6Cl2)",
            "1,1-Dichloropropene (C3H4Cl2)",
            "1,1,1-Trichloro-2-propanol (C3H6Cl3O)",
            "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
            "1,2-Dichloro-1,1,2-trifluoroethane (C2H2Cl2F2)",
            "1,1-Dichloro-2,2,2-trifluoroethane (C2H2Cl2F3)",
            "1,1,2-Trichloro-1,2,2-trifluoroethane (C2H2Cl3F2)",
            "1,1-Dichloro-1-fluoroethane (C2H4Cl2F)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Methylene chloride (CH2Cl2)",
                "Hexachlorobenzene (C6Cl6)",
                "Hexachlorocyclohexane (C6H6Cl6)"
            ],
            "mismatches": [
                "Bromoform (CHBr3)",
                "Dichloromethane (CH2Cl2)",
                "Dibromomethane (CH2Br2)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "Perchloroethylene (C2Cl4)",
                "1,2-Dibromoethane (C2H4Br2)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "1,1-Dichloroethane (C2H4Cl2)",
                "1,1,2-Trichloroethane (C2H3Cl3)",
                "1,2-Dichloropropane (C3H6Cl2)",
                "1,1-Dichloropropene (C3H4Cl2)",
                "1,1,1-Trichloro-2-propanol (C3H6Cl3O)",
                "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
                "1,2-Dichloro-1,1,2-trifluoroethane (C2H2Cl2F2)",
                "1,1-Dichloro-2,2,2-trifluoroethane (C2H2Cl2F3)",
                "1,1,2-Trichloro-1,2,2-trifluoroethane (C2H2Cl3F2)",
                "1,1-Dichloro-1-fluoroethane (C2H4Cl2F)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon Tetrachloride (CCl4)",
            "Bromochloromethane (CH2BrCl)",
            "1,2-Dibromoethane (C2H4Br2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Bromodichloromethane (CHBrCl2)",
            "Dichloromethane (CH2Cl2)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "Chlorobenzene (C6H5Cl)",
            "Hexachlorobenzene (C6Cl6)",
            "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
            "1,2-Dichloropropane (C3H6Cl2)",
            "Chloroform (CHCl3)",
            "Chlorodifluoromethane (CHClF2)",
            "Chloroform (CHCl3)",
            "Bromoform (CHBr3)",
            "Carbon Tetrabromide (CBr4)",
            "1-Bromo-2-chloroethane (C2H4BrCl)",
            "1,1,2-Trichloro-1,2,2-trifluoroethane (C2HCl3F3)",
            "Chloroethane (C2H5Cl)",
            "Bromofluoromethane (CH2BrF)",
            "1,2-Dichloro-1,1,2,2-tetrafluoroethane (C2Cl2F4)",
            "Chloropentafluoroethane (C2ClF5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon Tetrachloride (CCl4)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Hexachlorobenzene (C6Cl6)"
            ],
            "mismatches": [
                "Bromochloromethane (CH2BrCl)",
                "1,2-Dibromoethane (C2H4Br2)",
                "Bromodichloromethane (CHBrCl2)",
                "Dichloromethane (CH2Cl2)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "Chlorobenzene (C6H5Cl)",
                "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
                "1,2-Dichloropropane (C3H6Cl2)",
                "Chlorodifluoromethane (CHClF2)",
                "Bromoform (CHBr3)",
                "Carbon Tetrabromide (CBr4)",
                "1-Bromo-2-chloroethane (C2H4BrCl)",
                "1,1,2-Trichloro-1,2,2-trifluoroethane (C2HCl3F3)",
                "Chloroethane (C2H5Cl)",
                "Bromofluoromethane (CH2BrF)",
                "1,2-Dichloro-1,1,2,2-tetrafluoroethane (C2Cl2F4)",
                "Chloropentafluoroethane (C2ClF5)"
            ],
            "true_referents": [
                "Bromochlorofluorocarbons",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Methyl Chloride",
                "Methylene Chloride",
                "Polybrominated Biphenyls",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid"
            ],
            "TP": 5,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon Tetrachloride (CCl4)",
            "Dichloromethane (DCM)",
            "Trichloroethylene (TCE)",
            "Perchloroethylene (PCE)",
            "Freon-12 (CCl2F2)",
            "Freon-11 (CCl3F)",
            "Freon-22 (CHClF2)",
            "Chlorobenzene (C6H5Cl)",
            "Dichlorobenzene (DCB)",
            "Trichlorobenzene (TCB)",
            "1,2-Dichloroethane (DCE)",
            "1,1,1-Trichloroethane (TCA)",
            "Hexachlorobenzene (HCB)",
            "Dichlorodifluoromethane (CCl2F2)",
            "Chloroprene (2-Chloro-1,3-butadiene)",
            "Vinyl Chloride (VC)",
            "Bromochloromethane (CH2BrCl)",
            "Dibromochloromethane (CHBr2Cl)",
            "Chloropicrin (CCl3NO2)",
            "1,1,2-Trichloro-1,2,2-trifluoroethane (CFC-113)",
            "Bromotrifluoromethane (CF3Br)",
            "Hexachlorobutadiene (HCBD)",
            "1,1,2,2-Tetrachloroethane (TCE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon Tetrachloride (CCl4)",
                "Trichloroethylene (TCE)",
                "Hexachlorobenzene (HCB)",
                "Vinyl Chloride (VC)"
            ],
            "mismatches": [
                "Dichloromethane (DCM)",
                "Perchloroethylene (PCE)",
                "Freon-12 (CCl2F2)",
                "Freon-11 (CCl3F)",
                "Freon-22 (CHClF2)",
                "Chlorobenzene (C6H5Cl)",
                "Dichlorobenzene (DCB)",
                "Trichlorobenzene (TCB)",
                "1,2-Dichloroethane (DCE)",
                "1,1,1-Trichloroethane (TCA)",
                "Dichlorodifluoromethane (CCl2F2)",
                "Chloroprene (2-Chloro-1,3-butadiene)",
                "Bromochloromethane (CH2BrCl)",
                "Dibromochloromethane (CHBr2Cl)",
                "Chloropicrin (CCl3NO2)",
                "1,1,2-Trichloro-1,2,2-trifluoroethane (CFC-113)",
                "Bromotrifluoromethane (CF3Br)",
                "Hexachlorobutadiene (HCBD)",
                "1,1,2,2-Tetrachloroethane (TCE)"
            ],
            "true_referents": [
                "Bromochlorofluorocarbons",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Dinitrochlorobenzene",
                "Heptachlor",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Methyl Chloride",
                "Methylene Chloride",
                "Polychlorinated Biphenyls",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloromethane (CH3Cl)",
            "Dichloromethane (CH2Cl2)",
            "Chloroform (CHCl3)",
            "Carbon Tetrachloride (CCl4)",
            "1,1-Dichloroethane (1,1-DCE)",
            "1,2-Dichloroethane (1,2-DCE)",
            "Trichloroethane (TCE)",
            "Tetrachloroethylene (PCE)",
            "Vinyl Chloride (VC)",
            "Fluoromethane (CH3F)",
            "Difluoromethane (CH2F2)",
            "Trifluoromethane (CHF3)",
            "Bromomethane (CH3Br)",
            "1,2-Dibromoethane (EDB)",
            "Iodomethane (CH3I)",
            "2-Chloropropane (Isopropyl Chloride)",
            "2-Bromopropane (Isopropyl Bromide)",
            "Hexachloroethane (C2Cl6)",
            "Pentachloroethane (C2HCl5)",
            "1,1,1-Trichloroethane (Methyl Chloroform)",
            "Freon-11 (Trichlorofluoromethane, CFCl3)",
            "Freon-12 (Dichlorodifluoromethane, CF2Cl2)",
            "Halothane (2-Bromo-2-chloro-1,1,1-trifluoroethane)",
            "Sevoflurane (1,1,1,3,3,3-Hexafluoro-2-(fluoromethoxy)propane)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon Tetrachloride (CCl4)",
                "Tetrachloroethylene (PCE)",
                "Vinyl Chloride (VC)",
                "Halothane (2-Bromo-2-chloro-1,1,1-trifluoroethane)",
                "Sevoflurane (1,1,1,3,3,3-Hexafluoro-2-(fluoromethoxy)propane)"
            ],
            "mismatches": [
                "Chloromethane (CH3Cl)",
                "Dichloromethane (CH2Cl2)",
                "1,1-Dichloroethane (1,1-DCE)",
                "1,2-Dichloroethane (1,2-DCE)",
                "Trichloroethane (TCE)",
                "Fluoromethane (CH3F)",
                "Difluoromethane (CH2F2)",
                "Trifluoromethane (CHF3)",
                "Bromomethane (CH3Br)",
                "1,2-Dibromoethane (EDB)",
                "Iodomethane (CH3I)",
                "2-Chloropropane (Isopropyl Chloride)",
                "2-Bromopropane (Isopropyl Bromide)",
                "Hexachloroethane (C2Cl6)",
                "Pentachloroethane (C2HCl5)",
                "1,1,1-Trichloroethane (Methyl Chloroform)",
                "Freon-11 (Trichlorofluoromethane, CFCl3)",
                "Freon-12 (Dichlorodifluoromethane, CF2Cl2)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Desflurane",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Fluorocarbons",
                "Halothane",
                "Hexachlorobenzene",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Sevoflurane",
                "Tetrachloroethylene",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Chlorobenzene (C6H5Cl)",
            "Bromoform (CHBr3)",
            "Dibromomethane (CH2Br2)",
            "Bromochloromethane (CH2BrCl)",
            "1,2-Dibromoethane (C2H4Br2)",
            "Ethyl bromide (C2H5Br)",
            "Iodoform (CHI3)",
            "Methyl iodide (CH3I)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "Hexachlorobenzene (C6Cl6)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "Chlorodifluoromethane (CHClF2)",
            "Chlorotrifluoromethane (CClF3)",
            "Bromodichloromethane (CHBrCl2)",
            "1,2-Dichloropropane (C3H6Cl2)",
            "Chloromethane (CH3Cl)",
            "1,1-Dichloroethene (C2H2Cl2)",
            "Vinyl chloride (C2H3Cl)",
            "1,1,2-Trichloroethane (C2H3Cl3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Dichloromethane (CH2Cl2)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Hexachlorobenzene (C6Cl6)",
                "Vinyl chloride (C2H3Cl)"
            ],
            "mismatches": [
                "Chlorobenzene (C6H5Cl)",
                "Bromoform (CHBr3)",
                "Dibromomethane (CH2Br2)",
                "Bromochloromethane (CH2BrCl)",
                "1,2-Dibromoethane (C2H4Br2)",
                "Ethyl bromide (C2H5Br)",
                "Iodoform (CHI3)",
                "Methyl iodide (CH3I)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "Chlorodifluoromethane (CHClF2)",
                "Chlorotrifluoromethane (CClF3)",
                "Bromodichloromethane (CHBrCl2)",
                "1,2-Dichloropropane (C3H6Cl2)",
                "Chloromethane (CH3Cl)",
                "1,1-Dichloroethene (C2H2Cl2)",
                "1,1,2-Trichloroethane (C2H3Cl3)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Iodinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Dichloromethane (DCM)",
            "Trichloroethylene (TCE)",
            "Tetrachloroethylene (PERC)",
            "Bromoform (CHBr3)",
            "Iodoform (CHI3)",
            "1,1,1-Trichloroethane (TCA)",
            "1,2-Dichloroethane (EDC)",
            "Vinyl chloride (C2H3Cl)",
            "Benzyl chloride (C7H7Cl)",
            "Hexachlorobenzene (HCB)",
            "Polychlorinated biphenyls (PCBs)",
            "1,1-Dichloroethylene (DCE)",
            "Perfluorooctanoic acid (PFOA)",
            "Chlorobenzene (C6H5Cl)",
            "Fluorobenzene (C6H5F)",
            "2-Bromopropane (C3H7Br)",
            "1-Bromo-2-propanol (C3H7BrO)",
            "Ethylene dibromide (EDB)",
            "1,2,3-Trichloropropane (TCP)",
            "Decabromodiphenyl ether (DBDE)",
            "Tris(1-chloro-2-propyl) phosphate (TCPP)",
            "Chlorinated paraffins",
            "Dibromochloropropane (DBCP)",
            "Perfluorooctanesulfonic acid (PFOS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform",
                "Trichloroethylene",
                "Tetrachloroethylene",
                "Vinyl Chloride",
                "Hexachlorobenzene",
                "Polychlorinated Biphenyls",
                "Chlorobenzene",
                "Fluorobenzene",
                "Ethylene Dibromide"
            ],
            "mismatches": [
                "Dichloromethane (DCM)",
                "Bromoform (CHBr3)",
                "Iodoform (CHI3)",
                "1,1,1-Trichloroethane (TCA)",
                "1,2-Dichloroethane (EDC)",
                "Benzyl chloride (C7H7Cl)",
                "1,1-Dichloroethylene (DCE)",
                "Perfluorooctanoic acid (PFOA)",
                "2-Bromopropane (C3H7Br)",
                "1-Bromo-2-propanol (C3H7BrO)",
                "1,2,3-Trichloropropane (TCP)",
                "Decabromodiphenyl ether (DBDE)",
                "Tris(1-chloro-2-propyl) phosphate (TCPP)",
                "Chlorinated paraffins",
                "Dibromochloropropane (DBCP)",
                "Perfluorooctanesulfonic acid (PFOS)"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Dichloroethylenes",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Ethylene Dichlorides",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Chlorinated",
                "Hydrocarbons, Fluorinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methylene Chloride",
                "Polybrominated Biphenyls",
                "Polychlorinated Biphenyls",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroepoxypropane",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 9,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Dichloromethane (CH2Cl2)",
            "Tetrachloromethane (CCl4)",
            "Trichloroethene (C2HCl3)",
            "Perfluorooctanoic acid (PFOA)",
            "Polytetrafluoroethylene (PTFE)",
            "Hexafluoropropylene (C3F6)",
            "Bromodichloromethane (CHCl2Br)",
            "Chlorodifluoromethane (CHClF2)",
            "Trichlorofluoromethane (CCl3F)",
            "Dichlorodifluoromethane (CCl2F2)",
            "Bromotrifluoromethane (CBrF3)",
            "Chloropentafluoroethane (C2ClF5)",
            "Dichlorotetrafluoroethane (C2Cl2F4)",
            "Trichlorotrifluoroethane (C2Cl3F3)",
            "Bromochlorodifluoromethane (CClBrF2)",
            "Dibromotetrafluoroethane (C2Br2F4)",
            "Bromofluorocarbon (CBrF3)",
            "Chlorofluorocarbon (CFC)",
            "Hydrochlorofluorocarbon (HCFC)",
            "Hydrofluorocarbon (HFC)",
            "Perfluorocarbon (PFC)",
            "Bromofluorocarbons (Halons)",
            "Polychlorinated biphenyls (PCBs)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Tetrachloromethane (CCl4)",
                "Trichloroethene (C2HCl3)",
                "Polychlorinated biphenyls (PCBs)"
            ],
            "mismatches": [
                "Dichloromethane (CH2Cl2)",
                "Perfluorooctanoic acid (PFOA)",
                "Polytetrafluoroethylene (PTFE)",
                "Hexafluoropropylene (C3F6)",
                "Bromodichloromethane (CHCl2Br)",
                "Chlorodifluoromethane (CHClF2)",
                "Trichlorofluoromethane (CCl3F)",
                "Dichlorodifluoromethane (CCl2F2)",
                "Bromotrifluoromethane (CBrF3)",
                "Chloropentafluoroethane (C2ClF5)",
                "Dichlorotetrafluoroethane (C2Cl2F4)",
                "Trichlorotrifluoroethane (C2Cl3F3)",
                "Bromochlorodifluoromethane (CClBrF2)",
                "Dibromotetrafluoroethane (C2Br2F4)",
                "Bromofluorocarbon (CBrF3)",
                "Chlorofluorocarbon (CFC)",
                "Hydrochlorofluorocarbon (HCFC)",
                "Hydrofluorocarbon (HFC)",
                "Perfluorocarbon (PFC)",
                "Bromofluorocarbons (Halons)"
            ],
            "true_referents": [
                "Bromochlorofluorocarbons",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chlorofluorocarbons, Methane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Fluorocarbon Polymers",
                "Fluorocarbons",
                "Hydrocarbons, Chlorinated",
                "Hydrocarbons, Fluorinated",
                "Methyl Chloride",
                "Methylene Chloride",
                "Polybrominated Biphenyls",
                "Polychlorinated Biphenyls",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Trihalomethanes",
                "Vinyl Chloride"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Bromobenzene (C6H5Br)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Iodoform (CHI3)",
            "Dibromomethane (CH2Br2)",
            "Chlorobenzene (C6H5Cl)",
            "Fluoromethane (CH3F)",
            "Bromochloromethane (CH2BrCl)",
            "Trifluoromethane (CHF3)",
            "Tetrachloromethane (CCl4)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "1,1,1-Trichloroethane (C2H3Cl3)",
            "1,1-Dichloroethene (C2H2Cl2)",
            "1,2-Dibromoethane (C2H4Br2)",
            "1,1-Dichloroethane (C2H4Cl2)",
            "1,2-Dichloropropane (C3H6Cl2)",
            "1,1,2-Trichloroethane (C2H3Cl3)",
            "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
            "1,2-Dichlorobenzene (C6H4Cl2)",
            "1,4-Dichlorobenzene (C6H4Cl2)",
            "1,3-Dichlorobenzene (C6H4Cl2)",
            "1,2,3-Trichlorobenzene (C6H3Cl3)",
            "1,2,4-Trichlorobenzene (C6H3Cl3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Bromobenzene (C6H5Br)",
                "Trichloroethylene (C2HCl3)",
                "Chlorobenzene (C6H5Cl)",
                "1,1,1-Trichloroethane (C2H3Cl3)",
                "1,1,2-Trichloroethane (C2H3Cl3)"
            ],
            "mismatches": [
                "Dichloromethane (CH2Cl2)",
                "Iodoform (CHI3)",
                "Dibromomethane (CH2Br2)",
                "Fluoromethane (CH3F)",
                "Bromochloromethane (CH2BrCl)",
                "Trifluoromethane (CHF3)",
                "Tetrachloromethane (CCl4)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "1,1-Dichloroethene (C2H2Cl2)",
                "1,2-Dibromoethane (C2H4Br2)",
                "1,1-Dichloroethane (C2H4Cl2)",
                "1,2-Dichloropropane (C3H6Cl2)",
                "1,1,2,2-Tetrachloroethane (C2H2Cl4)",
                "1,2-Dichlorobenzene (C6H4Cl2)",
                "1,4-Dichlorobenzene (C6H4Cl2)",
                "1,3-Dichlorobenzene (C6H4Cl2)",
                "1,2,3-Trichlorobenzene (C6H3Cl3)",
                "1,2,4-Trichlorobenzene (C6H3Cl3)"
            ],
            "true_referents": [
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Fluorocarbons",
                "Hexachlorobenzene",
                "Hydrocarbons, Fluorinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl\u2083)",
            "Carbon Tetrachloride (CCl\u2084)",
            "Dichloromethane (CH\u2082Cl\u2082)",
            "Trichlorofluoromethane (CFC-11)",
            "Dichlorodifluoromethane (CFC-12)",
            "Monochlorotrifluoromethane (CFC-13)",
            "Vinyl Chloride (C\u2082H\u2083Cl)",
            "Polyvinyl Chloride (PVC)",
            "Methyl Bromide (CH\u2083Br)",
            "Iodoform (CHI\u2083)",
            "Bromobenzene (C\u2086H\u2085Br)",
            "Fluorobenzene (C\u2086H\u2085F)",
            "Tetrafluoroethylene (C\u2082F\u2084)",
            "Perfluorooctane (C\u2088F\u2081\u2088)",
            "Dichlorodiphenyltrichloroethane (DDT)",
            "Pentachlorophenol (C\u2086Cl\u2085OH)",
            "Trichloroethylene (C\u2082HCl\u2083)",
            "1,2-Dichloroethane (C\u2082H\u2084Cl\u2082)",
            "Chlorobenzene (C\u2086H\u2085Cl)",
            "Chloroprocaine",
            "Dichlorvos (2,2-Dichlorovinyl Dimethyl Phosphate)",
            "Perfluoro-2,3-dimethylbutane (FC-72)",
            "Bromoform (CHBr\u2083)",
            "Halothane (C\u2082HBrClF\u2083)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl\u2083)",
                "Carbon Tetrachloride (CCl\u2084)",
                "Vinyl Chloride (C\u2082H\u2083Cl)",
                "Bromobenzene (C\u2086H\u2085Br)",
                "Fluorobenzene (C\u2086H\u2085F)",
                "Dichlorodiphenyltrichloroethane (DDT)",
                "Trichloroethylene (C\u2082HCl\u2083)",
                "Chlorobenzene (C\u2086H\u2085Cl)",
                "Halothane (C\u2082HBrClF\u2083)"
            ],
            "mismatches": [
                "Dichloromethane (CH\u2082Cl\u2082)",
                "Trichlorofluoromethane (CFC-11)",
                "Dichlorodifluoromethane (CFC-12)",
                "Monochlorotrifluoromethane (CFC-13)",
                "Polyvinyl Chloride (PVC)",
                "Methyl Bromide (CH\u2083Br)",
                "Iodoform (CHI\u2083)",
                "Tetrafluoroethylene (C\u2082F\u2084)",
                "Perfluorooctane (C\u2088F\u2081\u2088)",
                "Pentachlorophenol (C\u2086Cl\u2085OH)",
                "1,2-Dichloroethane (C\u2082H\u2084Cl\u2082)",
                "Chloroprocaine",
                "Dichlorvos (2,2-Dichlorovinyl Dimethyl Phosphate)",
                "Perfluoro-2,3-dimethylbutane (FC-72)",
                "Bromoform (CHBr\u2083)"
            ],
            "true_referents": [
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "DDT",
                "Dichloroacetic Acid",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Dieldrin",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Fluorobenzenes",
                "Fluorocarbons",
                "Halothane",
                "Hexachlorobenzene",
                "Hydrocarbons, Fluorinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (TCE)",
            "Perchloroethylene (PCE)",
            "1,2-Dichloroethane (EDC)",
            "Vinyl chloride (VC)",
            "Methyl chloride (CH3Cl)",
            "Chlorobenzene",
            "Bromobenzene",
            "Iodobenzene",
            "Fluorobenzene",
            "1,1,1-Trichloroethane (TCA)",
            "Tetrachloroethane",
            "Hexachlorobenzene (HCB)",
            "Dichlorodifluoromethane (CFC-12)",
            "Trichlorofluoromethane (CFC-11)",
            "Bromochloromethane",
            "Bromoform (CHBr3)",
            "Iodoform (CHI3)",
            "1,2-Dibromoethane (EDB)",
            "Chloropicrin",
            "Hexachlorocyclohexane (HCH)",
            "Polychlorinated biphenyls (PCBs)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform",
                "Carbon Tetrachloride",
                "Trichloroethylene",
                "Vinyl Chloride",
                "Methyl Chloride",
                "Chlorobenzenes",
                "Bromobenzenes",
                "Iodobenzenes",
                "Fluorobenzenes",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Polychlorinated Biphenyls"
            ],
            "mismatches": [
                "Dichloromethane (CH2Cl2)",
                "Perchloroethylene (PCE)",
                "1,2-Dichloroethane (EDC)",
                "1,1,1-Trichloroethane (TCA)",
                "Tetrachloroethane",
                "Dichlorodifluoromethane (CFC-12)",
                "Trichlorofluoromethane (CFC-11)",
                "Bromochloromethane",
                "Bromoform (CHBr3)",
                "Iodoform (CHI3)",
                "Chloropicrin"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorambucil",
                "Chlorobenzenes",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Dinitrochlorobenzene",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Ethylene Dichlorides",
                "Fluorobenzenes",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Brominated",
                "Hydrocarbons, Chlorinated",
                "Hydrocarbons, Fluorinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iopanoic Acid",
                "Iophendylate",
                "Methoxychlor",
                "Methyl Chloride",
                "Methylene Chloride",
                "Polybrominated Biphenyls",
                "Polychlorinated Biphenyls",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 12,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Dichloromethane (CH2Cl2)",
            "Tetrachloroethylene (C2Cl4)",
            "Trichloroethylene (C2HCl3)",
            "1,2-Dichloroethane (C2H4Cl2)",
            "Vinyl chloride (C2H3Cl)",
            "1,1,1-Trichloroethane (CH3CCl3)",
            "Methyl chloride (CH3Cl)",
            "Methyl bromide (CH3Br)",
            "Methyl iodide (CH3I)",
            "Bromoform (CHBr3)",
            "Dibromomethane (CH2Br2)",
            "Iodoform (CHI3)",
            "Diiodomethane (CH2I2)",
            "1-Chlorobutane (C4H9Cl)",
            "2-Chlorobutane (C4H9Cl)",
            "1-Bromobutane (C4H9Br)",
            "2-Bromobutane (C4H9Br)",
            "1-Iodobutane (C4H9I)",
            "2-Iodobutane (C4H9I)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "1,2-Dichlorobenzene (C6H4Cl2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Trichloroethylene (C2HCl3)",
                "Vinyl chloride (C2H3Cl)",
                "Methyl chloride (CH3Cl)",
                "Chlorobenzene (C6H5Cl)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)"
            ],
            "mismatches": [
                "Dichloromethane (CH2Cl2)",
                "1,2-Dichloroethane (C2H4Cl2)",
                "1,1,1-Trichloroethane (CH3CCl3)",
                "Methyl bromide (CH3Br)",
                "Methyl iodide (CH3I)",
                "Bromoform (CHBr3)",
                "Dibromomethane (CH2Br2)",
                "Iodoform (CHI3)",
                "Diiodomethane (CH2I2)",
                "1-Chlorobutane (C4H9Cl)",
                "2-Chlorobutane (C4H9Cl)",
                "1-Bromobutane (C4H9Br)",
                "2-Bromobutane (C4H9Br)",
                "1-Iodobutane (C4H9I)",
                "2-Iodobutane (C4H9I)",
                "1,2-Dichlorobenzene (C6H4Cl2)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hydrocarbons, Iodinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Vinyl Chloride"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Vinyl chloride (C2H3Cl)",
            "Freon-11 (CFCl3)",
            "Freon-12 (CF2Cl2)",
            "Freon-113 (C2F3Cl3)",
            "Freon-114 (C2F4Cl2)",
            "Freon-115 (C2F5Cl)",
            "Methyl chloride (CH3Cl)",
            "Methyl bromide (CH3Br)",
            "Ethyl chloride (C2H5Cl)",
            "Allyl chloride (C3H5Cl)",
            "Benzyl chloride (C6H5CH2Cl)",
            "Chlorobenzene (C6H5Cl)",
            "Bromobenzene (C6H5Br)",
            "Iodobenzene (C6H5I)",
            "Dichlorobenzene (C6H4Cl2)",
            "Trichlorobenzene (C6H3Cl3)",
            "Hexachlorobenzene (C6Cl6)",
            "Lindane (C6H6Cl6)",
            "Bromoform (CHBr3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Trichloroethylene (C2HCl3)",
                "Tetrachloroethylene (C2Cl4)",
                "Vinyl chloride (C2H3Cl)",
                "Methyl chloride (CH3Cl)",
                "Ethyl chloride (C2H5Cl)",
                "Chlorobenzene (C6H5Cl)",
                "Bromobenzene (C6H5Br)",
                "Iodobenzene (C6H5I)",
                "Hexachlorobenzene (C6Cl6)"
            ],
            "mismatches": [
                "Dichloromethane (CH2Cl2)",
                "Freon-11 (CFCl3)",
                "Freon-12 (CF2Cl2)",
                "Freon-113 (C2F3Cl3)",
                "Freon-114 (C2F4Cl2)",
                "Freon-115 (C2F5Cl)",
                "Methyl bromide (CH3Br)",
                "Allyl chloride (C3H5Cl)",
                "Benzyl chloride (C6H5CH2Cl)",
                "Dichlorobenzene (C6H4Cl2)",
                "Trichlorobenzene (C6H3Cl3)",
                "Lindane (C6H6Cl6)",
                "Bromoform (CHBr3)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromobenzenes",
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chlorodiphenyl (54% Chlorine)",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Methyl Chloride",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid",
                "Vinyl Chloride"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methyl Chloride (CH3Cl)",
            "Ethyl Chloride (C2H5Cl)",
            "Propyl Chloride (C3H7Cl)",
            "Butyl Chloride (C4H9Cl)",
            "Chloroform (CHCl3)",
            "Carbon Tetrachloride (CCl4)",
            "Methyl Bromide (CH3Br)",
            "Ethyl Bromide (C2H5Br)",
            "Propyl Bromide (C3H7Br)",
            "Butyl Bromide (C4H9Br)",
            "Bromoform (CHBr3)",
            "Carbon Tetrabromide (CBr4)",
            "Methyl Iodide (CH3I)",
            "Ethyl Iodide (C2H5I)",
            "Propyl Iodide (C3H7I)",
            "Butyl Iodide (C4H9I)",
            "Iodoform (CHI3)",
            "Carbon Tetraiodide (CI4)",
            "Dichloromethane (CH2Cl2)",
            "Trichloroethylene (C2HCl3)",
            "Tetrachloroethylene (C2Cl4)",
            "Hexachloroethane (C2Cl6)",
            "Hexachlorobenzene (C6Cl6)",
            "Polychlorinated Biphenyls (PCBs)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methyl Chloride",
                "Ethyl Chloride",
                "Chloroform",
                "Carbon Tetrachloride",
                "Trichloroethylene",
                "Tetrachloroethylene",
                "Hexachlorobenzene",
                "Polychlorinated Biphenyls"
            ],
            "mismatches": [
                "Propyl Chloride",
                "Butyl Chloride",
                "Methyl Bromide",
                "Ethyl Bromide",
                "Propyl Bromide",
                "Butyl Bromide",
                "Bromoform",
                "Carbon Tetrabromide",
                "Methyl Iodide",
                "Ethyl Iodide",
                "Propyl Iodide",
                "Butyl Iodide",
                "Iodoform",
                "Carbon Tetraiodide",
                "Dichloromethane",
                "Hexachloroethane"
            ],
            "true_referents": [
                "Bromotrichloromethane",
                "Carbon Tetrachloride",
                "Chlorobenzenes",
                "Chloroform",
                "Dichlorodiphenyl Dichloroethylene",
                "Ethyl Chloride",
                "Ethylene Dibromide",
                "Hexachlorobenzene",
                "Hexachlorocyclohexane",
                "Hydrocarbons, Chlorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetates",
                "Iodoacetic Acid",
                "Iopanoic Acid",
                "Methyl Chloride",
                "Methylene Chloride",
                "Polybrominated Biphenyls",
                "Polychlorinated Biphenyls",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": "[\n\"Chloroform (CHCl3)\" ,\n\"Methoxychlor (MOX)\" ,\n\"Carbon tetrachloride (CCl4)\" ,\n\"Trichloroethylene (TCE)\" ,\n\"Perchloroethylene (PERC)\" ,\n\"1,2-Dichloroethane (EDC)\" ,\n\"Vinyl chloride (VCM)\" ,\n\"1,1,1-Trichloroethane (1,1,1-TCA)\" ,\n\"1,1-Dichloroethylene (1,1-DCE)\" ,\n\"1,2-Dichloropropane (1,2-DCP)\" ,\n\"Carbon disulfide (CS2)\" ,\n\"Chlorobenzene (CB)\" ,\n\"1,3-Dichlorobenzene (1,3-DCB)\" ,\n\"1,4-Dichlorobenzene (1,4-DCB)\" ,\n\"Hexachlorobenzene (HCB)\" ,\n\"Pentachlorophenol (PCP)\" ,\n\"Chlorpyrifos (CPF)\" ,\n\"Endosulfan (ES)\" ,\n\"Aldrin (ALD)\" ,\n\"Dieldrin (DLD)\" ,\n\"Endrin (END)\" ,\n\"Hexachlorocyclohexane (HCH)\" ,\n\"Chlordecone (Kepone)\" ,\n\"Bromodichloromethane (BDCM)\" ,\n\"Bromofluoromethane (BFM)\"",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Chloroform (CHCl3)",
            "Dichloromethane (DCM)",
            "Trichloroethylene (TCE)",
            "Tetrachloroethylene (PCE)",
            "1,1,1-Trichloroethane (TCA)",
            "1,1-Dichloroethane (DCA)",
            "1,2-Dichloroethane (DCA)",
            "Chlorodifluoromethane (HCFC-22)",
            "1,1-Difluoro-1,2,2-trichloroethane (HCFC-121)",
            "Dichlorofluoromethane (HCFC-12)",
            "Trifluoromethane (HFC-23)",
            "1,1,1,2-Tetrachloro-2,2-difluoroethane (HCFC-121a)",
            "Bromodichloromethane (CHBrCl2)",
            "Bromochlorodifluoromethane (Halon 1211)",
            "1,2-Dibromo-1,1,2,2-tetrachloroethane (DBTC)",
            "1,2-Dichloro-1,1,2,2-tetrafluoroethane (HCFC-124)",
            "1,1,2,2-Tetrachloro-1,2-difluoroethane (HCFC-124a)",
            "Iodoethane (C2H5I)",
            "Iodobenzene (C6H5I)",
            "1,4-Diiodobutane (C4H8I2)",
            "2,2,2-Trifluoroethyl iodide (C2H2F3I)",
            "2-Iodo-1,1,1-trifluoroethane (C2H2F3I)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloroform (CHCl3)",
                "Trichloroethylene (TCE)",
                "Tetrachloroethylene (PCE)",
                "Iodobenzene (C6H5I)"
            ],
            "mismatches": [
                "Dichloromethane (DCM)",
                "1,1,1-Trichloroethane (TCA)",
                "1,1-Dichloroethane (DCA)",
                "1,2-Dichloroethane (DCA)",
                "Chlorodifluoromethane (HCFC-22)",
                "1,1-Difluoro-1,2,2-trichloroethane (HCFC-121)",
                "Dichlorofluoromethane (HCFC-12)",
                "Trifluoromethane (HFC-23)",
                "1,1,1,2-Tetrachloro-2,2-difluoroethane (HCFC-121a)",
                "Bromodichloromethane (CHBrCl2)",
                "Bromochlorodifluoromethane (Halon 1211)",
                "1,2-Dibromo-1,1,2,2-tetrachloroethane (DBTC)",
                "1,2-Dichloro-1,1,2,2-tetrafluoroethane (HCFC-124)",
                "1,1,2,2-Tetrachloro-1,2-difluoroethane (HCFC-124a)",
                "Iodoethane (C2H5I)",
                "1,4-Diiodobutane (C4H8I2)",
                "2,2,2-Trifluoroethyl iodide (C2H2F3I)",
                "2-Iodo-1,1,1-trifluoroethane (C2H2F3I)"
            ],
            "true_referents": [
                "3-Iodobenzylguanidine",
                "Bromochlorofluorocarbons",
                "Chlorofluorocarbons",
                "Chlorofluorocarbons, Ethane",
                "Chloroform",
                "Dichloroacetic Acid",
                "Dichlorodiphenyl Dichloroethylene",
                "Dichlorodiphenyldichloroethane",
                "Ethylene Dibromide",
                "Fluorocarbons",
                "Hydrocarbons, Fluorinated",
                "Hydrocarbons, Iodinated",
                "Iodoacetic Acid",
                "Iodobenzenes",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroacetic Acid",
                "Trichloroethanes",
                "Trichloroethylene",
                "Trifluoroacetic Acid"
            ],
            "TP": 4,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "halogenated hydrocarbon",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Chloroform",
                "Canonical Name": "(CHCl3)2"
            },
            {
                "Referent": "Dichloromethane",
                "Canonical Name": "(CH2Cl2)2"
            },
            {
                "Referent": "Trichloroethane",
                "Canonical Name": "(CHClCH3)2"
            },
            {
                "Referent": "Tetrachloroethene",
                "Canonical Name": "(CH2Cl2)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,2,2-Tetrachloroethane",
                "Canonical Name": "(CH2Cl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            },
            {
                "Referent": "1,2-Dichloropropane",
                "Canonical Name": "(CH3CHCl2)2"
            },
            {
                "Referent": "1,1,1-Trichloroethane",
                "Canonical Name": "(CH2ClCH3)2"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Trichloroethane"
            ],
            "mismatches": [
                "Chloroform",
                "Dichloromethane",
                "Tetrachloroethene",
                "1,2-Dichloropropane",
                "1,1,2,2-Tetrachloroethane"
            ],
            "true_referents": [
                "Chlorofluorocarbons, Ethane",
                "Chlorofluorocarbons, Methane",
                "Dichlorodiphenyl Dichloroethylene",
                "Methylene Chloride",
                "Tetrachloroethylene",
                "Trichloroethanes",
                "Trichloroethylene"
            ],
            "TP": 1,
            "FP": 5,
            "FN": 0
        }
    }
]