[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetonitrile (ACN)",
            "Dimethyl sulfoxide (DMSO)",
            "Dimethylformamide (DMF)",
            "Hexamethylphosphoramide (HMPA)",
            "Methyl ethyl ketone (MEK)",
            "Nitromethane",
            "N,N-Dimethylacetamide (DMA)",
            "Tetrahydrofuran (THF)",
            "Acetone",
            "Pyridine",
            "Ethyl acetate",
            "Toluene",
            "Benzene",
            "Chloroform",
            "1,4-Dioxane",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Methylene chloride (Dichloromethane)",
            "Acetic acid",
            "Propylene carbonate",
            "Phosphoric acid",
            "Urea",
            "Glycerol",
            "Formamide",
            "Sulfolane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetonitrile (ACN)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Hexamethylphosphoramide (HMPA)",
                "Methyl ethyl ketone (MEK)",
                "Nitromethane",
                "N,N-Dimethylacetamide (DMA)",
                "Tetrahydrofuran (THF)",
                "Acetone",
                "Pyridine",
                "Ethyl acetate",
                "Toluene",
                "Benzene",
                "Chloroform",
                "1,4-Dioxane",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Methylene chloride (Dichloromethane)",
                "Acetic acid",
                "Propylene carbonate",
                "Phosphoric acid",
                "Urea",
                "Glycerol",
                "Formamide",
                "Sulfolane"
            ],
            "mismatches": [],
            "true_referents": [
                "1,4-Dioxane",
                "Acetic acid",
                "Acetone",
                "Acetonitrile (ACN)",
                "Benzene",
                "Chloroform",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate",
                "Formamide",
                "Glycerol",
                "Hexamethylphosphoramide (HMPA)",
                "Methyl ethyl ketone (MEK)",
                "Methylene chloride (Dichloromethane)",
                "N,N-Dimethylacetamide (DMA)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitromethane",
                "Phosphoric acid",
                "Propylene carbonate",
                "Pyridine",
                "Sulfolane",
                "Tetrahydrofuran (THF)",
                "Toluene",
                "Urea"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetonitrile (MeCN)",
            "Dimethyl sulfoxide (DMSO)",
            "Dimethylformamide (DMF)",
            "Acetone (Me2CO)",
            "Nitromethane (CH3NO2)",
            "N,N-Dimethylacetamide (DMAc)",
            "Benzene (C6H6)",
            "Tetrahydrofuran (THF)",
            "Chloroform (CHCl3)",
            "Ethyl acetate (EtOAc)",
            "1,2-Dichloroethane (DCE)",
            "Chloroform-d (CDCl3)",
            "Acetonitrile-d3 (MeCN-d3)",
            "Dichloromethane (DCM)",
            "Methanol-d4 (MeOD4)",
            "Pyridine (C5H5N)",
            "1,1,2,2-Tetrachloroethane (TCE)",
            "Toluene (C7H8)",
            "Dichloromethane-d2 (DCM-d2)",
            "Bromoform (CHBr3)",
            "Methyl tert-butyl ether (MTBE)",
            "Propionitrile (C2H5CN)",
            "Carbon disulfide (CS2)",
            "Trifluoroacetic acid (TFA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetonitrile (MeCN)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Acetone (Me2CO)",
                "Nitromethane (CH3NO2)",
                "N,N-Dimethylacetamide (DMAc)",
                "Benzene (C6H6)",
                "Tetrahydrofuran (THF)",
                "Chloroform (CHCl3)",
                "Ethyl acetate (EtOAc)",
                "1,2-Dichloroethane (DCE)",
                "Chloroform-d (CDCl3)",
                "Acetonitrile-d3 (MeCN-d3)",
                "Dichloromethane (DCM)",
                "Methanol-d4 (MeOD4)",
                "Pyridine (C5H5N)",
                "1,1,2,2-Tetrachloroethane (TCE)",
                "Toluene (C7H8)",
                "Dichloromethane-d2 (DCM-d2)",
                "Bromoform (CHBr3)",
                "Methyl tert-butyl ether (MTBE)",
                "Propionitrile (C2H5CN)",
                "Carbon disulfide (CS2)",
                "Trifluoroacetic acid (TFA)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1,2,2-Tetrachloroethane (TCE)",
                "1,2-Dichloroethane (DCE)",
                "Acetone (Me2CO)",
                "Acetonitrile (MeCN)",
                "Acetonitrile-d3 (MeCN-d3)",
                "Benzene (C6H6)",
                "Bromoform (CHBr3)",
                "Carbon disulfide (CS2)",
                "Chloroform (CHCl3)",
                "Chloroform-d (CDCl3)",
                "Dichloromethane (DCM)",
                "Dichloromethane-d2 (DCM-d2)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Methanol-d4 (MeOD4)",
                "Methyl tert-butyl ether (MTBE)",
                "N,N-Dimethylacetamide (DMAc)",
                "Nitromethane (CH3NO2)",
                "Propionitrile (C2H5CN)",
                "Pyridine (C5H5N)",
                "Tetrahydrofuran (THF)",
                "Toluene (C7H8)",
                "Trifluoroacetic acid (TFA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetonitrile (MeCN)",
            "Benzene",
            "Carbon tetrachloride (CCl4)",
            "Chloroform (CHCl3)",
            "Cyclohexane",
            "Dichloromethane (DCM)",
            "Diethyl ether",
            "Dimethyl sulfoxide (DMSO)",
            "Ethyl acetate",
            "Hexane",
            "Methylene chloride",
            "N,N-Dimethylformamide (DMF)",
            "N,N-Dimethylacetamide (DMA)",
            "Nitrobenzene",
            "Petroleum ether",
            "Tetrahydrofuran (THF)",
            "Toluene",
            "1,4-Dioxane",
            "1,2-Dichloroethane",
            "1,2-Dimethoxyethane (DME)",
            "Carbon disulfide (CS2)",
            "Chloroethylene",
            "Ethylene glycol dimethyl ether (DME)",
            "Hexamethylphosphoramide (HMPA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetonitrile (MeCN)",
                "Benzene",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Diethyl ether",
                "Dimethyl sulfoxide (DMSO)",
                "Ethyl acetate",
                "Hexane",
                "Methylene chloride",
                "N,N-Dimethylformamide (DMF)",
                "N,N-Dimethylacetamide (DMA)",
                "Nitrobenzene",
                "Petroleum ether",
                "Tetrahydrofuran (THF)",
                "Toluene",
                "1,4-Dioxane",
                "1,2-Dichloroethane",
                "1,2-Dimethoxyethane (DME)",
                "Carbon disulfide (CS2)",
                "Chloroethylene",
                "Ethylene glycol dimethyl ether (DME)",
                "Hexamethylphosphoramide (HMPA)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2-Dichloroethane",
                "1,2-Dimethoxyethane (DME)",
                "1,4-Dioxane",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Carbon disulfide (CS2)",
                "Carbon tetrachloride (CCl4)",
                "Chloroethylene",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Diethyl ether",
                "Dimethyl sulfoxide (DMSO)",
                "Ethyl acetate",
                "Ethylene glycol dimethyl ether (DME)",
                "Hexamethylphosphoramide (HMPA)",
                "Hexane",
                "Methylene chloride",
                "N,N-Dimethylacetamide (DMA)",
                "N,N-Dimethylformamide (DMF)",
                "Nitrobenzene",
                "Petroleum ether",
                "Tetrahydrofuran (THF)",
                "Toluene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfoxide (DMSO)",
            "Dimethylformamide (DMF)",
            "Acetonitrile (MeCN)",
            "Acetone (Ace)",
            "Dichloromethane (DCM)",
            "Chloroform (CHCl3)",
            "Tetrahydrofuran (THF)",
            "Diethyl ether (Et2O)",
            "Ethyl acetate (EtOAc)",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Hexane (Hex)",
            "Toluene (Tol)",
            "Benzene (Bz)",
            "Carbon disulfide (CS2)",
            "1,4-Dioxane (Diox)",
            "Propylene carbonate (PC)",
            "Sulfolane (Sulf)",
            "Dimethylacetamide (DMAc)",
            "N,N-Dimethylpropyleneurea (DMPU)",
            "Formamide (HCONH2)",
            "Nitrobenzene (PhNO2)",
            "Cyclopentyl methyl ether (CPME)",
            "2-Methyltetrahydrofuran (2-MeTHF)",
            "Dichloromethane-d2 (CDCl2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Acetonitrile (MeCN)",
                "Acetone (Ace)",
                "Dichloromethane (DCM)",
                "Chloroform (CHCl3)",
                "Tetrahydrofuran (THF)",
                "Diethyl ether (Et2O)",
                "Ethyl acetate (EtOAc)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Hexane (Hex)",
                "Toluene (Tol)",
                "Benzene (Bz)",
                "Carbon disulfide (CS2)",
                "1,4-Dioxane (Diox)",
                "Propylene carbonate (PC)",
                "Sulfolane (Sulf)",
                "Dimethylacetamide (DMAc)",
                "N,N-Dimethylpropyleneurea (DMPU)",
                "Formamide (HCONH2)",
                "Nitrobenzene (PhNO2)",
                "Cyclopentyl methyl ether (CPME)",
                "2-Methyltetrahydrofuran (2-MeTHF)",
                "Dichloromethane-d2 (CDCl2)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,4-Dioxane (Diox)",
                "2-Methyltetrahydrofuran (2-MeTHF)",
                "Acetone (Ace)",
                "Acetonitrile (MeCN)",
                "Benzene (Bz)",
                "Carbon disulfide (CS2)",
                "Chloroform (CHCl3)",
                "Cyclopentyl methyl ether (CPME)",
                "Dichloromethane (DCM)",
                "Dichloromethane-d2 (CDCl2)",
                "Diethyl ether (Et2O)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMAc)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Formamide (HCONH2)",
                "Hexane (Hex)",
                "N,N-Dimethylpropyleneurea (DMPU)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitrobenzene (PhNO2)",
                "Propylene carbonate (PC)",
                "Sulfolane (Sulf)",
                "Tetrahydrofuran (THF)",
                "Toluene (Tol)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfoxide (DMSO)",
            "Acetonitrile (MeCN)",
            "N,N-Dimethylformamide (DMF)",
            "Tetrahydrofuran (THF)",
            "Dichloromethane (DCM)",
            "Acetone",
            "Benzene",
            "Carbon tetrachloride (CCl4)",
            "Chloroform (CHCl3)",
            "Ethyl acetate (EtOAc)",
            "Hexane",
            "Cyclohexane",
            "Diethyl ether",
            "Toluene",
            "Pyridine",
            "Nitromethane",
            "1,4-Dioxane",
            "Tetrachloroethylene",
            "Trichloroethylene",
            "Dimethyl carbonate (DMC)",
            "Ethylene carbonate",
            "Propylene carbonate",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Sulfolane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfoxide (DMSO)",
                "Acetonitrile (MeCN)",
                "N,N-Dimethylformamide (DMF)",
                "Tetrahydrofuran (THF)",
                "Dichloromethane (DCM)",
                "Acetone",
                "Benzene",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Ethyl acetate (EtOAc)",
                "Hexane",
                "Cyclohexane",
                "Diethyl ether",
                "Toluene",
                "Pyridine",
                "Nitromethane",
                "1,4-Dioxane",
                "Tetrachloroethylene",
                "Trichloroethylene",
                "Dimethyl carbonate (DMC)",
                "Ethylene carbonate",
                "Propylene carbonate",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Sulfolane"
            ],
            "mismatches": [],
            "true_referents": [
                "1,4-Dioxane",
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Diethyl ether",
                "Dimethyl carbonate (DMC)",
                "Dimethyl sulfoxide (DMSO)",
                "Ethyl acetate (EtOAc)",
                "Ethylene carbonate",
                "Hexane",
                "N,N-Dimethylformamide (DMF)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitromethane",
                "Propylene carbonate",
                "Pyridine",
                "Sulfolane",
                "Tetrachloroethylene",
                "Tetrahydrofuran (THF)",
                "Toluene",
                "Trichloroethylene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfoxide (DMSO)",
            "Acetonitrile (MeCN)",
            "Tetrahydrofuran (THF)",
            "Dimethylformamide (DMF)",
            "Ethyl acetate (EtOAc)",
            "Benzene",
            "Cyclohexane",
            "Chloroform (CHCl3)",
            "Dichloromethane (DCM)",
            "Hexane",
            "Toluene",
            "Carbon disulfide (CS2)",
            "Nitrobenzene",
            "1,4-Dioxane",
            "Acetone",
            "Propylene carbonate",
            "Sulfolane",
            "1,2-Dichloroethane",
            "Decalin",
            "Perfluorohexane",
            "Benzonitrile",
            "N-Methylpyrrolidone (NMP)",
            "1,3-Dimethyl-2-imidazolidinone (DMI)",
            "2-Methyl-THF"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfoxide (DMSO)",
                "Acetonitrile (MeCN)",
                "Tetrahydrofuran (THF)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Benzene",
                "Cyclohexane",
                "Chloroform (CHCl3)",
                "Dichloromethane (DCM)",
                "Hexane",
                "Toluene",
                "Carbon disulfide (CS2)",
                "Nitrobenzene",
                "1,4-Dioxane",
                "Acetone",
                "Propylene carbonate",
                "Sulfolane",
                "1,2-Dichloroethane",
                "Decalin",
                "Perfluorohexane",
                "Benzonitrile",
                "N-Methylpyrrolidone (NMP)",
                "1,3-Dimethyl-2-imidazolidinone (DMI)",
                "2-Methyl-THF"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2-Dichloroethane",
                "1,3-Dimethyl-2-imidazolidinone (DMI)",
                "1,4-Dioxane",
                "2-Methyl-THF",
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Benzonitrile",
                "Carbon disulfide (CS2)",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Decalin",
                "Dichloromethane (DCM)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Hexane",
                "N-Methylpyrrolidone (NMP)",
                "Nitrobenzene",
                "Perfluorohexane",
                "Propylene carbonate",
                "Sulfolane",
                "Tetrahydrofuran (THF)",
                "Toluene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetone (DMK)",
            "Dimethyl sulfoxide (DMSO)",
            "Acetonitrile (MeCN)",
            "Benzene (C6H6)",
            "Toluene (C7H8)",
            "Chlorobenzene (C6H5Cl)",
            "Dichloromethane (DCM)",
            "Tetrahydrofuran (THF)",
            "1,2-Dichloroethane (DCE)",
            "1,4-Dioxane (p-dioxane)",
            "Ethyl acetate (EtOAc)",
            "Methylene chloride (MC)",
            "Nitromethane (NM)",
            "Propylene carbonate (PC)",
            "Pyridine (C5H5N)",
            "Sulfolane (tetramethylene sulfone)",
            "Dimethylformamide (DMF)",
            "Hexamethylphosphoramide (HMPA)",
            "Dimethylacetamide (DMA)",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Cyclohexanone (CH)",
            "Carbon tetrachloride (CCl4)",
            "1,2-Dichlorobenzene (o-DCB)",
            "Trichloroethylene (TCE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (DMK)",
                "Dimethyl sulfoxide (DMSO)",
                "Acetonitrile (MeCN)",
                "Benzene (C6H6)",
                "Toluene (C7H8)",
                "Chlorobenzene (C6H5Cl)",
                "Dichloromethane (DCM)",
                "Tetrahydrofuran (THF)",
                "1,2-Dichloroethane (DCE)",
                "1,4-Dioxane (p-dioxane)",
                "Ethyl acetate (EtOAc)",
                "Methylene chloride (MC)",
                "Nitromethane (NM)",
                "Propylene carbonate (PC)",
                "Pyridine (C5H5N)",
                "Sulfolane (tetramethylene sulfone)",
                "Dimethylformamide (DMF)",
                "Hexamethylphosphoramide (HMPA)",
                "Dimethylacetamide (DMA)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Cyclohexanone (CH)",
                "Carbon tetrachloride (CCl4)",
                "1,2-Dichlorobenzene (o-DCB)",
                "Trichloroethylene (TCE)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2-Dichlorobenzene (o-DCB)",
                "1,2-Dichloroethane (DCE)",
                "1,4-Dioxane (p-dioxane)",
                "Acetone (DMK)",
                "Acetonitrile (MeCN)",
                "Benzene (C6H6)",
                "Carbon tetrachloride (CCl4)",
                "Chlorobenzene (C6H5Cl)",
                "Cyclohexanone (CH)",
                "Dichloromethane (DCM)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMA)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Hexamethylphosphoramide (HMPA)",
                "Methylene chloride (MC)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitromethane (NM)",
                "Propylene carbonate (PC)",
                "Pyridine (C5H5N)",
                "Sulfolane (tetramethylene sulfone)",
                "Tetrahydrofuran (THF)",
                "Toluene (C7H8)",
                "Trichloroethylene (TCE)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfoxide (DMSO)",
            "Acetone",
            "Acetonitrile",
            "Diethyl ether",
            "Hexane",
            "Toluene",
            "Chloroform",
            "Carbon disulfide",
            "Methylene chloride",
            "Dichloromethane",
            "1,4-Dioxane",
            "N,N-Dimethylformamide (DMF)",
            "N,N-Dimethylacetamide (DMA)",
            "Ethyl acetate",
            "Methyl tert-butyl ether (MTBE)",
            "Tetrahydrofuran (THF)",
            "Pentane",
            "Cyclohexane",
            "Benzene",
            "Diisopropyl ether",
            "Dichloroethylene",
            "Nitromethane",
            "Propylene carbonate",
            "Dibutyl ether"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfoxide (DMSO)",
                "Acetone",
                "Acetonitrile",
                "Diethyl ether",
                "Hexane",
                "Toluene",
                "Chloroform",
                "Carbon disulfide",
                "Methylene chloride",
                "Dichloromethane",
                "1,4-Dioxane",
                "N,N-Dimethylformamide (DMF)",
                "N,N-Dimethylacetamide (DMA)",
                "Ethyl acetate",
                "Methyl tert-butyl ether (MTBE)",
                "Tetrahydrofuran (THF)",
                "Pentane",
                "Cyclohexane",
                "Benzene",
                "Diisopropyl ether",
                "Dichloroethylene",
                "Nitromethane",
                "Propylene carbonate",
                "Dibutyl ether"
            ],
            "mismatches": [],
            "true_referents": [
                "1,4-Dioxane",
                "Acetone",
                "Acetonitrile",
                "Benzene",
                "Carbon disulfide",
                "Chloroform",
                "Cyclohexane",
                "Dibutyl ether",
                "Dichloroethylene",
                "Dichloromethane",
                "Diethyl ether",
                "Diisopropyl ether",
                "Dimethyl sulfoxide (DMSO)",
                "Ethyl acetate",
                "Hexane",
                "Methyl tert-butyl ether (MTBE)",
                "Methylene chloride",
                "N,N-Dimethylacetamide (DMA)",
                "N,N-Dimethylformamide (DMF)",
                "Nitromethane",
                "Pentane",
                "Propylene carbonate",
                "Tetrahydrofuran (THF)",
                "Toluene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfoxide (DMSO)",
            "N,N-Dimethylformamide (DMF)",
            "Acetonitrile (MeCN)",
            "Tetrahydrofuran (THF)",
            "Dichloromethane (DCM)",
            "Hexamethylphosphoramide (HMPA)",
            "Dimethylacetamide (DMA)",
            "1,2-Dimethoxyethane (DME)",
            "Sulfolane",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Methyl tert-butyl ether (MTBE)",
            "Chlorobenzene",
            "Benzonitrile",
            "Carbon tetrachloride (CCl\u2084)",
            "Nitrobenzene",
            "Methyl ethyl ketone (MEK)",
            "Propylene carbonate",
            "Dimethyl sulfone (DMSO\u2082)",
            "Trifluorotoluene",
            "Acetone",
            "1,4-Dioxane",
            "Fluoroform",
            "Triglyme",
            "Phosphoramide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfoxide (DMSO)",
                "N,N-Dimethylformamide (DMF)",
                "Acetonitrile (MeCN)",
                "Tetrahydrofuran (THF)",
                "Dichloromethane (DCM)",
                "Hexamethylphosphoramide (HMPA)",
                "Dimethylacetamide (DMA)",
                "1,2-Dimethoxyethane (DME)",
                "Sulfolane",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Methyl tert-butyl ether (MTBE)",
                "Chlorobenzene",
                "Benzonitrile",
                "Carbon tetrachloride (CCl\u2084)",
                "Nitrobenzene",
                "Methyl ethyl ketone (MEK)",
                "Propylene carbonate",
                "Dimethyl sulfone (DMSO\u2082)",
                "Trifluorotoluene",
                "Acetone",
                "1,4-Dioxane",
                "Fluoroform",
                "Triglyme",
                "Phosphoramide"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2-Dimethoxyethane (DME)",
                "1,4-Dioxane",
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzonitrile",
                "Carbon tetrachloride (CCl\u2084)",
                "Chlorobenzene",
                "Dichloromethane (DCM)",
                "Dimethyl sulfone (DMSO\u2082)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMA)",
                "Fluoroform",
                "Hexamethylphosphoramide (HMPA)",
                "Methyl ethyl ketone (MEK)",
                "Methyl tert-butyl ether (MTBE)",
                "N,N-Dimethylformamide (DMF)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitrobenzene",
                "Phosphoramide",
                "Propylene carbonate",
                "Sulfolane",
                "Tetrahydrofuran (THF)",
                "Trifluorotoluene",
                "Triglyme"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetone (Me2CO)",
            "Acetonitrile (MeCN)",
            "Dimethyl sulfoxide (DMSO)",
            "N,N-Dimethylformamide (DMF)",
            "Tetrahydrofuran (THF)",
            "1,4-Dioxane",
            "Diethyl ether (Et2O)",
            "Ethyl acetate (EtOAc)",
            "Dichloromethane (DCM)",
            "Chloroform (CHCl3)",
            "Carbon tetrachloride (CCl4)",
            "Hexane",
            "Toluene",
            "Benzene",
            "Diglyme",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Dimethylacetamide (DMAc)",
            "Propylene carbonate",
            "Nitromethane",
            "Hexamethylphosphoramide (HMPA)",
            "1,2-Dichloroethane (DCE)",
            "Pyridine",
            "Dimethyl carbonate (DMC)",
            "Sulfolane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone (Me2CO)",
                "Acetonitrile (MeCN)",
                "Dimethyl sulfoxide (DMSO)",
                "N,N-Dimethylformamide (DMF)",
                "Tetrahydrofuran (THF)",
                "1,4-Dioxane",
                "Diethyl ether (Et2O)",
                "Ethyl acetate (EtOAc)",
                "Dichloromethane (DCM)",
                "Chloroform (CHCl3)",
                "Carbon tetrachloride (CCl4)",
                "Hexane",
                "Toluene",
                "Benzene",
                "Diglyme",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Dimethylacetamide (DMAc)",
                "Propylene carbonate",
                "Nitromethane",
                "Hexamethylphosphoramide (HMPA)",
                "1,2-Dichloroethane (DCE)",
                "Pyridine",
                "Dimethyl carbonate (DMC)",
                "Sulfolane"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2-Dichloroethane (DCE)",
                "1,4-Dioxane",
                "Acetone (Me2CO)",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Dichloromethane (DCM)",
                "Diethyl ether (Et2O)",
                "Diglyme",
                "Dimethyl carbonate (DMC)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMAc)",
                "Ethyl acetate (EtOAc)",
                "Hexamethylphosphoramide (HMPA)",
                "Hexane",
                "N,N-Dimethylformamide (DMF)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitromethane",
                "Propylene carbonate",
                "Pyridine",
                "Sulfolane",
                "Tetrahydrofuran (THF)",
                "Toluene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetone",
            "Acetonitrile (MeCN)",
            "Benzene",
            "Chloroform (CHCl3)",
            "Cyclohexane",
            "Dichloromethane (DCM)",
            "Diethyl ether (Et2O)",
            "Dimethyl sulfoxide (DMSO)",
            "Dimethylacetamide (DMA)",
            "Dimethylformamide (DMF)",
            "1,4-Dioxane",
            "Ethyl acetate (EtOAc)",
            "n-Hexane",
            "Methyl tert-butyl ether (MTBE)",
            "Nitromethane",
            "Propylene carbonate (PC)",
            "Pyridine",
            "Tetrahydrofuran (THF)",
            "Toluene",
            "Triethylamine (TEA)",
            "Trifluoroacetic acid (TFA)",
            "2,2,2-Trifluoroethanol (TFE)",
            "Carbon tetrachloride (CCl4)",
            "tert-Butanol (t-BuOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Diethyl ether (Et2O)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMA)",
                "Dimethylformamide (DMF)",
                "1,4-Dioxane",
                "Ethyl acetate (EtOAc)",
                "n-Hexane",
                "Methyl tert-butyl ether (MTBE)",
                "Nitromethane",
                "Propylene carbonate (PC)",
                "Pyridine",
                "Tetrahydrofuran (THF)",
                "Toluene",
                "Triethylamine (TEA)",
                "Trifluoroacetic acid (TFA)",
                "2,2,2-Trifluoroethanol (TFE)",
                "Carbon tetrachloride (CCl4)",
                "tert-Butanol (t-BuOH)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,4-Dioxane",
                "2,2,2-Trifluoroethanol (TFE)",
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Diethyl ether (Et2O)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMA)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Methyl tert-butyl ether (MTBE)",
                "Nitromethane",
                "Propylene carbonate (PC)",
                "Pyridine",
                "Tetrahydrofuran (THF)",
                "Toluene",
                "Triethylamine (TEA)",
                "Trifluoroacetic acid (TFA)",
                "n-Hexane",
                "tert-Butanol (t-BuOH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Dimethyl sulfoxide (DMSO)",
            "N,N-Dimethylformamide (DMF)",
            "Acetonitrile (MeCN)",
            "Hexamethylphosphoramide (HMPA)",
            "N-Methylpyrrolidone (NMP)",
            "Sulfolane",
            "Dimethylacetamide (DMAc)",
            "Propylene carbonate",
            "Ethylene carbonate",
            "Dichloromethane (DCM)",
            "Chloroform (CHCl3)",
            "Tetrahydrofuran (THF)",
            "Diethyl ether",
            "Tert-butyl methyl ether (MTBE)",
            "Acetone",
            "Ethyl acetate",
            "Benzene",
            "Toluene",
            "Xylene",
            "Pyridine",
            "1,4-Dioxane",
            "Nitromethane",
            "Nitrobenzene",
            "Hexamethylphosphorictriamide (HMPT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dimethyl sulfoxide (DMSO)",
                "N,N-Dimethylformamide (DMF)",
                "Acetonitrile (MeCN)",
                "Hexamethylphosphoramide (HMPA)",
                "N-Methylpyrrolidone (NMP)",
                "Sulfolane",
                "Dimethylacetamide (DMAc)",
                "Propylene carbonate",
                "Ethylene carbonate",
                "Dichloromethane (DCM)",
                "Chloroform (CHCl3)",
                "Tetrahydrofuran (THF)",
                "Diethyl ether",
                "Tert-butyl methyl ether (MTBE)",
                "Acetone",
                "Ethyl acetate",
                "Benzene",
                "Toluene",
                "Xylene",
                "Pyridine",
                "1,4-Dioxane",
                "Nitromethane",
                "Nitrobenzene",
                "Hexamethylphosphorictriamide (HMPT)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,4-Dioxane",
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Chloroform (CHCl3)",
                "Dichloromethane (DCM)",
                "Diethyl ether",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylacetamide (DMAc)",
                "Ethyl acetate",
                "Ethylene carbonate",
                "Hexamethylphosphoramide (HMPA)",
                "Hexamethylphosphorictriamide (HMPT)",
                "N,N-Dimethylformamide (DMF)",
                "N-Methylpyrrolidone (NMP)",
                "Nitrobenzene",
                "Nitromethane",
                "Propylene carbonate",
                "Pyridine",
                "Sulfolane",
                "Tert-butyl methyl ether (MTBE)",
                "Tetrahydrofuran (THF)",
                "Toluene",
                "Xylene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Benzene (BEN)",
            "Toluene (TOL)",
            "Xylene (XYL)",
            "Chloroform (CHCl3)",
            "Carbon Tetrachloride (CCl4)",
            "Dichloromethane (CH2Cl2)",
            "Tetrachloroethylene (PCE)",
            "Hexane (HEX)",
            "Cyclohexane (CYC)",
            "Diethyl Ether (DEE)",
            "Tetrahydrofuran (THF)",
            "Dimethyl Sulfoxide (DMSO)",
            "N,N-Dimethylformamide (DMF)",
            "N-Methyl-2-pyrrolidone (NMP)",
            "Acetonitrile (ACN)",
            "Pyridine (PYR)",
            "Ethyl Acetate (EtOAc)",
            "Acetone (ACE)",
            "Dimethyl Carbonate (DMC)",
            "Propylene Carbonate (PC)",
            "Ethylene Carbonate (EC)",
            "Sulfolane (SFN)",
            "Nitromethane (NTM)",
            "Nitrobenzene (NTB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzene (BEN)",
                "Toluene (TOL)",
                "Xylene (XYL)",
                "Chloroform (CHCl3)",
                "Carbon Tetrachloride (CCl4)",
                "Dichloromethane (CH2Cl2)",
                "Tetrachloroethylene (PCE)",
                "Hexane (HEX)",
                "Cyclohexane (CYC)",
                "Diethyl Ether (DEE)",
                "Tetrahydrofuran (THF)",
                "Dimethyl Sulfoxide (DMSO)",
                "N,N-Dimethylformamide (DMF)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Acetonitrile (ACN)",
                "Pyridine (PYR)",
                "Ethyl Acetate (EtOAc)",
                "Acetone (ACE)",
                "Dimethyl Carbonate (DMC)",
                "Propylene Carbonate (PC)",
                "Ethylene Carbonate (EC)",
                "Sulfolane (SFN)",
                "Nitromethane (NTM)",
                "Nitrobenzene (NTB)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetone (ACE)",
                "Acetonitrile (ACN)",
                "Benzene (BEN)",
                "Carbon Tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Cyclohexane (CYC)",
                "Dichloromethane (CH2Cl2)",
                "Diethyl Ether (DEE)",
                "Dimethyl Carbonate (DMC)",
                "Dimethyl Sulfoxide (DMSO)",
                "Ethyl Acetate (EtOAc)",
                "Ethylene Carbonate (EC)",
                "Hexane (HEX)",
                "N,N-Dimethylformamide (DMF)",
                "N-Methyl-2-pyrrolidone (NMP)",
                "Nitrobenzene (NTB)",
                "Nitromethane (NTM)",
                "Propylene Carbonate (PC)",
                "Pyridine (PYR)",
                "Sulfolane (SFN)",
                "Tetrachloroethylene (PCE)",
                "Tetrahydrofuran (THF)",
                "Toluene (TOL)",
                "Xylene (XYL)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Acetonitrile (MeCN)",
            "Acetone",
            "Benzene",
            "Carbon disulfide (CS2)",
            "Carbon tetrachloride (CCl4)",
            "Chloroform (CHCl3)",
            "Cyclohexane",
            "Dichloromethane (DCM)",
            "Dimethylformamide (DMF)",
            "Dimethyl sulfoxide (DMSO)",
            "Ethyl acetate (EtOAc)",
            "Ethylene glycol",
            "Hexane",
            "Methylene chloride (CH2Cl2)",
            "Methyl tert-butyl ether (MTBE)",
            "N,N-Dimethylformamide (DMF)",
            "Nitromethane (CH3NO2)",
            "Pentane",
            "Pentyl acetate",
            "Toluene",
            "Triethylamine (TEA)",
            "Triphenylphosphine (PPh3)",
            "Xylene"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetonitrile (MeCN)",
                "Acetone",
                "Benzene",
                "Carbon disulfide (CS2)",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Dimethylformamide (DMF)",
                "Dimethyl sulfoxide (DMSO)",
                "Ethyl acetate (EtOAc)",
                "Ethylene glycol",
                "Hexane",
                "Methylene chloride (CH2Cl2)",
                "Methyl tert-butyl ether (MTBE)",
                "N,N-Dimethylformamide (DMF)",
                "Nitromethane (CH3NO2)",
                "Pentane",
                "Pentyl acetate",
                "Toluene",
                "Triethylamine (TEA)",
                "Triphenylphosphine (PPh3)",
                "Xylene"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetone",
                "Acetonitrile (MeCN)",
                "Benzene",
                "Carbon disulfide (CS2)",
                "Carbon tetrachloride (CCl4)",
                "Chloroform (CHCl3)",
                "Cyclohexane",
                "Dichloromethane (DCM)",
                "Dimethyl sulfoxide (DMSO)",
                "Dimethylformamide (DMF)",
                "Ethyl acetate (EtOAc)",
                "Ethylene glycol",
                "Hexane",
                "Methyl tert-butyl ether (MTBE)",
                "Methylene chloride (CH2Cl2)",
                "N,N-Dimethylformamide (DMF)",
                "Nitromethane (CH3NO2)",
                "Pentane",
                "Pentyl acetate",
                "Toluene",
                "Triethylamine (TEA)",
                "Triphenylphosphine (PPh3)",
                "Xylene"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            "Benzene (Bz)",
            "Toluene (Tol)",
            "Xylene (Xyl)",
            "Pentane (Pen)",
            "Hexane (Hex)",
            "Heptane (Hep)",
            "Cyclohexane (CyHex)",
            "Carbon tetrachloride (CTC)",
            "Dichloromethane (DCM)",
            "1,2-Dichloroethane (DCE)",
            "Chlorobenzene (ClBz)",
            "Chloroform (CHCl3)",
            "1,1,1-Trichloroethane (TCA)",
            "Acetone (Ac)",
            "Ethyl acetate (EtAc)",
            "Diethyl ether (Et2O)",
            "Tetrahydrofuran (THF)",
            "Dioxane (Diox)",
            "Benzonitrile (BzN)",
            "Acetonitrile (MeCN)",
            "Propionitrile (EtCN)",
            "Butyronitrile (BuCN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzene (Bz)",
                "Toluene (Tol)",
                "Xylene (Xyl)",
                "Pentane (Pen)",
                "Hexane (Hex)",
                "Heptane (Hep)",
                "Cyclohexane (CyHex)",
                "Carbon tetrachloride (CTC)",
                "Dichloromethane (DCM)",
                "1,2-Dichloroethane (DCE)",
                "Chlorobenzene (ClBz)",
                "Chloroform (CHCl3)",
                "1,1,1-Trichloroethane (TCA)",
                "Acetone (Ac)",
                "Ethyl acetate (EtAc)",
                "Diethyl ether (Et2O)",
                "Tetrahydrofuran (THF)",
                "Dioxane (Diox)",
                "Benzonitrile (BzN)",
                "Acetonitrile (MeCN)",
                "Propionitrile (EtCN)",
                "Butyronitrile (BuCN)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,1,1-Trichloroethane (TCA)",
                "1,2-Dichloroethane (DCE)",
                "Acetone (Ac)",
                "Acetonitrile (MeCN)",
                "Benzene (Bz)",
                "Benzonitrile (BzN)",
                "Butyronitrile (BuCN)",
                "Carbon tetrachloride (CTC)",
                "Chlorobenzene (ClBz)",
                "Chloroform (CHCl3)",
                "Cyclohexane (CyHex)",
                "Dichloromethane (DCM)",
                "Diethyl ether (Et2O)",
                "Dioxane (Diox)",
                "Ethyl acetate (EtAc)",
                "Heptane (Hep)",
                "Hexane (Hex)",
                "Pentane (Pen)",
                "Propionitrile (EtCN)",
                "Tetrahydrofuran (THF)",
                "Toluene (Tol)",
                "Xylene (Xyl)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "aprotic solvent",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Acetone",
                "Canonical Name": "Acetone"
            },
            {
                "Referent": "Diethyl ether",
                "Canonical Name": "Diethyl ether"
            },
            {
                "Referent": "Dimethyl sulfoxide",
                "Canonical Name": "Dimethyl sulfoxide"
            },
            {
                "Referent": "Dimethylformamide",
                "Canonical Name": "Dimethylformamide"
            },
            {
                "Referent": "DMSO",
                "Canonical Name": "Dimethyl sulfoxide"
            },
            {
                "Referent": "Ethanol",
                "Canonical Name": "Ethanol"
            },
            {
                "Referent": "Ethyl acetate",
                "Canonical Name": "Ethyl acetate"
            },
            {
                "Referent": "Ethyl ether",
                "Canonical Name": "Ethyl ether"
            },
            {
                "Referent": "Nitromethane",
                "Canonical Name": "Nitromethane"
            },
            {
                "Referent": "Tetrahydrofuran",
                "Canonical Name": "Tetrahydrofuran"
            },
            {
                "Referent": "Tetrahydropyran",
                "Canonical Name": "Tetrahydropyran"
            },
            {
                "Referent": "THF",
                "Canonical Name": "Tetrahydrofuran"
            },
            {
                "Referent": "THP",
                "Canonical Name": "Tetrahydropyran"
            },
            {
                "Referent": "Acetonitrile",
                "Canonical Name": "Acetonitrile"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic anhydride",
                "Canonical Name": "Acetic anhydride"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            },
            {
                "Referent": "Acetic acid",
                "Canonical Name": "Acetic acid"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetone",
                "Diethyl ether",
                "Dimethyl sulfoxide",
                "Dimethylformamide",
                "Ethanol",
                "Ethyl acetate",
                "Ethyl ether",
                "Nitromethane",
                "Tetrahydrofuran",
                "Tetrahydropyran",
                "Acetonitrile",
                "Acetic acid",
                "Acetic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Acetic acid\", \"Canonical Name\": \"Acetic acid\"}",
                "{\"Referent\": \"Acetic anhydride\", \"Canonical Name\": \"Acetic anhydride\"}",
                "{\"Referent\": \"Acetone\", \"Canonical Name\": \"Acetone\"}",
                "{\"Referent\": \"Acetonitrile\", \"Canonical Name\": \"Acetonitrile\"}",
                "{\"Referent\": \"DMSO\", \"Canonical Name\": \"Dimethyl sulfoxide\"}",
                "{\"Referent\": \"Diethyl ether\", \"Canonical Name\": \"Diethyl ether\"}",
                "{\"Referent\": \"Dimethyl sulfoxide\", \"Canonical Name\": \"Dimethyl sulfoxide\"}",
                "{\"Referent\": \"Dimethylformamide\", \"Canonical Name\": \"Dimethylformamide\"}",
                "{\"Referent\": \"Ethanol\", \"Canonical Name\": \"Ethanol\"}",
                "{\"Referent\": \"Ethyl acetate\", \"Canonical Name\": \"Ethyl acetate\"}",
                "{\"Referent\": \"Ethyl ether\", \"Canonical Name\": \"Ethyl ether\"}",
                "{\"Referent\": \"Nitromethane\", \"Canonical Name\": \"Nitromethane\"}",
                "{\"Referent\": \"THF\", \"Canonical Name\": \"Tetrahydrofuran\"}",
                "{\"Referent\": \"THP\", \"Canonical Name\": \"Tetrahydropyran\"}",
                "{\"Referent\": \"Tetrahydrofuran\", \"Canonical Name\": \"Tetrahydrofuran\"}",
                "{\"Referent\": \"Tetrahydropyran\", \"Canonical Name\": \"Tetrahydropyran\"}"
            ],
            "TP": 13,
            "FP": 0,
            "FN": 0
        }
    }
]