[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Propionyl chloride (PrCl)",
            "Butyryl chloride (BuCl)",
            "Valeryl chloride (VCl)",
            "Hexanoyl chloride (HxCl)",
            "Heptanoyl chloride (HepCl)",
            "Octanoyl chloride (OcCl)",
            "Nonanoyl chloride (NCl)",
            "Decanoyl chloride (DCl)",
            "Undecanoyl chloride (UDCl)",
            "Dodecanoyl chloride (DDCl)",
            "Tridecanoyl chloride (TDCl)",
            "Myristoyl chloride (MCl)",
            "Pentadecanoyl chloride (PDCl)",
            "Palmitoyl chloride (PalmCl)",
            "Stearoyl chloride (StCl)",
            "Oleoyl chloride (OCl)",
            "Linoleoyl chloride (LCl)",
            "Linolenoyl chloride (LNCl)",
            "Arachidoyl chloride (AChl)",
            "Behenoyl chloride (BChl)",
            "Lauric acid chloride (LAChl)",
            "Myristic acid chloride (MAChl)",
            "Palmitic acid chloride (PAAChl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Propionyl chloride (PrCl)",
                "Butyryl chloride (BuCl)",
                "Valeryl chloride (VCl)",
                "Hexanoyl chloride (HxCl)",
                "Heptanoyl chloride (HepCl)",
                "Octanoyl chloride (OcCl)",
                "Nonanoyl chloride (NCl)",
                "Decanoyl chloride (DCl)",
                "Undecanoyl chloride (UDCl)",
                "Dodecanoyl chloride (DDCl)",
                "Tridecanoyl chloride (TDCl)",
                "Myristoyl chloride (MCl)",
                "Pentadecanoyl chloride (PDCl)",
                "Palmitoyl chloride (PalmCl)",
                "Stearoyl chloride (StCl)",
                "Oleoyl chloride (OCl)",
                "Linoleoyl chloride (LCl)",
                "Linolenoyl chloride (LNCl)",
                "Arachidoyl chloride (AChl)",
                "Behenoyl chloride (BChl)",
                "Lauric acid chloride (LAChl)",
                "Myristic acid chloride (MAChl)",
                "Palmitic acid chloride (PAAChl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride (AcCl)",
                "Arachidoyl chloride (AChl)",
                "Behenoyl chloride (BChl)",
                "Butyryl chloride (BuCl)",
                "Decanoyl chloride (DCl)",
                "Dodecanoyl chloride (DDCl)",
                "Heptanoyl chloride (HepCl)",
                "Hexanoyl chloride (HxCl)",
                "Lauric acid chloride (LAChl)",
                "Linolenoyl chloride (LNCl)",
                "Linoleoyl chloride (LCl)",
                "Myristic acid chloride (MAChl)",
                "Myristoyl chloride (MCl)",
                "Nonanoyl chloride (NCl)",
                "Octanoyl chloride (OcCl)",
                "Oleoyl chloride (OCl)",
                "Palmitic acid chloride (PAAChl)",
                "Palmitoyl chloride (PalmCl)",
                "Pentadecanoyl chloride (PDCl)",
                "Propionyl chloride (PrCl)",
                "Stearoyl chloride (StCl)",
                "Tridecanoyl chloride (TDCl)",
                "Undecanoyl chloride (UDCl)",
                "Valeryl chloride (VCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Benzoyl chloride (C6H5COCl)",
            "Propionyl chloride (C2H5COCl)",
            "Butyryl chloride (C3H7COCl)",
            "Valeryl chloride (C4H9COCl)",
            "Formyl chloride (HCOCl)",
            "Acryloyl chloride (CH2=CHCOCl)",
            "Phenylacetyl chloride (C6H5CH2COCl)",
            "Hexanoyl chloride (C5H11COCl)",
            "Heptyl chloride (C6H13COCl)",
            "Octanoyl chloride (C7H15COCl)",
            "Nonanoyl chloride (C8H17COCl)",
            "Decanoyl chloride (C9H19COCl)",
            "Acetylbromide (CH3COBr)",
            "Benzoylbromide (C6H5COBr)",
            "Acetyl fluoride (CH3COF)",
            "Benzoyl fluoride (C6H5COF)",
            "Propionyl bromide (C2H5COBr)",
            "Butyryl bromide (C3H7COBr)",
            "Valeryl bromide (C4H9COBr)",
            "Phenylacetyl bromide (C6H5CH2COBr)",
            "Hexanoyl bromide (C5H11COBr)",
            "Heptyl fluoride (C6H13COF)",
            "Octanoyl fluoride (C7H15COF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Propionyl chloride (C2H5COCl)",
                "Butyryl chloride (C3H7COCl)",
                "Valeryl chloride (C4H9COCl)",
                "Formyl chloride (HCOCl)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Phenylacetyl chloride (C6H5CH2COCl)",
                "Hexanoyl chloride (C5H11COCl)",
                "Heptyl chloride (C6H13COCl)",
                "Octanoyl chloride (C7H15COCl)",
                "Nonanoyl chloride (C8H17COCl)",
                "Decanoyl chloride (C9H19COCl)",
                "Acetylbromide (CH3COBr)",
                "Benzoylbromide (C6H5COBr)",
                "Acetyl fluoride (CH3COF)",
                "Benzoyl fluoride (C6H5COF)",
                "Propionyl bromide (C2H5COBr)",
                "Butyryl bromide (C3H7COBr)",
                "Valeryl bromide (C4H9COBr)",
                "Phenylacetyl bromide (C6H5CH2COBr)",
                "Hexanoyl bromide (C5H11COBr)",
                "Heptyl fluoride (C6H13COF)",
                "Octanoyl fluoride (C7H15COF)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Acetyl fluoride (CH3COF)",
                "Acetylbromide (CH3COBr)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl fluoride (C6H5COF)",
                "Benzoylbromide (C6H5COBr)",
                "Butyryl bromide (C3H7COBr)",
                "Butyryl chloride (C3H7COCl)",
                "Decanoyl chloride (C9H19COCl)",
                "Formyl chloride (HCOCl)",
                "Heptyl chloride (C6H13COCl)",
                "Heptyl fluoride (C6H13COF)",
                "Hexanoyl bromide (C5H11COBr)",
                "Hexanoyl chloride (C5H11COCl)",
                "Nonanoyl chloride (C8H17COCl)",
                "Octanoyl chloride (C7H15COCl)",
                "Octanoyl fluoride (C7H15COF)",
                "Phenylacetyl bromide (C6H5CH2COBr)",
                "Phenylacetyl chloride (C6H5CH2COCl)",
                "Propionyl bromide (C2H5COBr)",
                "Propionyl chloride (C2H5COCl)",
                "Valeryl bromide (C4H9COBr)",
                "Valeryl chloride (C4H9COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl Chloride (CH3COCl)",
            "Benzoyl Chloride (C6H5COCl)",
            "Propionyl Chloride (C2H5COCl)",
            "Butyryl Chloride (C3H7COCl)",
            "Valeryl Chloride (C4H9COCl)",
            "Pivaloyl Chloride (C(CH3)3COCl)",
            "Hexanoyl Chloride (C5H11COCl)",
            "Heptanoyl Chloride (C6H13COCl)",
            "Octanoyl Chloride (C7H15COCl)",
            "Nonanoyl Chloride (C8H17COCl)",
            "Decanoyl Chloride (C9H19COCl)",
            "Lauroyl Chloride (C11H23COCl)",
            "Myrstoyl Chloride (C13H27COCl)",
            "Palmitoyl Chloride (C15H31COCl)",
            "Stearoyl Chloride (C17H35COCl)",
            "Acryloyl Chloride (CH2=CHCOCl)",
            "Methacryloyl Chloride (CH2=C(CH3)COCl)",
            "Cinnamoyl Chloride (C6H5CH=CHCOCl)",
            "Chloroacetyl Chloride (ClCH2COCl)",
            "Bromoacetyl Chloride (BrCH2COCl)",
            "Iodoacetyl Chloride (ICH2COCl)",
            "Fluoroacetyl Chloride (FCH2COCl)",
            "Dichloroacetyl Chloride (Cl2CHCOCl)",
            "Trichloroacetyl Chloride (CCl3COCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl Chloride (CH3COCl)",
                "Acryloyl Chloride (CH2=CHCOCl)",
                "Benzoyl Chloride (C6H5COCl)",
                "Bromoacetyl Chloride (BrCH2COCl)",
                "Butyryl Chloride (C3H7COCl)",
                "Chloroacetyl Chloride (ClCH2COCl)",
                "Cinnamoyl Chloride (C6H5CH=CHCOCl)",
                "Decanoyl Chloride (C9H19COCl)",
                "Dichloroacetyl Chloride (Cl2CHCOCl)",
                "Fluoroacetyl Chloride (FCH2COCl)",
                "Heptanoyl Chloride (C6H13COCl)",
                "Hexanoyl Chloride (C5H11COCl)",
                "Iodoacetyl Chloride (ICH2COCl)",
                "Lauroyl Chloride (C11H23COCl)",
                "Methacryloyl Chloride (CH2=C(CH3)COCl)",
                "Myrstoyl Chloride (C13H27COCl)",
                "Nonanoyl Chloride (C8H17COCl)",
                "Octanoyl Chloride (C7H15COCl)",
                "Palmitoyl Chloride (C15H31COCl)",
                "Pivaloyl Chloride (C(CH3)3COCl)",
                "Propionyl Chloride (C2H5COCl)",
                "Stearoyl Chloride (C17H35COCl)",
                "Trichloroacetyl Chloride (CCl3COCl)",
                "Valeryl Chloride (C4H9COCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl Chloride (CH3COCl)",
                "Acryloyl Chloride (CH2=CHCOCl)",
                "Benzoyl Chloride (C6H5COCl)",
                "Bromoacetyl Chloride (BrCH2COCl)",
                "Butyryl Chloride (C3H7COCl)",
                "Chloroacetyl Chloride (ClCH2COCl)",
                "Cinnamoyl Chloride (C6H5CH=CHCOCl)",
                "Decanoyl Chloride (C9H19COCl)",
                "Dichloroacetyl Chloride (Cl2CHCOCl)",
                "Fluoroacetyl Chloride (FCH2COCl)",
                "Heptanoyl Chloride (C6H13COCl)",
                "Hexanoyl Chloride (C5H11COCl)",
                "Iodoacetyl Chloride (ICH2COCl)",
                "Lauroyl Chloride (C11H23COCl)",
                "Methacryloyl Chloride (CH2=C(CH3)COCl)",
                "Myrstoyl Chloride (C13H27COCl)",
                "Nonanoyl Chloride (C8H17COCl)",
                "Octanoyl Chloride (C7H15COCl)",
                "Palmitoyl Chloride (C15H31COCl)",
                "Pivaloyl Chloride (C(CH3)3COCl)",
                "Propionyl Chloride (C2H5COCl)",
                "Stearoyl Chloride (C17H35COCl)",
                "Trichloroacetyl Chloride (CCl3COCl)",
                "Valeryl Chloride (C4H9COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Acetyl bromide (AcBr)",
            "Acetyl iodide (AcI)",
            "Benzoyl chloride (BzCl)",
            "Benzoyl bromide (BzBr)",
            "Propionyl chloride (PrCl)",
            "Propionyl bromide (PrBr)",
            "Butyryl chloride (BuCl)",
            "Butyryl bromide (BuBr)",
            "Isobutyryl chloride (iBuCl)",
            "Isobutyryl bromide (iBuBr)",
            "Valeryl chloride (VaCl)",
            "Valeryl bromide (VaBr)",
            "Formyl chloride (HCOCl)",
            "Formyl bromide (HCOBr)",
            "Succinyl chloride (SucCl)",
            "Succinyl bromide (SucBr)",
            "Adipoyl chloride (AdCl)",
            "Sebacoyl chloride (SebCl)",
            "Palmitoyl chloride (PaCl)",
            "Stearoyl chloride (StCl)",
            "Oleoyl chloride (OlCl)",
            "Linoleoyl chloride (LiCl)",
            "2-Chloropropionyl chloride (2-CPCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Acetyl bromide (AcBr)",
                "Acetyl iodide (AcI)",
                "Benzoyl chloride (BzCl)",
                "Benzoyl bromide (BzBr)",
                "Propionyl chloride (PrCl)",
                "Propionyl bromide (PrBr)",
                "Butyryl chloride (BuCl)",
                "Butyryl bromide (BuBr)",
                "Isobutyryl chloride (iBuCl)",
                "Isobutyryl bromide (iBuBr)",
                "Valeryl chloride (VaCl)",
                "Valeryl bromide (VaBr)",
                "Formyl chloride (HCOCl)",
                "Formyl bromide (HCOBr)",
                "Succinyl chloride (SucCl)",
                "Succinyl bromide (SucBr)",
                "Adipoyl chloride (AdCl)",
                "Sebacoyl chloride (SebCl)",
                "Palmitoyl chloride (PaCl)",
                "Stearoyl chloride (StCl)",
                "Oleoyl chloride (OlCl)",
                "Linoleoyl chloride (LiCl)",
                "2-Chloropropionyl chloride (2-CPCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Chloropropionyl chloride (2-CPCl)",
                "Acetyl bromide (AcBr)",
                "Acetyl chloride (AcCl)",
                "Acetyl iodide (AcI)",
                "Adipoyl chloride (AdCl)",
                "Benzoyl bromide (BzBr)",
                "Benzoyl chloride (BzCl)",
                "Butyryl bromide (BuBr)",
                "Butyryl chloride (BuCl)",
                "Formyl bromide (HCOBr)",
                "Formyl chloride (HCOCl)",
                "Isobutyryl bromide (iBuBr)",
                "Isobutyryl chloride (iBuCl)",
                "Linoleoyl chloride (LiCl)",
                "Oleoyl chloride (OlCl)",
                "Palmitoyl chloride (PaCl)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)",
                "Sebacoyl chloride (SebCl)",
                "Stearoyl chloride (StCl)",
                "Succinyl bromide (SucBr)",
                "Succinyl chloride (SucCl)",
                "Valeryl bromide (VaBr)",
                "Valeryl chloride (VaCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Benzoyl chloride (C6H5COCl)",
            "Propionyl chloride (C2H5COCl)",
            "Butyryl chloride (C3H7COCl)",
            "Valeryl chloride (C4H9COCl)",
            "Caproyl chloride (C5H11COCl)",
            "Lauryl chloride (C11H23COCl)",
            "Stearoyl chloride (C17H35COCl)",
            "Palmitoyl chloride (C15H31COCl)",
            "Myristoyl chloride (C13H27COCl)",
            "Acryloyl chloride (C3H3ClO)",
            "Methacryloyl chloride (C4H5ClO)",
            "Trifluoroacetyl chloride (CF3COCl)",
            "Chloroacetyl chloride (CH2ClCOCl)",
            "Bromoacetyl chloride (CH2BrCOCl)",
            "Iodoacetyl chloride (CH2ICoCl)",
            "Formyl chloride (HCOCl)",
            "Phenylacetyl chloride (C8H7ClO)",
            "Cyclohexanecarbonyl chloride (C7H11ClO)",
            "Pivaloyl chloride (C5H9ClO)",
            "Isobutyryl chloride (C4H7ClO)",
            "Isovaleryl chloride (C5H9ClO)",
            "Hexanoyl chloride (C6H11ClO)",
            "Octanoyl chloride (C8H15ClO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Acryloyl chloride (C3H3ClO)",
                "Benzoyl chloride (C6H5COCl)",
                "Bromoacetyl chloride (CH2BrCOCl)",
                "Butyryl chloride (C3H7COCl)",
                "Caproyl chloride (C5H11COCl)",
                "Chloroacetyl chloride (CH2ClCOCl)",
                "Cyclohexanecarbonyl chloride (C7H11ClO)",
                "Formyl chloride (HCOCl)",
                "Hexanoyl chloride (C6H11ClO)",
                "Iodoacetyl chloride (CH2ICoCl)",
                "Isobutyryl chloride (C4H7ClO)",
                "Isovaleryl chloride (C5H9ClO)",
                "Lauryl chloride (C11H23COCl)",
                "Methacryloyl chloride (C4H5ClO)",
                "Myristoyl chloride (C13H27COCl)",
                "Octanoyl chloride (C8H15ClO)",
                "Palmitoyl chloride (C15H31COCl)",
                "Phenylacetyl chloride (C8H7ClO)",
                "Pivaloyl chloride (C5H9ClO)",
                "Propionyl chloride (C2H5COCl)",
                "Stearoyl chloride (C17H35COCl)",
                "Trifluoroacetyl chloride (CF3COCl)",
                "Valeryl chloride (C4H9COCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Acryloyl chloride (C3H3ClO)",
                "Benzoyl chloride (C6H5COCl)",
                "Bromoacetyl chloride (CH2BrCOCl)",
                "Butyryl chloride (C3H7COCl)",
                "Caproyl chloride (C5H11COCl)",
                "Chloroacetyl chloride (CH2ClCOCl)",
                "Cyclohexanecarbonyl chloride (C7H11ClO)",
                "Formyl chloride (HCOCl)",
                "Hexanoyl chloride (C6H11ClO)",
                "Iodoacetyl chloride (CH2ICoCl)",
                "Isobutyryl chloride (C4H7ClO)",
                "Isovaleryl chloride (C5H9ClO)",
                "Lauryl chloride (C11H23COCl)",
                "Methacryloyl chloride (C4H5ClO)",
                "Myristoyl chloride (C13H27COCl)",
                "Octanoyl chloride (C8H15ClO)",
                "Palmitoyl chloride (C15H31COCl)",
                "Phenylacetyl chloride (C8H7ClO)",
                "Pivaloyl chloride (C5H9ClO)",
                "Propionyl chloride (C2H5COCl)",
                "Stearoyl chloride (C17H35COCl)",
                "Trifluoroacetyl chloride (CF3COCl)",
                "Valeryl chloride (C4H9COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (C2H3ClO)",
            "Benzoyl chloride (C7H5ClO)",
            "Propionyl chloride (C3H5ClO)",
            "Butyryl chloride (C4H7ClO)",
            "Valeryl chloride (C5H9ClO)",
            "Caproyl chloride (C6H11ClO)",
            "Heptanoyl chloride (C7H13ClO)",
            "Octanoyl chloride (C8H15ClO)",
            "Nonanoyl chloride (C9H17ClO)",
            "Decanoyl chloride (C10H19ClO)",
            "Lauryl chloride (C12H25ClO)",
            "Myristoyl chloride (C14H27ClO)",
            "Palmitoyl chloride (C16H31ClO)",
            "Stearoyl chloride (C18H35ClO)",
            "Cholesteryl chloride (C27H45ClO)",
            "2-Pyridinoyl chloride (C6H4ClN)",
            "3-Pyridinoyl chloride (C6H4ClN)",
            "4-Pyridinoyl chloride (C6H4ClN)",
            "Thioacetyl chloride (C2H3ClOS)",
            "Trifluoroacetyl chloride (C2ClF3O)",
            "Formyl chloride (C1HClO)",
            "Succinyl chloride (C4H4Cl2O2)",
            "Phthaloyl chloride (C8H4Cl2O3)",
            "Malonyl chloride (C3H3ClO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (C2H3ClO)",
                "Benzoyl chloride (C7H5ClO)",
                "Propionyl chloride (C3H5ClO)",
                "Butyryl chloride (C4H7ClO)",
                "Valeryl chloride (C5H9ClO)",
                "Caproyl chloride (C6H11ClO)",
                "Heptanoyl chloride (C7H13ClO)",
                "Octanoyl chloride (C8H15ClO)",
                "Nonanoyl chloride (C9H17ClO)",
                "Decanoyl chloride (C10H19ClO)",
                "Lauryl chloride (C12H25ClO)",
                "Myristoyl chloride (C14H27ClO)",
                "Palmitoyl chloride (C16H31ClO)",
                "Stearoyl chloride (C18H35ClO)",
                "Cholesteryl chloride (C27H45ClO)",
                "2-Pyridinoyl chloride (C6H4ClN)",
                "3-Pyridinoyl chloride (C6H4ClN)",
                "4-Pyridinoyl chloride (C6H4ClN)",
                "Thioacetyl chloride (C2H3ClOS)",
                "Trifluoroacetyl chloride (C2ClF3O)",
                "Formyl chloride (C1HClO)",
                "Succinyl chloride (C4H4Cl2O2)",
                "Phthaloyl chloride (C8H4Cl2O3)",
                "Malonyl chloride (C3H3ClO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Pyridinoyl chloride (C6H4ClN)",
                "3-Pyridinoyl chloride (C6H4ClN)",
                "4-Pyridinoyl chloride (C6H4ClN)",
                "Acetyl chloride (C2H3ClO)",
                "Benzoyl chloride (C7H5ClO)",
                "Butyryl chloride (C4H7ClO)",
                "Caproyl chloride (C6H11ClO)",
                "Cholesteryl chloride (C27H45ClO)",
                "Decanoyl chloride (C10H19ClO)",
                "Formyl chloride (C1HClO)",
                "Heptanoyl chloride (C7H13ClO)",
                "Lauryl chloride (C12H25ClO)",
                "Malonyl chloride (C3H3ClO2)",
                "Myristoyl chloride (C14H27ClO)",
                "Nonanoyl chloride (C9H17ClO)",
                "Octanoyl chloride (C8H15ClO)",
                "Palmitoyl chloride (C16H31ClO)",
                "Phthaloyl chloride (C8H4Cl2O3)",
                "Propionyl chloride (C3H5ClO)",
                "Stearoyl chloride (C18H35ClO)",
                "Succinyl chloride (C4H4Cl2O2)",
                "Thioacetyl chloride (C2H3ClOS)",
                "Trifluoroacetyl chloride (C2ClF3O)",
                "Valeryl chloride (C5H9ClO)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Benzoyl chloride (C6H5COCl)",
            "Propionyl chloride (CH3CH2COCl)",
            "Butyryl chloride (C4H7ClO)",
            "Pivaloyl chloride (C5H9ClO)",
            "Isobutyryl chloride (C4H7ClO)",
            "Valeryl chloride (C5H9ClO)",
            "Caprooyl chloride (C6H11ClO)",
            "Heptanoyl chloride (C7H13ClO)",
            "Octanoyl chloride (C8H15ClO)",
            "Nonanoyl chloride (C9H17ClO)",
            "Decanoyl chloride (C10H19ClO)",
            "Undecanoyl chloride (C11H21ClO)",
            "Dodecanoyl chloride (C12H23ClO)",
            "Tridecanoyl chloride (C13H25ClO)",
            "Tetradecanoyl chloride (C14H27ClO)",
            "Pentadecanoyl chloride (C15H29ClO)",
            "Hexadecanoyl chloride (C16H31ClO)",
            "Heptadecanoyl chloride (C17H33ClO)",
            "Octadecanoyl chloride (C18H35ClO)",
            "Nonadecanoyl chloride (C19H37ClO)",
            "Eicosanoyl chloride (C20H39ClO)",
            "Heneicosanoyl chloride (C21H41ClO)",
            "Docosanoyl chloride (C22H43ClO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Propionyl chloride (CH3CH2COCl)",
                "Butyryl chloride (C4H7ClO)",
                "Pivaloyl chloride (C5H9ClO)",
                "Isobutyryl chloride (C4H7ClO)",
                "Valeryl chloride (C5H9ClO)",
                "Caprooyl chloride (C6H11ClO)",
                "Heptanoyl chloride (C7H13ClO)",
                "Octanoyl chloride (C8H15ClO)",
                "Nonanoyl chloride (C9H17ClO)",
                "Decanoyl chloride (C10H19ClO)",
                "Undecanoyl chloride (C11H21ClO)",
                "Dodecanoyl chloride (C12H23ClO)",
                "Tridecanoyl chloride (C13H25ClO)",
                "Tetradecanoyl chloride (C14H27ClO)",
                "Pentadecanoyl chloride (C15H29ClO)",
                "Hexadecanoyl chloride (C16H31ClO)",
                "Heptadecanoyl chloride (C17H33ClO)",
                "Octadecanoyl chloride (C18H35ClO)",
                "Nonadecanoyl chloride (C19H37ClO)",
                "Eicosanoyl chloride (C20H39ClO)",
                "Heneicosanoyl chloride (C21H41ClO)",
                "Docosanoyl chloride (C22H43ClO)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Butyryl chloride (C4H7ClO)",
                "Caprooyl chloride (C6H11ClO)",
                "Decanoyl chloride (C10H19ClO)",
                "Docosanoyl chloride (C22H43ClO)",
                "Dodecanoyl chloride (C12H23ClO)",
                "Eicosanoyl chloride (C20H39ClO)",
                "Heneicosanoyl chloride (C21H41ClO)",
                "Heptadecanoyl chloride (C17H33ClO)",
                "Heptanoyl chloride (C7H13ClO)",
                "Hexadecanoyl chloride (C16H31ClO)",
                "Isobutyryl chloride (C4H7ClO)",
                "Nonadecanoyl chloride (C19H37ClO)",
                "Nonanoyl chloride (C9H17ClO)",
                "Octadecanoyl chloride (C18H35ClO)",
                "Octanoyl chloride (C8H15ClO)",
                "Pentadecanoyl chloride (C15H29ClO)",
                "Pivaloyl chloride (C5H9ClO)",
                "Propionyl chloride (CH3CH2COCl)",
                "Tetradecanoyl chloride (C14H27ClO)",
                "Tridecanoyl chloride (C13H25ClO)",
                "Undecanoyl chloride (C11H21ClO)",
                "Valeryl chloride (C5H9ClO)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Benzoyl chloride (C6H5COCl)",
            "Propionyl chloride (C2H5COCl)",
            "Butyryl chloride (C3H7COCl)",
            "Valeryl chloride (C4H9COCl)",
            "Formyl chloride (HCOCl)",
            "Isobutyryl chloride ((CH3)2CHCOCl)",
            "Isovaleryl chloride ((CH3)2CHCH2COCl)",
            "Trifluoroacetyl chloride (CF3COCl)",
            "Chloroacetyl chloride (ClCH2COCl)",
            "Bromobenzoyl chloride (C6H5COCBr)",
            "Iodobenzoyl chloride (C6H5COCI)",
            "Fluorobenzoyl chloride (C6H5COF)",
            "Chlorobenzoyl chloride (C6H5COCl)",
            "Bromopropionyl chloride (C2H5COCBr)",
            "Iodopropionyl chloride (C2H5COCI)",
            "Fluoropropionyl chloride (C2H5COF)",
            "Chloropropionyl chloride (C2H5COCl)",
            "Bromobutyryl chloride (C3H7COCBr)",
            "Iodobutyryl chloride (C3H7COCI)",
            "Fluorobutyryl chloride (C3H7COF)",
            "Chlorobutyryl chloride (C3H7COCl)",
            "Bromovaleryl chloride (C4H9COCBr)",
            "Iodovaleryl chloride (C4H9COCI)",
            "Fluorovaleryl chloride (C4H9COF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Propionyl chloride (C2H5COCl)",
                "Butyryl chloride (C3H7COCl)",
                "Valeryl chloride (C4H9COCl)",
                "Formyl chloride (HCOCl)",
                "Isobutyryl chloride ((CH3)2CHCOCl)",
                "Isovaleryl chloride ((CH3)2CHCH2COCl)",
                "Trifluoroacetyl chloride (CF3COCl)",
                "Chloroacetyl chloride (ClCH2COCl)",
                "Bromobenzoyl chloride (C6H5COCBr)",
                "Iodobenzoyl chloride (C6H5COCI)",
                "Fluorobenzoyl chloride (C6H5COF)",
                "Chlorobenzoyl chloride (C6H5COCl)",
                "Bromopropionyl chloride (C2H5COCBr)",
                "Iodopropionyl chloride (C2H5COCI)",
                "Fluoropropionyl chloride (C2H5COF)",
                "Chloropropionyl chloride (C2H5COCl)",
                "Bromobutyryl chloride (C3H7COCBr)",
                "Iodobutyryl chloride (C3H7COCI)",
                "Fluorobutyryl chloride (C3H7COF)",
                "Chlorobutyryl chloride (C3H7COCl)",
                "Bromovaleryl chloride (C4H9COCBr)",
                "Iodovaleryl chloride (C4H9COCI)"
            ],
            "mismatches": [
                "Fluorovaleryl chloride (C4H9COF)"
            ],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Bromobenzoyl chloride (C6H5COCBr)",
                "Bromobutyryl chloride (C3H7COCBr)",
                "Bromopropionyl chloride (C2H5COCBr)",
                "Bromovaleryl chloride (C4H9COCBr)",
                "Butyryl chloride (C3H7COCl)",
                "Chloroacetyl chloride (ClCH2COCl)",
                "Chlorobenzoyl chloride (C6H5COCl)",
                "Chlorobutyryl chloride (C3H7COCl)",
                "Chloropropionyl chloride (C2H5COCl)",
                "Fluorobenzoyl chloride (C6H5COF)",
                "Fluorobutyryl chloride (C3H7COF)",
                "Fluoropropionyl chloride (C2H5COF)",
                "Formyl chloride (HCOCl)",
                "Iodobenzoyl chloride (C6H5COCI)",
                "Iodobutyryl chloride (C3H7COCI)",
                "Iodopropionyl chloride (C2H5COCI)",
                "Iodovaleryl chloride (C4H9COCI)",
                "Isobutyryl chloride ((CH3)2CHCOCl)",
                "Isovaleryl chloride ((CH3)2CHCH2COCl)",
                "Propionyl chloride (C2H5COCl)",
                "Trifluoroacetyl chloride (CF3COCl)",
                "Valeryl chloride (C4H9COCl)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH\u2083COCl)",
            "Benzoyl chloride (C\u2086H\u2085COCl)",
            "Propionyl chloride (CH\u2083CH\u2082COCl)",
            "Butyryl chloride (CH\u2083CH\u2082CH\u2082COCl)",
            "Formyl chloride (HCOCl)",
            "p-Tolyl chloride (p-CH\u2083C\u2086H\u2084COCl)",
            "2-Chlorobenzoyl chloride",
            "3-Chlorobenzoyl chloride",
            "4-Chlorobenzoyl chloride",
            "2,4-Dichlorobenzoyl chloride",
            "2,5-Dichlorobenzoyl chloride",
            "3,5-Dichlorobenzoyl chloride",
            "Hexanoyl chloride (C\u2085H\u2081\u2081COCl)",
            "Benzoyl bromide (C\u2086H\u2085COBr)",
            "Benzoyl iodide (C\u2086H\u2085COI)",
            "Phenylacetyl chloride (C\u2086H\u2085CH\u2082COCl)",
            "Oxalyl chloride ((ClCO)\u2082)",
            "Succinyl chloride (ClCH\u2082CH\u2082COCl)",
            "Glutaroyl chloride (Cl(CH\u2082)\u2083COCl)",
            "Adipoyl chloride (Cl(CH\u2082)\u2084COCl)",
            "Malonyl chloride (ClCH\u2082COCl)",
            "Terephthaloyl chloride (p-C\u2086H\u2084(COCl)\u2082)",
            "2-Naphthoyl chloride",
            "Phthaloyl chloride (o-C\u2086H\u2084(COCl)\u2082)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH\u2083COCl)",
                "Benzoyl chloride (C\u2086H\u2085COCl)",
                "Propionyl chloride (CH\u2083CH\u2082COCl)",
                "Butyryl chloride (CH\u2083CH\u2082CH\u2082COCl)",
                "Formyl chloride (HCOCl)",
                "p-Tolyl chloride (p-CH\u2083C\u2086H\u2084COCl)",
                "2-Chlorobenzoyl chloride",
                "3-Chlorobenzoyl chloride",
                "4-Chlorobenzoyl chloride",
                "2,4-Dichlorobenzoyl chloride",
                "2,5-Dichlorobenzoyl chloride",
                "3,5-Dichlorobenzoyl chloride",
                "Hexanoyl chloride (C\u2085H\u2081\u2081COCl)",
                "Benzoyl bromide (C\u2086H\u2085COBr)",
                "Benzoyl iodide (C\u2086H\u2085COI)",
                "Phenylacetyl chloride (C\u2086H\u2085CH\u2082COCl)",
                "Oxalyl chloride ((ClCO)\u2082)",
                "Succinyl chloride (ClCH\u2082CH\u2082COCl)",
                "Glutaroyl chloride (Cl(CH\u2082)\u2083COCl)",
                "Adipoyl chloride (Cl(CH\u2082)\u2084COCl)",
                "Malonyl chloride (ClCH\u2082COCl)",
                "Terephthaloyl chloride (p-C\u2086H\u2084(COCl)\u2082)",
                "2-Naphthoyl chloride",
                "Phthaloyl chloride (o-C\u2086H\u2084(COCl)\u2082)"
            ],
            "mismatches": [],
            "true_referents": [
                "2,4-Dichlorobenzoyl chloride",
                "2,5-Dichlorobenzoyl chloride",
                "2-Chlorobenzoyl chloride",
                "2-Naphthoyl chloride",
                "3,5-Dichlorobenzoyl chloride",
                "3-Chlorobenzoyl chloride",
                "4-Chlorobenzoyl chloride",
                "Acetyl chloride (CH\u2083COCl)",
                "Adipoyl chloride (Cl(CH\u2082)\u2084COCl)",
                "Benzoyl bromide (C\u2086H\u2085COBr)",
                "Benzoyl chloride (C\u2086H\u2085COCl)",
                "Benzoyl iodide (C\u2086H\u2085COI)",
                "Butyryl chloride (CH\u2083CH\u2082CH\u2082COCl)",
                "Formyl chloride (HCOCl)",
                "Glutaroyl chloride (Cl(CH\u2082)\u2083COCl)",
                "Hexanoyl chloride (C\u2085H\u2081\u2081COCl)",
                "Malonyl chloride (ClCH\u2082COCl)",
                "Oxalyl chloride ((ClCO)\u2082)",
                "Phenylacetyl chloride (C\u2086H\u2085CH\u2082COCl)",
                "Phthaloyl chloride (o-C\u2086H\u2084(COCl)\u2082)",
                "Propionyl chloride (CH\u2083CH\u2082COCl)",
                "Succinyl chloride (ClCH\u2082CH\u2082COCl)",
                "Terephthaloyl chloride (p-C\u2086H\u2084(COCl)\u2082)",
                "p-Tolyl chloride (p-CH\u2083C\u2086H\u2084COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Propanoyl bromide (CH3CH2COBr)",
            "Benzoyl chloride (C6H5COCl)",
            "Oxalyl chloride ((COCl)2)",
            "Palmitoyl chloride (CH3(CH2)14COCl)",
            "Malonyl dichloride (ClCOCH2COCl)",
            "Succinyl chloride (ClCO(CH2)2COCl)",
            "Acryloyl chloride (CH2=CHCOCl)",
            "Pivaloyl chloride ((CH3)3CCOCl)",
            "Phthaloyl chloride (C6H4(COCl)2)",
            "Stearoyl chloride (CH3(CH2)16COCl)",
            "Butyryl chloride (CH3CH2CH2COCl)",
            "Cinnamoyl chloride (C6H5CH=CHCOCl)",
            "Lauroyl chloride (CH3(CH2)10COCl)",
            "Myristoyl chloride (CH3(CH2)12COCl)",
            "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
            "Sebacoyl chloride (ClCO(CH2)8COCl)",
            "Terephthaloyl chloride (ClCOC6H4COCl)",
            "Valeryl chloride (CH3(CH2)3COCl)",
            "Adipoyl chloride (ClCO(CH2)4COCl)",
            "Crotonyl chloride (CH3CH=CHCOCl)",
            "Isophthaloyl chloride (1,3-C6H4(COCl)2)",
            "Octanoyl chloride (CH3(CH2)6COCl)",
            "Trichloroacetyl chloride (Cl3CCOCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Propanoyl bromide (CH3CH2COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Oxalyl chloride ((COCl)2)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Malonyl dichloride (ClCOCH2COCl)",
                "Succinyl chloride (ClCO(CH2)2COCl)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Phthaloyl chloride (C6H4(COCl)2)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Cinnamoyl chloride (C6H5CH=CHCOCl)",
                "Lauroyl chloride (CH3(CH2)10COCl)",
                "Myristoyl chloride (CH3(CH2)12COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Sebacoyl chloride (ClCO(CH2)8COCl)",
                "Terephthaloyl chloride (ClCOC6H4COCl)",
                "Valeryl chloride (CH3(CH2)3COCl)",
                "Adipoyl chloride (ClCO(CH2)4COCl)",
                "Crotonyl chloride (CH3CH=CHCOCl)",
                "Isophthaloyl chloride (1,3-C6H4(COCl)2)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Trichloroacetyl chloride (Cl3CCOCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Adipoyl chloride (ClCO(CH2)4COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Cinnamoyl chloride (C6H5CH=CHCOCl)",
                "Crotonyl chloride (CH3CH=CHCOCl)",
                "Isophthaloyl chloride (1,3-C6H4(COCl)2)",
                "Lauroyl chloride (CH3(CH2)10COCl)",
                "Malonyl dichloride (ClCOCH2COCl)",
                "Myristoyl chloride (CH3(CH2)12COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Oxalyl chloride ((COCl)2)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Phthaloyl chloride (C6H4(COCl)2)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Propanoyl bromide (CH3CH2COBr)",
                "Sebacoyl chloride (ClCO(CH2)8COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Succinyl chloride (ClCO(CH2)2COCl)",
                "Terephthaloyl chloride (ClCOC6H4COCl)",
                "Trichloroacetyl chloride (Cl3CCOCl)",
                "Valeryl chloride (CH3(CH2)3COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Acetyl bromide (CH3COBr)",
            "Acetyl iodide (CH3COI)",
            "Propionyl chloride (CH3CH2COCl)",
            "Butyryl chloride (CH3(CH2)2COCl)",
            "Isobutyryl chloride ((CH3)2CHCOCl)",
            "Valeryl chloride (CH3(CH2)3COCl)",
            "Isovaleryl chloride ((CH3)2CHCH2COCl)",
            "Pivaloyl chloride ((CH3)3CCOCl)",
            "Hexanoyl chloride (CH3(CH2)4COCl)",
            "Heptanoyl chloride (CH3(CH2)5COCl)",
            "Octanoyl chloride (CH3(CH2)6COCl)",
            "Nonanoyl chloride (CH3(CH2)7COCl)",
            "Decanoyl chloride (CH3(CH2)8COCl)",
            "Benzoyl chloride (C6H5COCl)",
            "2-Methylbenzoyl chloride (o-CH3C6H4COCl)",
            "3-Methylbenzoyl chloride (m-CH3C6H4COCl)",
            "4-Methylbenzoyl chloride (p-CH3C6H4COCl)",
            "2-Chlorobenzoyl chloride (o-ClC6H4COCl)",
            "3-Chlorobenzoyl chloride (m-ClC6H4COCl)",
            "4-Chlorobenzoyl chloride (p-ClC6H4COCl)",
            "Oxalyl chloride ((COCl)2)",
            "Malonyl dichloride (CH2(COCl)2)",
            "Succinyl chloride ((CH2)2(COCl)2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Acetyl bromide (CH3COBr)",
                "Acetyl iodide (CH3COI)",
                "Propionyl chloride (CH3CH2COCl)",
                "Butyryl chloride (CH3(CH2)2COCl)",
                "Isobutyryl chloride ((CH3)2CHCOCl)",
                "Valeryl chloride (CH3(CH2)3COCl)",
                "Isovaleryl chloride ((CH3)2CHCH2COCl)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Hexanoyl chloride (CH3(CH2)4COCl)",
                "Heptanoyl chloride (CH3(CH2)5COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Nonanoyl chloride (CH3(CH2)7COCl)",
                "Decanoyl chloride (CH3(CH2)8COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "2-Methylbenzoyl chloride (o-CH3C6H4COCl)",
                "3-Methylbenzoyl chloride (m-CH3C6H4COCl)",
                "4-Methylbenzoyl chloride (p-CH3C6H4COCl)",
                "2-Chlorobenzoyl chloride (o-ClC6H4COCl)",
                "3-Chlorobenzoyl chloride (m-ClC6H4COCl)",
                "4-Chlorobenzoyl chloride (p-ClC6H4COCl)",
                "Oxalyl chloride ((COCl)2)",
                "Malonyl dichloride (CH2(COCl)2)",
                "Succinyl chloride ((CH2)2(COCl)2)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Chlorobenzoyl chloride (o-ClC6H4COCl)",
                "2-Methylbenzoyl chloride (o-CH3C6H4COCl)",
                "3-Chlorobenzoyl chloride (m-ClC6H4COCl)",
                "3-Methylbenzoyl chloride (m-CH3C6H4COCl)",
                "4-Chlorobenzoyl chloride (p-ClC6H4COCl)",
                "4-Methylbenzoyl chloride (p-CH3C6H4COCl)",
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Acetyl iodide (CH3COI)",
                "Benzoyl chloride (C6H5COCl)",
                "Butyryl chloride (CH3(CH2)2COCl)",
                "Decanoyl chloride (CH3(CH2)8COCl)",
                "Heptanoyl chloride (CH3(CH2)5COCl)",
                "Hexanoyl chloride (CH3(CH2)4COCl)",
                "Isobutyryl chloride ((CH3)2CHCOCl)",
                "Isovaleryl chloride ((CH3)2CHCH2COCl)",
                "Malonyl dichloride (CH2(COCl)2)",
                "Nonanoyl chloride (CH3(CH2)7COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Oxalyl chloride ((COCl)2)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Propionyl chloride (CH3CH2COCl)",
                "Succinyl chloride ((CH2)2(COCl)2)",
                "Valeryl chloride (CH3(CH2)3COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Acetyl bromide (CH3COBr)",
            "Benzoyl chloride (C6H5COCl)",
            "Benzoyl bromide (C6H5COBr)",
            "Propionyl chloride (CH3CH2COCl)",
            "Butyryl chloride (CH3CH2CH2COCl)",
            "Isobutyryl chloride ((CH3)2CHCOC)",
            "Valeroyl chloride (CH3CH2CH2CH2COCl)",
            "Hexanoyl chloride (CH3(CH2)4COCl)",
            "Heptanoyl chloride (CH3(CH2)5COCl)",
            "Octanoyl chloride (CH3(CH2)6COCl)",
            "Nonanoyl chloride (CH3(CH2)7COCl)",
            "Decanoyl chloride (CH3(CH2)8COCl)",
            "Palmitoyl chloride (CH3(CH2)14COCl)",
            "Stearoyl chloride (CH3(CH2)16COCl)",
            "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
            "Linoleoyl chloride (CH3(CH2)4CH=CHCH2CH=CH(CH2)7COCl)",
            "Linolenyl chloride (CH3CH2CH=CHCH2CH=CHCH2CH=CH(CH2)7COCl)",
            "Arachidoyl chloride (CH3(CH2)18COCl)",
            "Behenoyl chloride (CH3(CH2)20COCl)",
            "Lignoceroyl chloride (CH3(CH2)22COCl)",
            "Cerotoyl chloride (CH3(CH2)24COCl)",
            "Melissoyl chloride (CH3(CH2)28COCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Acetyl bromide (CH3COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl bromide (C6H5COBr)",
                "Propionyl chloride (CH3CH2COCl)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Isobutyryl chloride ((CH3)2CHCOC)",
                "Valeroyl chloride (CH3CH2CH2CH2COCl)",
                "Hexanoyl chloride (CH3(CH2)4COCl)",
                "Heptanoyl chloride (CH3(CH2)5COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Nonanoyl chloride (CH3(CH2)7COCl)",
                "Decanoyl chloride (CH3(CH2)8COCl)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Linoleoyl chloride (CH3(CH2)4CH=CHCH2CH=CH(CH2)7COCl)",
                "Linolenyl chloride (CH3CH2CH=CHCH2CH=CHCH2CH=CH(CH2)7COCl)",
                "Arachidoyl chloride (CH3(CH2)18COCl)",
                "Behenoyl chloride (CH3(CH2)20COCl)",
                "Lignoceroyl chloride (CH3(CH2)22COCl)",
                "Cerotoyl chloride (CH3(CH2)24COCl)",
                "Melissoyl chloride (CH3(CH2)28COCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Arachidoyl chloride (CH3(CH2)18COCl)",
                "Behenoyl chloride (CH3(CH2)20COCl)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Cerotoyl chloride (CH3(CH2)24COCl)",
                "Decanoyl chloride (CH3(CH2)8COCl)",
                "Heptanoyl chloride (CH3(CH2)5COCl)",
                "Hexanoyl chloride (CH3(CH2)4COCl)",
                "Isobutyryl chloride ((CH3)2CHCOC)",
                "Lignoceroyl chloride (CH3(CH2)22COCl)",
                "Linolenyl chloride (CH3CH2CH=CHCH2CH=CHCH2CH=CH(CH2)7COCl)",
                "Linoleoyl chloride (CH3(CH2)4CH=CHCH2CH=CH(CH2)7COCl)",
                "Melissoyl chloride (CH3(CH2)28COCl)",
                "Nonanoyl chloride (CH3(CH2)7COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Propionyl chloride (CH3CH2COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Valeroyl chloride (CH3CH2CH2CH2COCl)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Propionyl chloride (PrCl)",
            "Butyryl chloride (BuCl)",
            "Isobutyryl chloride (i-BuCl)",
            "Valeryl chloride (ValCl)",
            "Isovaleryl chloride (i-ValCl)",
            "Hexanoyl chloride (HxCl)",
            "Heptanoyl chloride (HpCl)",
            "Octanoyl chloride (OcCl)",
            "Nonanoyl chloride (NoCl)",
            "Decanoyl chloride (DeCl)",
            "Lauroyl chloride (LaCl)",
            "Myristoyl chloride (MyCl)",
            "Palmitoyl chloride (PaCl)",
            "Stearoyl chloride (StCl)",
            "Oleoyl chloride (OlCl)",
            "Linoleoyl chloride (LiCl)",
            "Linolenoyl chloride (LnCl)",
            "Acetyl bromide (AcBr)",
            "Propionyl bromide (PrBr)",
            "Butyryl bromide (BuBr)",
            "Isobutyryl bromide (i-BuBr)",
            "Valeryl bromide (ValBr)",
            "Isovaleryl bromide (i-ValBr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Propionyl chloride (PrCl)",
                "Butyryl chloride (BuCl)",
                "Isobutyryl chloride (i-BuCl)",
                "Valeryl chloride (ValCl)",
                "Isovaleryl chloride (i-ValCl)",
                "Hexanoyl chloride (HxCl)",
                "Heptanoyl chloride (HpCl)",
                "Octanoyl chloride (OcCl)",
                "Nonanoyl chloride (NoCl)",
                "Decanoyl chloride (DeCl)",
                "Lauroyl chloride (LaCl)",
                "Myristoyl chloride (MyCl)",
                "Palmitoyl chloride (PaCl)",
                "Stearoyl chloride (StCl)",
                "Oleoyl chloride (OlCl)",
                "Linoleoyl chloride (LiCl)",
                "Linolenoyl chloride (LnCl)",
                "Acetyl bromide (AcBr)",
                "Propionyl bromide (PrBr)",
                "Butyryl bromide (BuBr)",
                "Isobutyryl bromide (i-BuBr)",
                "Valeryl bromide (ValBr)",
                "Isovaleryl bromide (i-ValBr)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (AcBr)",
                "Acetyl chloride (AcCl)",
                "Butyryl bromide (BuBr)",
                "Butyryl chloride (BuCl)",
                "Decanoyl chloride (DeCl)",
                "Heptanoyl chloride (HpCl)",
                "Hexanoyl chloride (HxCl)",
                "Isobutyryl bromide (i-BuBr)",
                "Isobutyryl chloride (i-BuCl)",
                "Isovaleryl bromide (i-ValBr)",
                "Isovaleryl chloride (i-ValCl)",
                "Lauroyl chloride (LaCl)",
                "Linolenoyl chloride (LnCl)",
                "Linoleoyl chloride (LiCl)",
                "Myristoyl chloride (MyCl)",
                "Nonanoyl chloride (NoCl)",
                "Octanoyl chloride (OcCl)",
                "Oleoyl chloride (OlCl)",
                "Palmitoyl chloride (PaCl)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)",
                "Stearoyl chloride (StCl)",
                "Valeryl bromide (ValBr)",
                "Valeryl chloride (ValCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Benzoyl chloride (BzCl)",
            "Pivaloyl chloride (PivCl)",
            "Chloroacetyl chloride (ClCH2COCl)",
            "Ethoxycarbonyl chloride (EtO2CCl)",
            "Methoxycarbonyl chloride (MeO2CCl)",
            "Tosyl chloride (TsCl)",
            "Benzoyl bromide (BzBr)",
            "Pivaloyl bromide (PivBr)",
            "Chloroacetyl bromide (ClCH2COBr)",
            "Ethoxycarbonyl bromide (EtO2CCBr)",
            "Methoxycarbonyl bromide (MeO2CCBr)",
            "Acetoxybenzoyl chloride (AcOOC6H4COCl)",
            "Acetoxybenzoyl bromide (AcOOC6H4COBr)",
            "Phthaloyl chloride (PhthCl)",
            "Phthaloyl bromide (PhthBr)",
            "Maleoyl chloride (MaleCl)",
            "Maleoyl bromide (MaleBr)",
            "Fumaryl chloride (FumCl)",
            "Fumaryl bromide (FumBr)",
            "Citramalyl chloride (CitCl)",
            "Citramalyl bromide (CitBr)",
            "Citryl chloride (CitCl)",
            "Citryl bromide (CitBr)",
            "Cinnamoyl chloride (CinnCl)",
            "Cinnamoyl bromide (CinnBr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Benzoyl chloride (BzCl)",
                "Pivaloyl chloride (PivCl)",
                "Chloroacetyl chloride (ClCH2COCl)",
                "Ethoxycarbonyl chloride (EtO2CCl)",
                "Methoxycarbonyl chloride (MeO2CCl)",
                "Tosyl chloride (TsCl)",
                "Benzoyl bromide (BzBr)",
                "Pivaloyl bromide (PivBr)",
                "Chloroacetyl bromide (ClCH2COBr)",
                "Ethoxycarbonyl bromide (EtO2CCBr)",
                "Methoxycarbonyl bromide (MeO2CCBr)",
                "Acetoxybenzoyl chloride (AcOOC6H4COCl)",
                "Acetoxybenzoyl bromide (AcOOC6H4COBr)",
                "Phthaloyl chloride (PhthCl)",
                "Phthaloyl bromide (PhthBr)",
                "Maleoyl chloride (MaleCl)",
                "Maleoyl bromide (MaleBr)",
                "Fumaryl chloride (FumCl)",
                "Fumaryl bromide (FumBr)",
                "Citramalyl chloride (CitCl)",
                "Citramalyl bromide (CitBr)"
            ],
            "mismatches": [
                "Citryl chloride (CitCl)",
                "Citryl bromide (CitBr)",
                "Cinnamoyl chloride (CinnCl)",
                "Cinnamoyl bromide (CinnBr)"
            ],
            "true_referents": [
                "Acetoxybenzoyl bromide (AcOOC6H4COBr)",
                "Acetoxybenzoyl chloride (AcOOC6H4COCl)",
                "Acetyl chloride (AcCl)",
                "Benzoyl bromide (BzBr)",
                "Benzoyl chloride (BzCl)",
                "Chloroacetyl bromide (ClCH2COBr)",
                "Chloroacetyl chloride (ClCH2COCl)",
                "Citramalyl bromide (CitBr)",
                "Citramalyl chloride (CitCl)",
                "Citryl bromide (CitBr)",
                "Citryl chloride (CitCl)",
                "Ethoxycarbonyl bromide (EtO2CCBr)",
                "Ethoxycarbonyl chloride (EtO2CCl)",
                "Fumaryl bromide (FumBr)",
                "Fumaryl chloride (FumCl)",
                "Maleoyl bromide (MaleBr)",
                "Maleoyl chloride (MaleCl)",
                "Methoxycarbonyl bromide (MeO2CCBr)",
                "Methoxycarbonyl chloride (MeO2CCl)",
                "Phthaloyl bromide (PhthBr)",
                "Phthaloyl chloride (PhthCl)",
                "Pivaloyl bromide (PivBr)",
                "Pivaloyl chloride (PivCl)",
                "Tosyl chloride (TsCl)"
            ],
            "TP": 22,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (ACl)",
            "Acetyl bromide (ABr)",
            "Acetyl fluoride (AF)",
            "Propionyl chloride (PrCl)",
            "Propionyl bromide (PrBr)",
            "Butyryl chloride (BuCl)",
            "Pentanoyl chloride (PnCl)",
            "Hexanoyl chloride (HxCl)",
            "Heptanoyl chloride (HpCl)",
            "Octanoyl chloride (OcCl)",
            "Decanoyl chloride (DcCl)",
            "Benzooyl chloride (BzCl)",
            "4-Methylbenzoyl chloride (4-MeBzCl)",
            "4-Nitrobenzoyl chloride (4-NBzCl)",
            "4-Methoxybenzoyl chloride (4-MeOBzCl)",
            "Cinnamoyl chloride (CnCl)",
            "3-Chlorobenzoyl chloride (3-ClBzCl)",
            "4-Chlorobenzoyl chloride (4-ClBzCl)",
            "2-Naphthoyl chloride (2-NpCl)",
            "1-Naphthoyl chloride (1-NpCl)",
            "Acryloyl chloride (AcrCl)",
            " Methacryloyl chloride (MAcrCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (ACl)",
                "Acetyl bromide (ABr)",
                "Acetyl fluoride (AF)",
                "Propionyl chloride (PrCl)",
                "Propionyl bromide (PrBr)",
                "Butyryl chloride (BuCl)",
                "Pentanoyl chloride (PnCl)",
                "Hexanoyl chloride (HxCl)",
                "Heptanoyl chloride (HpCl)",
                "Octanoyl chloride (OcCl)",
                "Decanoyl chloride (DcCl)",
                "Benzooyl chloride (BzCl)",
                "4-Methylbenzoyl chloride (4-MeBzCl)",
                "4-Nitrobenzoyl chloride (4-NBzCl)",
                "4-Methoxybenzoyl chloride (4-MeOBzCl)",
                "Cinnamoyl chloride (CnCl)",
                "3-Chlorobenzoyl chloride (3-ClBzCl)",
                "4-Chlorobenzoyl chloride (4-ClBzCl)",
                "2-Naphthoyl chloride (2-NpCl)",
                "1-Naphthoyl chloride (1-NpCl)",
                "Acryloyl chloride (AcrCl)",
                " Methacryloyl chloride (MAcrCl)"
            ],
            "mismatches": [],
            "true_referents": [
                " Methacryloyl chloride (MAcrCl)",
                "1-Naphthoyl chloride (1-NpCl)",
                "2-Naphthoyl chloride (2-NpCl)",
                "3-Chlorobenzoyl chloride (3-ClBzCl)",
                "4-Chlorobenzoyl chloride (4-ClBzCl)",
                "4-Methoxybenzoyl chloride (4-MeOBzCl)",
                "4-Methylbenzoyl chloride (4-MeBzCl)",
                "4-Nitrobenzoyl chloride (4-NBzCl)",
                "Acetyl bromide (ABr)",
                "Acetyl chloride (ACl)",
                "Acetyl fluoride (AF)",
                "Acryloyl chloride (AcrCl)",
                "Benzooyl chloride (BzCl)",
                "Butyryl chloride (BuCl)",
                "Cinnamoyl chloride (CnCl)",
                "Decanoyl chloride (DcCl)",
                "Heptanoyl chloride (HpCl)",
                "Hexanoyl chloride (HxCl)",
                "Octanoyl chloride (OcCl)",
                "Pentanoyl chloride (PnCl)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "acetyl chloride",
                "Canonical name": "ethanoic anhydride"
            },
            {
                "Referent": "benzoyl chloride",
                "Canonical name": "benzoyl chloride"
            },
            {
                "Referent": "chloroacetyl chloride",
                "Canonical name": "chloroethanoic anhydride"
            },
            {
                "Referent": "ethyl chloroformate",
                "Canonical name": "ethyl chloroformate"
            },
            {
                "Referent": "ethyl chloroacetate",
                "Canonical name": "ethyl chloroacetate"
            },
            {
                "Referent": "methyl chloroformate",
                "Canonical name": "methyl chloroformate"
            },
            {
                "Referent": "methyl chloroacetate",
                "Canonical name": "methyl chloroacetate"
            },
            {
                "Referent": "propionyl chloride",
                "Canonical name": "propionyl chloride"
            },
            {
                "Referent": "pivaloyl chloride",
                "Canonical name": "pivaloyl chloride"
            },
            {
                "Referent": "thionyl chloride",
                "Canonical name": "thionyl chloride"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetyl chloride",
                "benzoyl chloride",
                "chloroacetyl chloride",
                "ethyl chloroacetate",
                "ethyl chloroformate",
                "methyl chloroacetate",
                "methyl chloroformate",
                "pivaloyl chloride",
                "propionyl chloride",
                "thionyl chloride"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"acetyl chloride\", \"Canonical name\": \"ethanoic anhydride\"}",
                "{\"Referent\": \"benzoyl chloride\", \"Canonical name\": \"benzoyl chloride\"}",
                "{\"Referent\": \"chloroacetyl chloride\", \"Canonical name\": \"chloroethanoic anhydride\"}",
                "{\"Referent\": \"ethyl chloroacetate\", \"Canonical name\": \"ethyl chloroacetate\"}",
                "{\"Referent\": \"ethyl chloroformate\", \"Canonical name\": \"ethyl chloroformate\"}",
                "{\"Referent\": \"methyl chloroacetate\", \"Canonical name\": \"methyl chloroacetate\"}",
                "{\"Referent\": \"methyl chloroformate\", \"Canonical name\": \"methyl chloroformate\"}",
                "{\"Referent\": \"pivaloyl chloride\", \"Canonical name\": \"pivaloyl chloride\"}",
                "{\"Referent\": \"propionyl chloride\", \"Canonical name\": \"propionyl chloride\"}",
                "{\"Referent\": \"thionyl chloride\", \"Canonical name\": \"thionyl chloride\"}"
            ],
            "TP": 10,
            "FP": 0,
            "FN": 0
        }
    }
]