[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Propionyl chloride (PrCl)",
            "Butyryl chloride (BuCl)",
            "Valeryl chloride (VCl)",
            "Hexanoyl chloride (HxCl)",
            "Acetyl bromide (AcBr)",
            "Propionyl bromide (PrBr)",
            "Butyryl bromide (BuBr)",
            "Valeryl bromide (VBr)",
            "Hexanoyl bromide (HxBr)",
            "Acetyl iodide (AcI)",
            "Propionyl iodide (PrI)",
            "Butyryl iodide (BuI)",
            "Valeryl iodide (VI)",
            "Hexanoyl iodide (HxI)",
            "Acetyl fluoride (AcF)",
            "Propionyl fluoride (PrF)",
            "Butyryl fluoride (BuF)",
            "Valeryl fluoride (VF)",
            "Hexanoyl fluoride (HxF)",
            "Benzenecarbonyl chloride (PhCl)",
            "Benzenecarbonyl bromide (PhBr)",
            "Benzenecarbonyl iodide (PhI)",
            "Benzenecarbonyl fluoride (PhF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Propionyl chloride (PrCl)",
                "Butyryl chloride (BuCl)",
                "Valeryl chloride (VCl)",
                "Hexanoyl chloride (HxCl)",
                "Acetyl bromide (AcBr)",
                "Propionyl bromide (PrBr)",
                "Butyryl bromide (BuBr)",
                "Valeryl bromide (VBr)",
                "Hexanoyl bromide (HxBr)",
                "Acetyl iodide (AcI)",
                "Propionyl iodide (PrI)",
                "Butyryl iodide (BuI)",
                "Valeryl iodide (VI)",
                "Hexanoyl iodide (HxI)",
                "Acetyl fluoride (AcF)",
                "Propionyl fluoride (PrF)",
                "Butyryl fluoride (BuF)",
                "Valeryl fluoride (VF)",
                "Hexanoyl fluoride (HxF)",
                "Benzenecarbonyl chloride (PhCl)",
                "Benzenecarbonyl bromide (PhBr)",
                "Benzenecarbonyl iodide (PhI)",
                "Benzenecarbonyl fluoride (PhF)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (AcBr)",
                "Acetyl chloride (AcCl)",
                "Acetyl fluoride (AcF)",
                "Acetyl iodide (AcI)",
                "Benzenecarbonyl bromide (PhBr)",
                "Benzenecarbonyl chloride (PhCl)",
                "Benzenecarbonyl fluoride (PhF)",
                "Benzenecarbonyl iodide (PhI)",
                "Butyryl bromide (BuBr)",
                "Butyryl chloride (BuCl)",
                "Butyryl fluoride (BuF)",
                "Butyryl iodide (BuI)",
                "Hexanoyl bromide (HxBr)",
                "Hexanoyl chloride (HxCl)",
                "Hexanoyl fluoride (HxF)",
                "Hexanoyl iodide (HxI)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)",
                "Propionyl fluoride (PrF)",
                "Propionyl iodide (PrI)",
                "Valeryl bromide (VBr)",
                "Valeryl chloride (VCl)",
                "Valeryl fluoride (VF)",
                "Valeryl iodide (VI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Acetyl bromide (CH3COBr)",
            "Propionyl chloride (C2H5COCl)",
            "Propionyl bromide (C2H5COBr)",
            "Butyryl chloride (C3H7COCl)",
            "Butyryl bromide (C3H7COBr)",
            "Valeryl chloride (C4H9COCl)",
            "Valeryl bromide (C4H9COBr)",
            "Isovaleryl chloride ((CH3)2CHCH2COCl)",
            "Isovaleryl bromide ((CH3)2CHCH2COBr)",
            "Benzoyl chloride (C6H5COCl)",
            "Benzoyl bromide (C6H5COBr)",
            "Phenacyl chloride (C6H5CH2COCl)",
            "Phenacyl bromide (C6H5CH2COBr)",
            "Chloroacetyl chloride (ClCH2COCl)",
            "Bromoacetyl bromide (BrCH2COBr)",
            "Trichloroacetyl chloride (CCl3COCl)",
            "Tribromoacetyl bromide (CBr3COBr)",
            "Acetyl fluoride (CH3COF)",
            "Propionyl fluoride (C2H5COF)",
            "Butyryl fluoride (C3H7COF)",
            "Valeryl fluoride (C4H9COF)",
            "Isovaleryl fluoride ((CH3)2CHCH2COF)",
            "Benzoyl fluoride (C6H5COF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Acetyl bromide (CH3COBr)",
                "Propionyl chloride (C2H5COCl)",
                "Propionyl bromide (C2H5COBr)",
                "Butyryl chloride (C3H7COCl)",
                "Butyryl bromide (C3H7COBr)",
                "Valeryl chloride (C4H9COCl)",
                "Valeryl bromide (C4H9COBr)",
                "Isovaleryl chloride ((CH3)2CHCH2COCl)",
                "Isovaleryl bromide ((CH3)2CHCH2COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl bromide (C6H5COBr)",
                "Phenacyl chloride (C6H5CH2COCl)",
                "Phenacyl bromide (C6H5CH2COBr)",
                "Chloroacetyl chloride (ClCH2COCl)",
                "Bromoacetyl bromide (BrCH2COBr)",
                "Trichloroacetyl chloride (CCl3COCl)",
                "Tribromoacetyl bromide (CBr3COBr)",
                "Acetyl fluoride (CH3COF)",
                "Propionyl fluoride (C2H5COF)",
                "Butyryl fluoride (C3H7COF)",
                "Valeryl fluoride (C4H9COF)",
                "Isovaleryl fluoride ((CH3)2CHCH2COF)",
                "Benzoyl fluoride (C6H5COF)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Acetyl fluoride (CH3COF)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl fluoride (C6H5COF)",
                "Bromoacetyl bromide (BrCH2COBr)",
                "Butyryl bromide (C3H7COBr)",
                "Butyryl chloride (C3H7COCl)",
                "Butyryl fluoride (C3H7COF)",
                "Chloroacetyl chloride (ClCH2COCl)",
                "Isovaleryl bromide ((CH3)2CHCH2COBr)",
                "Isovaleryl chloride ((CH3)2CHCH2COCl)",
                "Isovaleryl fluoride ((CH3)2CHCH2COF)",
                "Phenacyl bromide (C6H5CH2COBr)",
                "Phenacyl chloride (C6H5CH2COCl)",
                "Propionyl bromide (C2H5COBr)",
                "Propionyl chloride (C2H5COCl)",
                "Propionyl fluoride (C2H5COF)",
                "Tribromoacetyl bromide (CBr3COBr)",
                "Trichloroacetyl chloride (CCl3COCl)",
                "Valeryl bromide (C4H9COBr)",
                "Valeryl chloride (C4H9COCl)",
                "Valeryl fluoride (C4H9COF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl fluoride (CH3COF)",
            "Acetyl chloride (CH3COCl)",
            "Acetyl bromide (CH3COBr)",
            "Acetyl iodide (CH3COI)",
            "Propionyl fluoride (C2H5COF)",
            "Propionyl chloride (C2H5COCl)",
            "Propionyl bromide (C2H5COBr)",
            "Propionyl iodide (C2H5COI)",
            "Butyryl fluoride (C3H7COF)",
            "Butyryl chloride (C3H7COCl)",
            "Butyryl bromide (C3H7COBr)",
            "Butyryl iodide (C3H7COI)",
            "Valeryl fluoride (C4H9COF)",
            "Valeryl chloride (C4H9COCl)",
            "Valeryl bromide (C4H9COBr)",
            "Valeryl iodide (C4H9COI)",
            "Benzoyl fluoride (C6H5COF)",
            "Benzoyl chloride (C6H5COCl)",
            "Benzoyl bromide (C6H5COBr)",
            "Benzoyl iodide (C6H5COI)",
            "Phenylacetyl fluoride (C6H5CH2COF)",
            "Phenylacetyl chloride (C6H5CH2COCl)",
            "Phenylacetyl bromide (C6H5CH2COBr)",
            "Phenylacetyl iodide (C6H5CH2COI)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl fluoride (CH3COF)",
                "Acetyl chloride (CH3COCl)",
                "Acetyl bromide (CH3COBr)",
                "Acetyl iodide (CH3COI)",
                "Propionyl fluoride (C2H5COF)",
                "Propionyl chloride (C2H5COCl)",
                "Propionyl bromide (C2H5COBr)",
                "Propionyl iodide (C2H5COI)",
                "Butyryl fluoride (C3H7COF)",
                "Butyryl chloride (C3H7COCl)",
                "Butyryl bromide (C3H7COBr)",
                "Butyryl iodide (C3H7COI)",
                "Valeryl fluoride (C4H9COF)",
                "Valeryl chloride (C4H9COCl)",
                "Valeryl bromide (C4H9COBr)",
                "Valeryl iodide (C4H9COI)",
                "Benzoyl fluoride (C6H5COF)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl iodide (C6H5COI)",
                "Phenylacetyl fluoride (C6H5CH2COF)",
                "Phenylacetyl chloride (C6H5CH2COCl)",
                "Phenylacetyl bromide (C6H5CH2COBr)",
                "Phenylacetyl iodide (C6H5CH2COI)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Acetyl fluoride (CH3COF)",
                "Acetyl iodide (CH3COI)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl fluoride (C6H5COF)",
                "Benzoyl iodide (C6H5COI)",
                "Butyryl bromide (C3H7COBr)",
                "Butyryl chloride (C3H7COCl)",
                "Butyryl fluoride (C3H7COF)",
                "Butyryl iodide (C3H7COI)",
                "Phenylacetyl bromide (C6H5CH2COBr)",
                "Phenylacetyl chloride (C6H5CH2COCl)",
                "Phenylacetyl fluoride (C6H5CH2COF)",
                "Phenylacetyl iodide (C6H5CH2COI)",
                "Propionyl bromide (C2H5COBr)",
                "Propionyl chloride (C2H5COCl)",
                "Propionyl fluoride (C2H5COF)",
                "Propionyl iodide (C2H5COI)",
                "Valeryl bromide (C4H9COBr)",
                "Valeryl chloride (C4H9COCl)",
                "Valeryl fluoride (C4H9COF)",
                "Valeryl iodide (C4H9COI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Acetyl bromide (AcBr)",
            "Acetyl iodide (AcI)",
            "Propionyl chloride (PrCl)",
            "Propionyl bromide (PrBr)",
            "Butyryl chloride (BuCl)",
            "Butyryl bromide (BuBr)",
            "Isobutyryl chloride (iBuCl)",
            "Isobutyryl bromide (iBuBr)",
            "Benzoyl chloride (BzCl)",
            "Benzoyl bromide (BzBr)",
            "Benzoyl iodide (BzI)",
            "Formyl chloride (HCOCl)",
            "Formyl bromide (HCOBr)",
            "Succinyl chloride (SucCl)",
            "Succinyl bromide (SucBr)",
            "Adipoyl chloride (AdCl)",
            "Adipoyl bromide (AdBr)",
            "Sebacoyl chloride (SebCl)",
            "Sebacoyl bromide (SebBr)",
            "2-Methylpropionyl chloride (MPCl)",
            "2-Methylpropionyl bromide (MPBr)",
            "Cyclopropanecarbonyl chloride (CPCl)",
            "Cyclopropanecarbonyl bromide (CPBr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Acetyl bromide (AcBr)",
                "Acetyl iodide (AcI)",
                "Propionyl chloride (PrCl)",
                "Propionyl bromide (PrBr)",
                "Butyryl chloride (BuCl)",
                "Butyryl bromide (BuBr)",
                "Isobutyryl chloride (iBuCl)",
                "Isobutyryl bromide (iBuBr)",
                "Benzoyl chloride (BzCl)",
                "Benzoyl bromide (BzBr)",
                "Benzoyl iodide (BzI)",
                "Formyl chloride (HCOCl)",
                "Formyl bromide (HCOBr)",
                "Succinyl chloride (SucCl)",
                "Succinyl bromide (SucBr)",
                "Adipoyl chloride (AdCl)",
                "Adipoyl bromide (AdBr)",
                "Sebacoyl chloride (SebCl)",
                "Sebacoyl bromide (SebBr)",
                "2-Methylpropionyl chloride (MPCl)",
                "2-Methylpropionyl bromide (MPBr)",
                "Cyclopropanecarbonyl chloride (CPCl)",
                "Cyclopropanecarbonyl bromide (CPBr)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Methylpropionyl bromide (MPBr)",
                "2-Methylpropionyl chloride (MPCl)",
                "Acetyl bromide (AcBr)",
                "Acetyl chloride (AcCl)",
                "Acetyl iodide (AcI)",
                "Adipoyl bromide (AdBr)",
                "Adipoyl chloride (AdCl)",
                "Benzoyl bromide (BzBr)",
                "Benzoyl chloride (BzCl)",
                "Benzoyl iodide (BzI)",
                "Butyryl bromide (BuBr)",
                "Butyryl chloride (BuCl)",
                "Cyclopropanecarbonyl bromide (CPBr)",
                "Cyclopropanecarbonyl chloride (CPCl)",
                "Formyl bromide (HCOBr)",
                "Formyl chloride (HCOCl)",
                "Isobutyryl bromide (iBuBr)",
                "Isobutyryl chloride (iBuCl)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)",
                "Sebacoyl bromide (SebBr)",
                "Sebacoyl chloride (SebCl)",
                "Succinyl bromide (SucBr)",
                "Succinyl chloride (SucCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Benzoyl chloride (C6H5COCl)",
            "Propionyl chloride (C2H5COCl)",
            "Butyryl chloride (C3H7COCl)",
            "Valeryl chloride (C4H9COCl)",
            "Caproyl chloride (C5H11COCl)",
            "Heptanoyl chloride (C6H13COCl)",
            "Octanoyl chloride (C7H15COCl)",
            "Nonanoyl chloride (C8H17COCl)",
            "Decanoyl chloride (C9H19COCl)",
            "Lauryl chloride (C11H23COCl)",
            "Myristoyl chloride (C13H27COCl)",
            "Palmitoyl chloride (C15H31COCl)",
            "Stearoyl chloride (C17H35COCl)",
            "Acryloyl chloride (C3H3ClO)",
            "Methacryloyl chloride (C4H5ClO)",
            "Trifluoroacetyl chloride (C2ClF3O)",
            "Chloroacetyl chloride (C2H2Cl2O)",
            "Bromoacetyl chloride (C2H2BrClO)",
            "Iodoacetyl chloride (C2H2IClO)",
            "Trichloroacetyl chloride (C2Cl3O)",
            "Pentafluorobenzoyl chloride (C7ClF5O)",
            "Perfluorobutyryl chloride (C4ClF7O)",
            "Tosyl chloride (C7H7ClO2S)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Propionyl chloride (C2H5COCl)",
                "Butyryl chloride (C3H7COCl)",
                "Valeryl chloride (C4H9COCl)",
                "Caproyl chloride (C5H11COCl)",
                "Heptanoyl chloride (C6H13COCl)",
                "Octanoyl chloride (C7H15COCl)",
                "Nonanoyl chloride (C8H17COCl)",
                "Decanoyl chloride (C9H19COCl)",
                "Lauryl chloride (C11H23COCl)",
                "Myristoyl chloride (C13H27COCl)",
                "Palmitoyl chloride (C15H31COCl)",
                "Stearoyl chloride (C17H35COCl)",
                "Acryloyl chloride (C3H3ClO)",
                "Methacryloyl chloride (C4H5ClO)",
                "Trifluoroacetyl chloride (C2ClF3O)",
                "Chloroacetyl chloride (C2H2Cl2O)",
                "Bromoacetyl chloride (C2H2BrClO)",
                "Iodoacetyl chloride (C2H2IClO)",
                "Trichloroacetyl chloride (C2Cl3O)",
                "Pentafluorobenzoyl chloride (C7ClF5O)",
                "Perfluorobutyryl chloride (C4ClF7O)",
                "Tosyl chloride (C7H7ClO2S)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Acryloyl chloride (C3H3ClO)",
                "Benzoyl chloride (C6H5COCl)",
                "Bromoacetyl chloride (C2H2BrClO)",
                "Butyryl chloride (C3H7COCl)",
                "Caproyl chloride (C5H11COCl)",
                "Chloroacetyl chloride (C2H2Cl2O)",
                "Decanoyl chloride (C9H19COCl)",
                "Heptanoyl chloride (C6H13COCl)",
                "Iodoacetyl chloride (C2H2IClO)",
                "Lauryl chloride (C11H23COCl)",
                "Methacryloyl chloride (C4H5ClO)",
                "Myristoyl chloride (C13H27COCl)",
                "Nonanoyl chloride (C8H17COCl)",
                "Octanoyl chloride (C7H15COCl)",
                "Palmitoyl chloride (C15H31COCl)",
                "Pentafluorobenzoyl chloride (C7ClF5O)",
                "Perfluorobutyryl chloride (C4ClF7O)",
                "Propionyl chloride (C2H5COCl)",
                "Stearoyl chloride (C17H35COCl)",
                "Tosyl chloride (C7H7ClO2S)",
                "Trichloroacetyl chloride (C2Cl3O)",
                "Trifluoroacetyl chloride (C2ClF3O)",
                "Valeryl chloride (C4H9COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Benzoyl chloride (BzCl)",
            "Propionyl chloride (PrCl)",
            "Butyryl chloride (BuCl)",
            "Valeryl chloride (ValCl)",
            "Caproyl chloride (CapCl)",
            "Octanoyl chloride (OctCl)",
            "Dodecanoyl chloride (DodecCl)",
            "Palmitoyl chloride (PalCl)",
            "Stearoyl chloride (SteCl)",
            "Chloroacetyl chloride (ClAcCl)",
            "Trichloroacetyl chloride (Cl3CCl)",
            "2-Furoyl chloride (FurCl)",
            "3-Phenylpropionyl chloride (PhPrCl)",
            "4-Methylbenzoyl chloride (pMeBzCl)",
            "2-Pyridylacetyl chloride (2-PyAcCl)",
            "3-Butenoyl chloride (3-BuCl)",
            "4-Butyryl chloride (4-BuCl)",
            "2-Isobutyryl chloride (iBuCl)",
            "Cyclohexanecarbonyl chloride (CycCl)",
            "Arachidoyl chloride (ArachCl)",
            "Cinnamoyl chloride (CinnCl)",
            "Hexanoyl chloride (HexCl)",
            "2-Phenylpropionyl chloride (2-PhPrCl)",
            "2-Methylbutyryl chloride (2-MeBuCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Benzoyl chloride (BzCl)",
                "Propionyl chloride (PrCl)",
                "Butyryl chloride (BuCl)",
                "Valeryl chloride (ValCl)",
                "Caproyl chloride (CapCl)",
                "Octanoyl chloride (OctCl)",
                "Dodecanoyl chloride (DodecCl)",
                "Palmitoyl chloride (PalCl)",
                "Stearoyl chloride (SteCl)",
                "Chloroacetyl chloride (ClAcCl)",
                "Trichloroacetyl chloride (Cl3CCl)",
                "2-Furoyl chloride (FurCl)",
                "3-Phenylpropionyl chloride (PhPrCl)",
                "4-Methylbenzoyl chloride (pMeBzCl)",
                "2-Pyridylacetyl chloride (2-PyAcCl)",
                "3-Butenoyl chloride (3-BuCl)",
                "4-Butyryl chloride (4-BuCl)",
                "2-Isobutyryl chloride (iBuCl)",
                "Cyclohexanecarbonyl chloride (CycCl)",
                "Arachidoyl chloride (ArachCl)",
                "Cinnamoyl chloride (CinnCl)",
                "Hexanoyl chloride (HexCl)",
                "2-Phenylpropionyl chloride (2-PhPrCl)"
            ],
            "mismatches": [
                "2-Methylbutyryl chloride (2-MeBuCl)"
            ],
            "true_referents": [
                "2-Furoyl chloride (FurCl)",
                "2-Isobutyryl chloride (iBuCl)",
                "2-Phenylpropionyl chloride (2-PhPrCl)",
                "2-Pyridylacetyl chloride (2-PyAcCl)",
                "3-Butenoyl chloride (3-BuCl)",
                "3-Phenylpropionyl chloride (PhPrCl)",
                "4-Butyryl chloride (4-BuCl)",
                "4-Methylbenzoyl chloride (pMeBzCl)",
                "Acetyl chloride (AcCl)",
                "Arachidoyl chloride (ArachCl)",
                "Benzoyl chloride (BzCl)",
                "Butyryl chloride (BuCl)",
                "Caproyl chloride (CapCl)",
                "Chloroacetyl chloride (ClAcCl)",
                "Cinnamoyl chloride (CinnCl)",
                "Cyclohexanecarbonyl chloride (CycCl)",
                "Dodecanoyl chloride (DodecCl)",
                "Hexanoyl chloride (HexCl)",
                "Octanoyl chloride (OctCl)",
                "Palmitoyl chloride (PalCl)",
                "Propionyl chloride (PrCl)",
                "Stearoyl chloride (SteCl)",
                "Trichloroacetyl chloride (Cl3CCl)",
                "Valeryl chloride (ValCl)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Propionyl chloride (CH3CH2COCl)",
            "Butyryl chloride (CH3(CH2)2COCl)",
            "Pivaloyl chloride ((CH3)3CCOCl)",
            "Benzoyl chloride (C6H5COCl)",
            "Acryloyl chloride (CH2=CHCOCl)",
            "Methacryloyl chloride (CH2=C(CH3)COCl)",
            "Hexanoyl chloride (CH3(CH2)4COCl)",
            "Octanoyl chloride (CH3(CH2)6COCl)",
            "Decanoyl chloride (CH3(CH2)8COCl)",
            "Dodecanoyl chloride (CH3(CH2)10COCl)",
            "Stearoyl chloride (CH3(CH2)16COCl)",
            "Myristoyl chloride (CH3(CH2)12COCl)",
            "Palmitoyl chloride (CH3(CH2)14COCl)",
            "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
            "Linoleoyl chloride (CH3(CH2)4CH=CHCH2CH=CH(CH2)7COCl)",
            "Arachidoyl chloride (CH3(CH2)18COCl)",
            "Behenoyl chloride (CH3(CH2)20COCl)",
            "Lignoceroyl chloride (CH3(CH2)22COCl)",
            "Cerotoyl chloride (CH3(CH2)24COCl)",
            "Melissyl chloride (CH3(CH2)28COCl)",
            "Lacceryl chloride (CH3(CH2)30COCl)",
            "Ceryl chloride (CH3(CH2)24COCl)",
            "Gedanoyl chloride (CH3(CH2)26COCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Propionyl chloride (CH3CH2COCl)",
                "Butyryl chloride (CH3(CH2)2COCl)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Methacryloyl chloride (CH2=C(CH3)COCl)",
                "Hexanoyl chloride (CH3(CH2)4COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Decanoyl chloride (CH3(CH2)8COCl)",
                "Dodecanoyl chloride (CH3(CH2)10COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Myristoyl chloride (CH3(CH2)12COCl)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Linoleoyl chloride (CH3(CH2)4CH=CHCH2CH=CH(CH2)7COCl)",
                "Arachidoyl chloride (CH3(CH2)18COCl)",
                "Behenoyl chloride (CH3(CH2)20COCl)",
                "Lignoceroyl chloride (CH3(CH2)22COCl)",
                "Cerotoyl chloride (CH3(CH2)24COCl)",
                "Ceryl chloride (CH3(CH2)24COCl)"
            ],
            "mismatches": [
                "Melissyl chloride (CH3(CH2)28COCl)",
                "Lacceryl chloride (CH3(CH2)30COCl)",
                "Gedanoyl chloride (CH3(CH2)26COCl)"
            ],
            "true_referents": [
                "Acetyl chloride (CH3COCl)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Arachidoyl chloride (CH3(CH2)18COCl)",
                "Behenoyl chloride (CH3(CH2)20COCl)",
                "Benzoyl chloride (C6H5COCl)",
                "Butyryl chloride (CH3(CH2)2COCl)",
                "Cerotoyl chloride (CH3(CH2)24COCl)",
                "Ceryl chloride (CH3(CH2)24COCl)",
                "Decanoyl chloride (CH3(CH2)8COCl)",
                "Dodecanoyl chloride (CH3(CH2)10COCl)",
                "Gedanoyl chloride (CH3(CH2)26COCl)",
                "Hexanoyl chloride (CH3(CH2)4COCl)",
                "Lacceryl chloride (CH3(CH2)30COCl)",
                "Lignoceroyl chloride (CH3(CH2)22COCl)",
                "Linoleoyl chloride (CH3(CH2)4CH=CHCH2CH=CH(CH2)7COCl)",
                "Melissyl chloride (CH3(CH2)28COCl)",
                "Methacryloyl chloride (CH2=C(CH3)COCl)",
                "Myristoyl chloride (CH3(CH2)12COCl)",
                "Octanoyl chloride (CH3(CH2)6COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Propionyl chloride (CH3CH2COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride",
            "Benzoyl chloride",
            "Propionyl chloride",
            "Butyryl chloride",
            "Caproyl chloride",
            "Lauric chloride",
            "Palmitoyl chloride",
            "Stearoyl chloride",
            "Myristoyl chloride",
            "Arachidoyl chloride",
            "Oleoyl chloride",
            "Linoleoyl chloride",
            "Linolenoyl chloride",
            "Eicosanoyl chloride",
            "Docosanoyl chloride",
            "Tetradecanoyl chloride",
            "Hexadecanoyl chloride",
            "Octadecanoyl chloride",
            "Nonadecanoyl chloride",
            "Icosanoyl chloride",
            "Heneicosanoyl chloride",
            "Tricosanoyl chloride",
            "Tetracosanoyl chloride",
            "Pentacosanoyl chloride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride",
                "Arachidoyl chloride",
                "Benzoyl chloride",
                "Butyryl chloride",
                "Caproyl chloride",
                "Docosanoyl chloride",
                "Eicosanoyl chloride",
                "Heneicosanoyl chloride",
                "Hexadecanoyl chloride",
                "Icosanoyl chloride",
                "Lauric chloride",
                "Linolenoyl chloride",
                "Linoleoyl chloride",
                "Myristoyl chloride",
                "Nonadecanoyl chloride",
                "Octadecanoyl chloride",
                "Oleoyl chloride",
                "Palmitoyl chloride",
                "Pentacosanoyl chloride",
                "Propionyl chloride",
                "Stearoyl chloride",
                "Tetracosanoyl chloride",
                "Tetradecanoyl chloride",
                "Tricosanoyl chloride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl chloride",
                "Arachidoyl chloride",
                "Benzoyl chloride",
                "Butyryl chloride",
                "Caproyl chloride",
                "Docosanoyl chloride",
                "Eicosanoyl chloride",
                "Heneicosanoyl chloride",
                "Hexadecanoyl chloride",
                "Icosanoyl chloride",
                "Lauric chloride",
                "Linolenoyl chloride",
                "Linoleoyl chloride",
                "Myristoyl chloride",
                "Nonadecanoyl chloride",
                "Octadecanoyl chloride",
                "Oleoyl chloride",
                "Palmitoyl chloride",
                "Pentacosanoyl chloride",
                "Propionyl chloride",
                "Stearoyl chloride",
                "Tetracosanoyl chloride",
                "Tetradecanoyl chloride",
                "Tricosanoyl chloride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH\u2083COCl)",
            "Benzoyl chloride (C\u2086H\u2085COCl)",
            "Propionyl chloride (CH\u2083CH\u2082COCl)",
            "Butyryl chloride (CH\u2083CH\u2082CH\u2082COCl)",
            "Pivaloyl chloride (CH\u2083\u2083CCOCl)",
            "Formyl chloride (HCOCl)",
            "Succinyl chloride (CH\u2083CH\u2082COClCOCH\u2082CH\u2083)",
            "Malonyl chloride (CH\u2082(COCl)\u2082)",
            "Phthaloyl chloride (C\u2086H\u2084(COCl)\u2082)",
            "2,4-Dichlorobenzoyl chloride",
            "Hexanoyl chloride (C\u2085H\u2081\u2081COCl)",
            "Valeryl chloride (C\u2084H\u2089COCl)",
            "Isobutyryl chloride (CH\u2083CH(CH\u2083)COCl)",
            "Levulinoyl chloride (CH\u2083C(O)CH\u2082CH\u2082COCl)",
            "Cyclohexanoyl chloride (C\u2086H\u2081\u2081COCl)",
            "Octanoyl chloride (C\u2087H\u2081\u2085COCl)",
            "Dodecanoyl chloride (C\u2081\u2081H\u2082\u2083COCl)",
            "Phenylacetyl chloride (C\u2086H\u2085CH\u2082COCl)",
            "Pivaloyl chloride (tert-Butyryl chloride, (CH\u2083)\u2083CCOCl)",
            "Methyl chloroacetyl chloride (CH\u2083CClCOCl)",
            "Chloroacyl chloride (ClCH\u2082COCl)",
            "2-Chlorobenzoyl chloride",
            "4-Chlorobenzoyl chloride",
            "3,5-Dichlorobenzoyl chloride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH\u2083COCl)",
                "Benzoyl chloride (C\u2086H\u2085COCl)",
                "Propionyl chloride (CH\u2083CH\u2082COCl)",
                "Butyryl chloride (CH\u2083CH\u2082CH\u2082COCl)",
                "Pivaloyl chloride (CH\u2083\u2083CCOCl)",
                "Formyl chloride (HCOCl)",
                "Succinyl chloride (CH\u2083CH\u2082COClCOCH\u2082CH\u2083)",
                "Malonyl chloride (CH\u2082(COCl)\u2082)",
                "Phthaloyl chloride (C\u2086H\u2084(COCl)\u2082)",
                "2,4-Dichlorobenzoyl chloride",
                "Hexanoyl chloride (C\u2085H\u2081\u2081COCl)",
                "Valeryl chloride (C\u2084H\u2089COCl)",
                "Isobutyryl chloride (CH\u2083CH(CH\u2083)COCl)",
                "Levulinoyl chloride (CH\u2083C(O)CH\u2082CH\u2082COCl)",
                "Cyclohexanoyl chloride (C\u2086H\u2081\u2081COCl)",
                "Octanoyl chloride (C\u2087H\u2081\u2085COCl)",
                "Dodecanoyl chloride (C\u2081\u2081H\u2082\u2083COCl)",
                "Phenylacetyl chloride (C\u2086H\u2085CH\u2082COCl)",
                "Pivaloyl chloride (tert-Butyryl chloride, (CH\u2083)\u2083CCOCl)",
                "Methyl chloroacetyl chloride (CH\u2083CClCOCl)",
                "Chloroacyl chloride (ClCH\u2082COCl)",
                "2-Chlorobenzoyl chloride",
                "4-Chlorobenzoyl chloride",
                "3,5-Dichlorobenzoyl chloride"
            ],
            "mismatches": [],
            "true_referents": [
                "2,4-Dichlorobenzoyl chloride",
                "2-Chlorobenzoyl chloride",
                "3,5-Dichlorobenzoyl chloride",
                "4-Chlorobenzoyl chloride",
                "Acetyl chloride (CH\u2083COCl)",
                "Benzoyl chloride (C\u2086H\u2085COCl)",
                "Butyryl chloride (CH\u2083CH\u2082CH\u2082COCl)",
                "Chloroacyl chloride (ClCH\u2082COCl)",
                "Cyclohexanoyl chloride (C\u2086H\u2081\u2081COCl)",
                "Dodecanoyl chloride (C\u2081\u2081H\u2082\u2083COCl)",
                "Formyl chloride (HCOCl)",
                "Hexanoyl chloride (C\u2085H\u2081\u2081COCl)",
                "Isobutyryl chloride (CH\u2083CH(CH\u2083)COCl)",
                "Levulinoyl chloride (CH\u2083C(O)CH\u2082CH\u2082COCl)",
                "Malonyl chloride (CH\u2082(COCl)\u2082)",
                "Methyl chloroacetyl chloride (CH\u2083CClCOCl)",
                "Octanoyl chloride (C\u2087H\u2081\u2085COCl)",
                "Phenylacetyl chloride (C\u2086H\u2085CH\u2082COCl)",
                "Phthaloyl chloride (C\u2086H\u2084(COCl)\u2082)",
                "Pivaloyl chloride (CH\u2083\u2083CCOCl)",
                "Pivaloyl chloride (tert-Butyryl chloride, (CH\u2083)\u2083CCOCl)",
                "Propionyl chloride (CH\u2083CH\u2082COCl)",
                "Succinyl chloride (CH\u2083CH\u2082COClCOCH\u2082CH\u2083)",
                "Valeryl chloride (C\u2084H\u2089COCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Propionyl bromide (CH3CH2COBr)",
            "Benzoyl fluoride (C6H5COF)",
            "Butyryl iodide (CH3CH2CH2COI)",
            "Acryloyl chloride (CH2=CHCOCl)",
            "Oxalyl chloride ((COCl)2)",
            "Palmitoyl chloride (CH3(CH2)14COCl)",
            "Pivaloyl chloride ((CH3)3CCOCl)",
            "Malonyl dichloride (ClCOCH2COCl)",
            "Succinyl chloride (ClCOCH2CH2COCl)",
            "Phthaloyl chloride (C6H4(COCl)2)",
            "Cinnamoyl chloride (C6H5CH=CHCOCl)",
            "Lauroyl chloride (CH3(CH2)10COCl)",
            "Stearoyl chloride (CH3(CH2)16COCl)",
            "Crotonoyl chloride (CH3CH=CHCOCl)",
            "Adipoyl chloride (ClCO(CH2)4COCl)",
            "Fumaryl chloride (ClCOCH=CHCOCl)",
            "Isophthaloyl dichloride (C6H4-1,3-(COCl)2)",
            "Terephthaloyl dichloride (C6H4-1,4-(COCl)2)",
            "Myristoyl chloride (CH3(CH2)12COCl)",
            "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
            "Acetyl bromide (CH3COBr)",
            "Propionyl chloride (CH3CH2COCl)",
            "Butyryl chloride (CH3CH2CH2COCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Propionyl bromide (CH3CH2COBr)",
                "Benzoyl fluoride (C6H5COF)",
                "Butyryl iodide (CH3CH2CH2COI)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Oxalyl chloride ((COCl)2)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Malonyl dichloride (ClCOCH2COCl)",
                "Succinyl chloride (ClCOCH2CH2COCl)",
                "Phthaloyl chloride (C6H4(COCl)2)",
                "Cinnamoyl chloride (C6H5CH=CHCOCl)",
                "Lauroyl chloride (CH3(CH2)10COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Crotonoyl chloride (CH3CH=CHCOCl)",
                "Adipoyl chloride (ClCO(CH2)4COCl)",
                "Fumaryl chloride (ClCOCH=CHCOCl)",
                "Isophthaloyl dichloride (C6H4-1,3-(COCl)2)",
                "Terephthaloyl dichloride (C6H4-1,4-(COCl)2)",
                "Myristoyl chloride (CH3(CH2)12COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Acetyl bromide (CH3COBr)",
                "Propionyl chloride (CH3CH2COCl)",
                "Butyryl chloride (CH3CH2CH2COCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Acryloyl chloride (CH2=CHCOCl)",
                "Adipoyl chloride (ClCO(CH2)4COCl)",
                "Benzoyl fluoride (C6H5COF)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Butyryl iodide (CH3CH2CH2COI)",
                "Cinnamoyl chloride (C6H5CH=CHCOCl)",
                "Crotonoyl chloride (CH3CH=CHCOCl)",
                "Fumaryl chloride (ClCOCH=CHCOCl)",
                "Isophthaloyl dichloride (C6H4-1,3-(COCl)2)",
                "Lauroyl chloride (CH3(CH2)10COCl)",
                "Malonyl dichloride (ClCOCH2COCl)",
                "Myristoyl chloride (CH3(CH2)12COCl)",
                "Oleoyl chloride (CH3(CH2)7CH=CH(CH2)7COCl)",
                "Oxalyl chloride ((COCl)2)",
                "Palmitoyl chloride (CH3(CH2)14COCl)",
                "Phthaloyl chloride (C6H4(COCl)2)",
                "Pivaloyl chloride ((CH3)3CCOCl)",
                "Propionyl bromide (CH3CH2COBr)",
                "Propionyl chloride (CH3CH2COCl)",
                "Stearoyl chloride (CH3(CH2)16COCl)",
                "Succinyl chloride (ClCOCH2CH2COCl)",
                "Terephthaloyl dichloride (C6H4-1,4-(COCl)2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Acetyl bromide (CH3COBr)",
            "Acetyl iodide (CH3COI)",
            "Propionyl chloride (CH3CH2COCl)",
            "Propionyl bromide (CH3CH2COBr)",
            "Propionyl iodide (CH3CH2COI)",
            "Butyryl chloride (CH3CH2CH2COCl)",
            "Butyryl bromide (CH3CH2CH2COBr)",
            "Butyryl iodide (CH3CH2CH2COI)",
            "Benzoyl chloride (C6H5COCl)",
            "Benzoyl bromide (C6H5COBr)",
            "Benzoyl iodide (C6H5COI)",
            "Oxalyl chloride ((COCl)2)",
            "Oxalyl bromide ((COBr)2)",
            "Succinyl chloride ((CH2COCl)2)",
            "Glutaryl chloride ((CH2)2COCl)2)",
            "Adipoyl chloride ((CH2)3COCl)2)",
            "Sebacoyl chloride ((CH2)8(COCl)2)",
            "Terephthaloyl chloride (C6H4(COCl)2)",
            "Isophthaloyl chloride (C6H4(COCl)2)",
            "Phthaloyl chloride (C6H4(COCl)2)",
            "Malonyl chloride (CH2(COCl)2)",
            "Fumaryl chloride ((CH)2(COCl)2)",
            "Crotonyl chloride (CH3CH=CHCOCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Acetyl bromide (CH3COBr)",
                "Acetyl iodide (CH3COI)",
                "Propionyl chloride (CH3CH2COCl)",
                "Propionyl bromide (CH3CH2COBr)",
                "Propionyl iodide (CH3CH2COI)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Butyryl bromide (CH3CH2CH2COBr)",
                "Butyryl iodide (CH3CH2CH2COI)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl iodide (C6H5COI)",
                "Oxalyl chloride ((COCl)2)",
                "Oxalyl bromide ((COBr)2)",
                "Succinyl chloride ((CH2COCl)2)",
                "Glutaryl chloride ((CH2)2COCl)2)",
                "Adipoyl chloride ((CH2)3COCl)2)",
                "Sebacoyl chloride ((CH2)8(COCl)2)",
                "Terephthaloyl chloride (C6H4(COCl)2)",
                "Isophthaloyl chloride (C6H4(COCl)2)",
                "Phthaloyl chloride (C6H4(COCl)2)",
                "Malonyl chloride (CH2(COCl)2)",
                "Fumaryl chloride ((CH)2(COCl)2)",
                "Crotonyl chloride (CH3CH=CHCOCl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Acetyl iodide (CH3COI)",
                "Adipoyl chloride ((CH2)3COCl)2)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl iodide (C6H5COI)",
                "Butyryl bromide (CH3CH2CH2COBr)",
                "Butyryl chloride (CH3CH2CH2COCl)",
                "Butyryl iodide (CH3CH2CH2COI)",
                "Crotonyl chloride (CH3CH=CHCOCl)",
                "Fumaryl chloride ((CH)2(COCl)2)",
                "Glutaryl chloride ((CH2)2COCl)2)",
                "Isophthaloyl chloride (C6H4(COCl)2)",
                "Malonyl chloride (CH2(COCl)2)",
                "Oxalyl bromide ((COBr)2)",
                "Oxalyl chloride ((COCl)2)",
                "Phthaloyl chloride (C6H4(COCl)2)",
                "Propionyl bromide (CH3CH2COBr)",
                "Propionyl chloride (CH3CH2COCl)",
                "Propionyl iodide (CH3CH2COI)",
                "Sebacoyl chloride ((CH2)8(COCl)2)",
                "Succinyl chloride ((CH2COCl)2)",
                "Terephthaloyl chloride (C6H4(COCl)2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (CH3COCl)",
            "Acetyl bromide (CH3COBr)",
            "Acetyl fluoride (CH3COF)",
            "Acetyl iodide (CH3COI)",
            "Propionyl chloride (C2H5COCl)",
            "Propionyl bromide (C2H5COBr)",
            "Propionyl fluoride (C2H5COF)",
            "Propionyl iodide (C2H5COI)",
            "Butyryl chloride (C3H7COCl)",
            "Butyryl bromide (C3H7COBr)",
            "Butyryl fluoride (C3H7COF)",
            "Butyryl iodide (C3H7COI)",
            "Benzoyl chloride (C6H5COCl)",
            "Benzoyl bromide (C6H5COBr)",
            "Benzoyl fluoride (C6H5COF)",
            "Benzoyl iodide (C6H5COI)",
            "Trifluoroacetyl chloride (CF3COCl)",
            "Trifluoroacetyl bromide (CF3COBr)",
            "Trifluoroacetyl fluoride (CF3COF)",
            "Trifluoroacetyl iodide (CF3COI)",
            "Trichloroacetyl chloride (CCl3COCl)",
            "Trichloroacetyl bromide (CCl3COBr)",
            "Trichloroacetyl fluoride (CCl3COF)",
            "Trichloroacetyl iodide (CCl3COI)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (CH3COCl)",
                "Acetyl bromide (CH3COBr)",
                "Acetyl fluoride (CH3COF)",
                "Acetyl iodide (CH3COI)",
                "Propionyl chloride (C2H5COCl)",
                "Propionyl bromide (C2H5COBr)",
                "Propionyl fluoride (C2H5COF)",
                "Propionyl iodide (C2H5COI)",
                "Butyryl chloride (C3H7COCl)",
                "Butyryl bromide (C3H7COBr)",
                "Butyryl fluoride (C3H7COF)",
                "Butyryl iodide (C3H7COI)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl fluoride (C6H5COF)",
                "Benzoyl iodide (C6H5COI)",
                "Trifluoroacetyl chloride (CF3COCl)",
                "Trifluoroacetyl bromide (CF3COBr)",
                "Trifluoroacetyl fluoride (CF3COF)",
                "Trifluoroacetyl iodide (CF3COI)",
                "Trichloroacetyl chloride (CCl3COCl)",
                "Trichloroacetyl bromide (CCl3COBr)",
                "Trichloroacetyl fluoride (CCl3COF)",
                "Trichloroacetyl iodide (CCl3COI)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (CH3COBr)",
                "Acetyl chloride (CH3COCl)",
                "Acetyl fluoride (CH3COF)",
                "Acetyl iodide (CH3COI)",
                "Benzoyl bromide (C6H5COBr)",
                "Benzoyl chloride (C6H5COCl)",
                "Benzoyl fluoride (C6H5COF)",
                "Benzoyl iodide (C6H5COI)",
                "Butyryl bromide (C3H7COBr)",
                "Butyryl chloride (C3H7COCl)",
                "Butyryl fluoride (C3H7COF)",
                "Butyryl iodide (C3H7COI)",
                "Propionyl bromide (C2H5COBr)",
                "Propionyl chloride (C2H5COCl)",
                "Propionyl fluoride (C2H5COF)",
                "Propionyl iodide (C2H5COI)",
                "Trichloroacetyl bromide (CCl3COBr)",
                "Trichloroacetyl chloride (CCl3COCl)",
                "Trichloroacetyl fluoride (CCl3COF)",
                "Trichloroacetyl iodide (CCl3COI)",
                "Trifluoroacetyl bromide (CF3COBr)",
                "Trifluoroacetyl chloride (CF3COCl)",
                "Trifluoroacetyl fluoride (CF3COF)",
                "Trifluoroacetyl iodide (CF3COI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (AcCl)",
            "Acetyl bromide (AcBr)",
            "Propionyl chloride (PrCl)",
            "Propionyl bromide (PrBr)",
            "Butyryl chloride (BuCl)",
            "Butyryl bromide (BuBr)",
            "Valeryl chloride (VaCl)",
            "Valeryl bromide (VaBr)",
            "Pivaloyl chloride (PivCl)",
            "Pivaloyl bromide (PivBr)",
            "Hexanoyl chloride (HxCl)",
            "Hexanoyl bromide (HxBr)",
            "Heptanoyl chloride (HpCl)",
            "Heptanoyl bromide (HpBr)",
            "Octanoyl chloride (OcCl)",
            "Octanoyl bromide (OcBr)",
            "Nonanoyl chloride (NoCl)",
            "Nonanoyl bromide (NoBr)",
            "Decanoyl chloride (DeCl)",
            "Decanoyl bromide (DeBr)",
            "Lauroyl chloride (LaCl)",
            "Lauroyl bromide (LaBr)",
            "Myristoyl chloride (MyCl)",
            "Myristoyl bromide (MyBr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (AcCl)",
                "Acetyl bromide (AcBr)",
                "Propionyl chloride (PrCl)",
                "Propionyl bromide (PrBr)",
                "Butyryl chloride (BuCl)",
                "Butyryl bromide (BuBr)",
                "Valeryl chloride (VaCl)",
                "Valeryl bromide (VaBr)",
                "Pivaloyl chloride (PivCl)",
                "Pivaloyl bromide (PivBr)",
                "Hexanoyl chloride (HxCl)",
                "Hexanoyl bromide (HxBr)",
                "Heptanoyl chloride (HpCl)",
                "Heptanoyl bromide (HpBr)",
                "Octanoyl chloride (OcCl)",
                "Octanoyl bromide (OcBr)",
                "Nonanoyl chloride (NoCl)",
                "Nonanoyl bromide (NoBr)",
                "Decanoyl chloride (DeCl)",
                "Decanoyl bromide (DeBr)",
                "Lauroyl chloride (LaCl)",
                "Lauroyl bromide (LaBr)",
                "Myristoyl chloride (MyCl)",
                "Myristoyl bromide (MyBr)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl bromide (AcBr)",
                "Acetyl chloride (AcCl)",
                "Butyryl bromide (BuBr)",
                "Butyryl chloride (BuCl)",
                "Decanoyl bromide (DeBr)",
                "Decanoyl chloride (DeCl)",
                "Heptanoyl bromide (HpBr)",
                "Heptanoyl chloride (HpCl)",
                "Hexanoyl bromide (HxBr)",
                "Hexanoyl chloride (HxCl)",
                "Lauroyl bromide (LaBr)",
                "Lauroyl chloride (LaCl)",
                "Myristoyl bromide (MyBr)",
                "Myristoyl chloride (MyCl)",
                "Nonanoyl bromide (NoBr)",
                "Nonanoyl chloride (NoCl)",
                "Octanoyl bromide (OcBr)",
                "Octanoyl chloride (OcCl)",
                "Pivaloyl bromide (PivBr)",
                "Pivaloyl chloride (PivCl)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)",
                "Valeryl bromide (VaBr)",
                "Valeryl chloride (VaCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetic acid chloride (AcCl)",
            "Acetoxime chloride",
            "Benzoic acid chloride",
            "Chloroacetic acid",
            "Chloroformic acid",
            "Fluorobenzoic acid",
            "Formic acid chloride",
            "Hexanoic acid chloride",
            "Iodoacetic acid",
            "Iodoformic acid",
            "Methoxyacetic acid chloride",
            "Methyl chloroformate",
            "Methyl iodide",
            "Oxalic acid dichloride",
            "Pivalic acid chloride",
            "Propionic acid chloride",
            "Succinic acid dichloride",
            "Tartaric acid dichloride",
            "Trifluoroacetic acid",
            "Trimethylacetic acid chloride",
            "Urea chloride",
            "Vinyl chloride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic acid chloride (AcCl)",
                "Acetoxime chloride",
                "Benzoic acid chloride",
                "Chloroacetic acid",
                "Chloroformic acid",
                "Fluorobenzoic acid",
                "Formic acid chloride",
                "Hexanoic acid chloride",
                "Iodoacetic acid",
                "Iodoformic acid",
                "Methoxyacetic acid chloride",
                "Methyl chloroformate",
                "Methyl iodide",
                "Oxalic acid dichloride",
                "Pivalic acid chloride",
                "Propionic acid chloride",
                "Succinic acid dichloride",
                "Tartaric acid dichloride",
                "Trifluoroacetic acid",
                "Trimethylacetic acid chloride",
                "Urea chloride",
                "Vinyl chloride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic acid chloride (AcCl)",
                "Acetoxime chloride",
                "Benzoic acid chloride",
                "Chloroacetic acid",
                "Chloroformic acid",
                "Fluorobenzoic acid",
                "Formic acid chloride",
                "Hexanoic acid chloride",
                "Iodoacetic acid",
                "Iodoformic acid",
                "Methoxyacetic acid chloride",
                "Methyl chloroformate",
                "Methyl iodide",
                "Oxalic acid dichloride",
                "Pivalic acid chloride",
                "Propionic acid chloride",
                "Succinic acid dichloride",
                "Tartaric acid dichloride",
                "Trifluoroacetic acid",
                "Trimethylacetic acid chloride",
                "Urea chloride",
                "Vinyl chloride"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            "Acetyl chloride (ACl)",
            "Acetyl bromide (ABr)",
            "Acetyl fluoride (AF)",
            "Pivaloyl chloride (PiCl)",
            "Pivaloyl bromide (PiBr)",
            "Benzoyl chloride (BzCl)",
            "Benzoyl bromide (BzBr)",
            "Benzoyl fluoride (BzF)",
            "Propionyl chloride (PrCl)",
            "Propionyl bromide (PrBr)",
            "Butyryl chloride (BuCl)",
            "Butyryl bromide (BuBr)",
            "Valeryl chloride (VCl)",
            "Valeryl bromide (VBr)",
            "Caproyl chloride (CpCl)",
            "Caproyl bromide (CpBr)",
            "Acryloyl chloride (AcrCl)",
            "Acryloyl bromide (AcrBr)",
            "Methacryloyl chloride (MAcCl)",
            "Methacryloyl bromide (MAcBr)",
            "Cyclohexanecarbonyl chloride (ChCl)",
            "Cyclohexanecarbonyl bromide (ChBr)",
            "4-Methylbenzoyl chloride (4-MBzCl)",
            "4-Methylbenzoyl bromide (4-MBzBr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl chloride (ACl)",
                "Acetyl bromide (ABr)",
                "Acetyl fluoride (AF)",
                "Pivaloyl chloride (PiCl)",
                "Pivaloyl bromide (PiBr)",
                "Benzoyl chloride (BzCl)",
                "Benzoyl bromide (BzBr)",
                "Benzoyl fluoride (BzF)",
                "Propionyl chloride (PrCl)",
                "Propionyl bromide (PrBr)",
                "Butyryl chloride (BuCl)",
                "Butyryl bromide (BuBr)",
                "Valeryl chloride (VCl)",
                "Valeryl bromide (VBr)",
                "Caproyl chloride (CpCl)",
                "Caproyl bromide (CpBr)",
                "Acryloyl chloride (AcrCl)",
                "Acryloyl bromide (AcrBr)",
                "Methacryloyl chloride (MAcCl)",
                "Methacryloyl bromide (MAcBr)",
                "Cyclohexanecarbonyl chloride (ChCl)",
                "Cyclohexanecarbonyl bromide (ChBr)",
                "4-Methylbenzoyl chloride (4-MBzCl)",
                "4-Methylbenzoyl bromide (4-MBzBr)"
            ],
            "mismatches": [],
            "true_referents": [
                "4-Methylbenzoyl bromide (4-MBzBr)",
                "4-Methylbenzoyl chloride (4-MBzCl)",
                "Acetyl bromide (ABr)",
                "Acetyl chloride (ACl)",
                "Acetyl fluoride (AF)",
                "Acryloyl bromide (AcrBr)",
                "Acryloyl chloride (AcrCl)",
                "Benzoyl bromide (BzBr)",
                "Benzoyl chloride (BzCl)",
                "Benzoyl fluoride (BzF)",
                "Butyryl bromide (BuBr)",
                "Butyryl chloride (BuCl)",
                "Caproyl bromide (CpBr)",
                "Caproyl chloride (CpCl)",
                "Cyclohexanecarbonyl bromide (ChBr)",
                "Cyclohexanecarbonyl chloride (ChCl)",
                "Methacryloyl bromide (MAcBr)",
                "Methacryloyl chloride (MAcCl)",
                "Pivaloyl bromide (PiBr)",
                "Pivaloyl chloride (PiCl)",
                "Propionyl bromide (PrBr)",
                "Propionyl chloride (PrCl)",
                "Valeryl bromide (VBr)",
                "Valeryl chloride (VCl)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "acyl halide",
        "domain": "chemistry",
        "response": [
            [
                "Referent",
                "acetyl chloride"
            ],
            [
                "Referent",
                "acetyl bromide"
            ],
            [
                "Referent",
                "acetyl iodide"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetyl chloride",
                "acetyl bromide",
                "acetyl iodide"
            ],
            "mismatches": [],
            "true_referents": [
                "[\"Referent\", \"acetyl bromide\"]",
                "[\"Referent\", \"acetyl chloride\"]",
                "[\"Referent\", \"acetyl iodide\"]"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 0
        }
    }
]