[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium carbonate (CaCO3)",
            "Magnesium sulfate (MgSO4)",
            "Iron(II) sulfate (FeSO4)",
            "Zinc sulfate (ZnSO4)",
            "Copper(II) sulfate (CuSO4)",
            "Potassium nitrate (KNO3)",
            "Sodium bicarbonate (NaHCO3)",
            "Calcium chloride (CaCl2)",
            "Ammonium nitrate (NH4NO3)",
            "Sodium phosphate (Na3PO4)",
            "Magnesium oxide (MgO)",
            "Calcium nitrate (Ca(NO3)2)",
            "Sodium carbonate (Na2CO3)",
            "Potassium sulfate (K2SO4)",
            "Iron(III) chloride (FeCl3)",
            "Sodium nitrate (NaNO3)",
            "Ammonium chloride (NH4Cl)",
            "Calcium hydroxide (Ca(OH)2)",
            "Sodium sulfite (Na2SO3)",
            "Potassium hydroxide (KOH)",
            "Magnesium nitrate (Mg(NO3)2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Calcium carbonate (CaCO3)",
                "Magnesium sulfate (MgSO4)",
                "Zinc sulfate (ZnSO4)",
                "Copper(II) sulfate (CuSO4)",
                "Potassium nitrate (KNO3)",
                "Calcium chloride (CaCl2)",
                "Ammonium nitrate (NH4NO3)",
                "Sodium phosphate (Na3PO4)",
                "Calcium nitrate (Ca(NO3)2)",
                "Potassium sulfate (K2SO4)",
                "Sodium nitrate (NaNO3)",
                "Ammonium chloride (NH4Cl)",
                "Calcium hydroxide (Ca(OH)2)",
                "Sodium sulfite (Na2SO3)",
                "Magnesium nitrate (Mg(NO3)2)"
            ],
            "mismatches": [
                "Iron(II) sulfate (FeSO4)",
                "Sodium bicarbonate (NaHCO3)",
                "Magnesium oxide (MgO)",
                "Sodium carbonate (Na2CO3)",
                "Iron(III) chloride (FeCl3)",
                "Potassium hydroxide (KOH)"
            ],
            "true_referents": [
                "ammonium chloride",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium sulfate",
                "aragonite",
                "barium carbonate",
                "caesium chloride",
                "caesium nitrate",
                "calcium carbonate",
                "calcium dichloride",
                "calcium dihydroxide",
                "calcium hydroxide",
                "calcium monohydroxide",
                "calcium nitrate",
                "calcium nitrate tetrahydrate",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "inorganic ammonium salt",
                "inorganic magnesium salt",
                "inorganic nitrate salt",
                "inorganic sulfate salt",
                "iron dichloride tetrahydrate",
                "iron trichloride hexahydrate",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "magnesium nitrate",
                "magnesium sulfate",
                "manganese(II) sulfate",
                "potassium aluminium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "potassium sulfate",
                "sodium chloride",
                "sodium diphosphate",
                "sodium disulfite",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "sodium sulfate",
                "sodium sulfite",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium chloride (CaCl2)",
            "Magnesium sulfate (MgSO4)",
            "Sodium bicarbonate (NaHCO3)",
            "Potassium sulfate (K2SO4)",
            "Calcium carbonate (CaCO3)",
            "Magnesium oxide (MgO)",
            "Ammonium chloride (NH4Cl)",
            "Sodium hydroxide (NaOH)",
            "Potassium hydroxide (KOH)",
            "Calcium hydroxide (Ca(OH)2)",
            "Sodium phosphate (Na3PO4)",
            "Potassium nitrate (KNO3)",
            "Sodium sulfate (Na2SO4)",
            "Ammonium sulfate ((NH4)2SO4)",
            "Zinc sulfate (ZnSO4)",
            "Copper(II) sulfate (CuSO4)",
            "Iron(III) chloride (FeCl3)",
            "Silver nitrate (AgNO3)",
            "Barium chloride (BaCl2)",
            "Lead(II) nitrate (Pb(NO3)2)",
            "Aluminum sulfate (Al2(SO4)3)",
            "Strontium chloride (SrCl2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride",
                "Potassium chloride",
                "Calcium hydroxide",
                "Magnesium sulfate",
                "Potassium sulfate",
                "Calcium carbonate",
                "Ammonium chloride",
                "Sodium phosphate",
                "Potassium nitrate",
                "Sodium sulfate",
                "Ammonium sulfate",
                "Zinc sulfate",
                "Copper(II) sulfate",
                "Barium chloride",
                "lead nitrate",
                "strontium dichloride"
            ],
            "mismatches": [
                "Sodium bicarbonate",
                "Magnesium oxide",
                "Sodium hydroxide",
                "Potassium hydroxide",
                "Iron(III) chloride",
                "Silver nitrate",
                "Aluminum sulfate"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium chloride",
                "ammonium phosphate sulfate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium dihydroxide",
                "calcium hydroxide",
                "calcium monohydroxide",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "disodium hydrogenphosphate",
                "inorganic ammonium salt",
                "inorganic magnesium salt",
                "inorganic sulfate salt",
                "iron dichloride tetrahydrate",
                "iron trichloride hexahydrate",
                "iron(3+) sulfate",
                "lead nitrate",
                "lead oxide",
                "lead(II) chloride",
                "magnesium nitrate",
                "magnesium sulfate",
                "potassium aluminium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "potassium sulfate",
                "scandium nitrate",
                "silver(1+) nitrate",
                "sodium chloride",
                "sodium diphosphate",
                "sodium hypochlorite",
                "sodium nitrate",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "strontium dichloride",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 16,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium Chloride (NaCl)",
            "Potassium Chloride (KCl)",
            "Calcium Chloride (CaCl2)",
            "Magnesium Sulfate (MgSO4)",
            "Sodium Bicarbonate (NaHCO3)",
            "Ammonium Chloride (NH4Cl)",
            "Calcium Carbonate (CaCO3)",
            "Sodium Sulfate (Na2SO4)",
            "Potassium Sulfate (K2SO4)",
            "Potassium Nitrate (KNO3)",
            "Sodium Nitrate (NaNO3)",
            "Calcium Phosphate (Ca3(PO4)2)",
            "Sodium Phosphate (Na3PO4)",
            "Calcium Sulfate (CaSO4)",
            "Ammonium Sulfate ((NH4)2SO4)",
            "Copper Sulfate (CuSO4)",
            "Iron Sulfate (FeSO4)",
            "Zinc Sulfate (ZnSO4)",
            "Potassium Hydroxide (KOH)",
            "Sodium Hydroxide (NaOH)",
            "Calcium Hydroxide (Ca(OH)2)",
            "Ammonium Nitrate (NH4NO3)",
            "Sodium Chlorate (NaClO3)",
            "Potassium Chlorate (KClO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium Chloride (NaCl)",
                "Potassium Chloride (KCl)",
                "Magnesium Sulfate (MgSO4)",
                "Ammonium Chloride (NH4Cl)",
                "Calcium Carbonate (CaCO3)",
                "Sodium Sulfate (Na2SO4)",
                "Potassium Sulfate (K2SO4)",
                "Potassium Nitrate (KNO3)",
                "Sodium Nitrate (NaNO3)",
                "Calcium Phosphate (Ca3(PO4)2)",
                "Sodium Phosphate (Na3PO4)",
                "Calcium Sulfate (CaSO4)",
                "Ammonium Sulfate ((NH4)2SO4)",
                "Zinc Sulfate (ZnSO4)",
                "Sodium Chlorate (NaClO3)",
                "Ammonium Nitrate (NH4NO3)"
            ],
            "mismatches": [
                "Sodium Bicarbonate (NaHCO3)",
                "Copper Sulfate (CuSO4)",
                "Iron Sulfate (FeSO4)",
                "Potassium Hydroxide (KOH)",
                "Sodium Hydroxide (NaOH)",
                "Calcium Hydroxide (Ca(OH)2)",
                "Potassium Chlorate (KClO3)"
            ],
            "true_referents": [
                "ammonium chloride",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium phosphate sulfate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium dihydroxide",
                "calcium hydroxide",
                "calcium monohydroxide",
                "calcium phosphate",
                "calcium sulfate",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "disodium hydrogenphosphate",
                "ferrous ammonium sulfate (anhydrous)",
                "inorganic ammonium salt",
                "inorganic sulfate salt",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "magnesium sulfate",
                "potassium aluminium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "potassium sulfate",
                "sodium chlorate",
                "sodium chloride",
                "sodium chlorite",
                "sodium diphosphate",
                "sodium hypochlorite",
                "sodium nitrate",
                "sodium nitrite",
                "sodium perchlorate",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "tricalcium bis(phosphate)",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 16,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium Chloride (NaCl)",
            "Potassium Iodide (KI)",
            "Calcium Carbonate (CaCO3)",
            "Magnesium Sulfate (MgSO4)",
            "Sodium Bicarbonate (NaHCO3)",
            "Potassium Chloride (KCl)",
            "Calcium Chloride (CaCl2)",
            "Sodium Phosphate (Na3PO4)",
            "Potassium Nitrate (KNO3)",
            "Magnesium Chloride (MgCl2)",
            "Sodium Sulfate (Na2SO4)",
            "Calcium Sulfate (CaSO4)",
            "Potassium Phosphate (K3PO4)",
            "Ammonium Chloride (NH4Cl)",
            "Sodium Fluoride (NaF)",
            "Potassium Fluoride (KF)",
            "Lithium Carbonate (Li2CO3)",
            "Ferrous Sulfate (FeSO4)",
            "Zinc Chloride (ZnCl2)",
            "Copper Sulfate (CuSO4)",
            "Aluminum Sulfate (Al2(SO4)3)",
            "Sodium Silicate (Na2SiO3)",
            "Potassium Permanganate (KMnO4)",
            "Barium Sulfate (BaSO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium Chloride (NaCl)",
                "Calcium Carbonate (CaCO3)",
                "Magnesium Sulfate (MgSO4)",
                "Potassium Chloride (KCl)",
                "Calcium Chloride (CaCl2)",
                "Sodium Phosphate (Na3PO4)",
                "Potassium Nitrate (KNO3)",
                "Magnesium Chloride (MgCl2)",
                "Sodium Sulfate (Na2SO4)",
                "Calcium Sulfate (CaSO4)",
                "Ammonium Chloride (NH4Cl)",
                "Sodium Silicate (Na2SiO3)",
                "Barium Sulfate (BaSO4)"
            ],
            "mismatches": [
                "Potassium Iodide (KI)",
                "Sodium Bicarbonate (NaHCO3)",
                "Potassium Phosphate (K3PO4)",
                "Sodium Fluoride (NaF)",
                "Potassium Fluoride (KF)",
                "Lithium Carbonate (Li2CO3)",
                "Ferrous Sulfate (FeSO4)",
                "Zinc Chloride (ZnCl2)",
                "Copper Sulfate (CuSO4)",
                "Aluminum Sulfate (Al2(SO4)3)",
                "Potassium Permanganate (KMnO4)"
            ],
            "true_referents": [
                "Kaliumhexachloroantimonat(V)",
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium chloride",
                "ammonium sulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium sulfate",
                "beryllium dichloride",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "calcium silicate",
                "calcium sulfate",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "ferrous ammonium sulfate (anhydrous)",
                "inorganic ammonium salt",
                "inorganic fluoride salt",
                "inorganic iodine salt",
                "inorganic manganese salt",
                "inorganic phosphate salt",
                "inorganic sulfate salt",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "lithium sulfate",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium sulfate",
                "manganese(II) sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "sodium chloride",
                "sodium diphosphate",
                "sodium fluorate",
                "sodium fluorophosphate",
                "sodium iodide",
                "sodium nitrate",
                "sodium phosphate",
                "sodium silicate",
                "sodium sulfate",
                "sodium thiosulfate",
                "zinc dichloride"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium carbonate (CaCO3)",
            "Magnesium sulfate (MgSO4)",
            "Sodium bicarbonate (NaHCO3)",
            "Calcium sulfate (CaSO4)",
            "Ammonium nitrate (NH4NO3)",
            "Sodium nitrate (NaNO3)",
            "Potassium nitrate (KNO3)",
            "Calcium phosphate (Ca3(PO4)2)",
            "Sodium sulfate (Na2SO4)",
            "Potassium sulfate (K2SO4)",
            "Ammonium sulfate ((NH4)2SO4)",
            "Magnesium chloride (MgCl2)",
            "Calcium chloride (CaCl2)",
            "Sodium carbonate (Na2CO3)",
            "Potassium carbonate (K2CO3)",
            "Aluminum sulfate (Al2(SO4)3)",
            "Barium sulfate (BaSO4)",
            "Lithium chloride (LiCl)",
            "Zinc sulfate (ZnSO4)",
            "Copper(II) sulfate (CuSO4)",
            "Iron(III) chloride (FeCl3)",
            "Sodium phosphate (Na3PO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Calcium carbonate (CaCO3)",
                "Magnesium sulfate (MgSO4)",
                "Calcium sulfate (CaSO4)",
                "Ammonium nitrate (NH4NO3)",
                "Sodium nitrate (NaNO3)",
                "Potassium nitrate (KNO3)",
                "Calcium phosphate (Ca3(PO4)2)",
                "Sodium sulfate (Na2SO4)",
                "Potassium sulfate (K2SO4)",
                "Ammonium sulfate ((NH4)2SO4)",
                "Magnesium chloride (MgCl2)",
                "Calcium chloride (CaCl2)",
                "Barium sulfate (BaSO4)",
                "Lithium chloride (LiCl)",
                "Zinc sulfate (ZnSO4)",
                "Copper(II) sulfate (CuSO4)",
                "Sodium phosphate (Na3PO4)"
            ],
            "mismatches": [
                "Sodium bicarbonate (NaHCO3)",
                "Sodium carbonate (Na2CO3)",
                "Potassium carbonate (K2CO3)",
                "Aluminum sulfate (Al2(SO4)3)",
                "Iron(III) chloride (FeCl3)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium phosphate sulfate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium sulfate",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "calcium phosphate",
                "calcium sulfate",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "inorganic lithium salt",
                "inorganic sulfate salt",
                "iron dichloride tetrahydrate",
                "iron trichloride hexahydrate",
                "iron(3+) sulfate",
                "lithium chloride",
                "lithium sulfate",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium sulfate",
                "potassium aluminium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "potassium sulfate",
                "sodium chloride",
                "sodium diphosphate",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "tricalcium bis(phosphate)",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium carbonate (CaCO3)",
            "Magnesium sulfate (MgSO4)",
            "Ammonium nitrate (NH4NO3)",
            "Sodium bicarbonate (NaHCO3)",
            "Calcium phosphate (Ca3(PO4)2)",
            "Iron(III) chloride (FeCl3)",
            "Copper(II) sulfate (CuSO4)",
            "Zinc oxide (ZnO)",
            "Barium sulfate (BaSO4)",
            "Sodium sulfate (Na2SO4)",
            "Lithium bromide (LiBr)",
            "Aluminum sulfate (Al2(SO4)3)",
            "Potassium phosphate (K3PO4)",
            "Calcium sulfate (CaSO4)",
            "Sodium nitrite (NaNO2)",
            "Silver nitrate (AgNO3)",
            "Lead(II) acetate (Pb(C2H3O2)2)",
            "Sodium thiosulfate (Na2S2O3)",
            "Manganese(II) sulfate (MnSO4)",
            "Cobalt(II) chloride (CoCl2)",
            "Nickel(II) sulfate (NiSO4)",
            "Sodium acetate (CH3COONa)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Calcium carbonate (CaCO3)",
                "Magnesium sulfate (MgSO4)",
                "Ammonium nitrate (NH4NO3)",
                "Calcium phosphate (Ca3(PO4)2)",
                "Copper(II) sulfate (CuSO4)",
                "Barium sulfate (BaSO4)",
                "Sodium sulfate (Na2SO4)",
                "Calcium sulfate (CaSO4)",
                "Sodium nitrite (NaNO2)",
                "Sodium thiosulfate (Na2S2O3)",
                "Manganese(II) sulfate (MnSO4)",
                "Nickel(II) sulfate (NiSO4)"
            ],
            "mismatches": [
                "Sodium bicarbonate (NaHCO3)",
                "Iron(III) chloride (FeCl3)",
                "Zinc oxide (ZnO)",
                "Lithium bromide (LiBr)",
                "Aluminum sulfate (Al2(SO4)3)",
                "Potassium phosphate (K3PO4)",
                "Silver nitrate (AgNO3)",
                "Lead(II) acetate (Pb(C2H3O2)2)",
                "Cobalt(II) chloride (CoCl2)",
                "Sodium acetate (CH3COONa)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "calcium carbonate",
                "calcium monohydroxide",
                "calcium phosphate",
                "calcium sulfate",
                "cobalt dichloride",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "inorganic chloride",
                "inorganic phosphate salt",
                "inorganic sulfate salt",
                "inorganic zinc salt",
                "iron dichloride tetrahydrate",
                "iron trichloride hexahydrate",
                "iron(3+) sulfate",
                "lead arsenate",
                "lead oxide",
                "lead(II) chloride",
                "lithium chloride",
                "lithium sulfate",
                "magnesium sulfate",
                "manganese(II) sulfate",
                "manganese(II) sulfate dihydrate",
                "manganese(II) sulfate tetrahydrate",
                "metal sulfate",
                "nickel sulfate",
                "potassium chloride",
                "potassium nitrite",
                "scandium nitrate",
                "silver(1+) nitrate",
                "sodium amide",
                "sodium bromide",
                "sodium chloride",
                "sodium disulfite",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "tricalcium bis(phosphate)",
                "zinc nitrate"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium chloride (CaCl2)",
            "Ammonium chloride (NH4Cl)",
            "Magnesium sulfate (MgSO4)",
            "Sodium bicarbonate (NaHCO3)",
            "Copper sulfate (CuSO4)",
            "Zinc sulfate (ZnSO4)",
            "Ferrous sulfate (FeSO4)",
            "Aluminum sulfate (Al2(SO4)3)",
            "Potassium nitrate (KNO3)",
            "Sodium nitrate (NaNO3)",
            "Barium chloride (BaCl2)",
            "Calcium carbonate (CaCO3)",
            "Potassium carbonate (K2CO3)",
            "Sodium sulfate (Na2SO4)",
            "Ammonium nitrate (NH4NO3)",
            "Zinc chloride (ZnCl2)",
            "Copper chloride (CuCl2)",
            "Iron (III) chloride (FeCl3)",
            "Aluminum chloride (AlCl3)",
            "Barium sulfate (BaSO4)",
            "Cadmium chloride (CdCl2)",
            "Lead (II) nitrate (Pb(NO3)2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Calcium chloride (CaCl2)",
                "Ammonium chloride (NH4Cl)",
                "Magnesium sulfate (MgSO4)",
                "Zinc sulfate (ZnSO4)",
                "Potassium nitrate (KNO3)",
                "Sodium nitrate (NaNO3)",
                "Barium chloride (BaCl2)",
                "Calcium carbonate (CaCO3)",
                "Sodium sulfate (Na2SO4)",
                "Ammonium nitrate (NH4NO3)"
            ],
            "mismatches": [
                "Sodium bicarbonate (NaHCO3)",
                "Copper sulfate (CuSO4)",
                "Ferrous sulfate (FeSO4)",
                "Aluminum sulfate (Al2(SO4)3)",
                "Potassium carbonate (K2CO3)",
                "Zinc chloride (ZnCl2)",
                "Copper chloride (CuCl2)",
                "Iron (III) chloride (FeCl3)",
                "Aluminum chloride (AlCl3)",
                "Barium sulfate (BaSO4)",
                "Cadmium chloride (CdCl2)",
                "Lead (II) nitrate (Pb(NO3)2)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium chloride",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium sulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium sulfate",
                "beryllium dichloride",
                "cadmium nitrate",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "copper(I) chloride",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "ferrous ammonium sulfate (anhydrous)",
                "inorganic aluminium salt",
                "inorganic ammonium salt",
                "inorganic cadmium salt",
                "inorganic sulfate salt",
                "iron dichloride tetrahydrate",
                "iron trichloride hexahydrate",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "lanthanum trichloride",
                "lead nitrate",
                "lead oxide",
                "lead(II) chloride",
                "magnesium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "sodium chloride",
                "sodium nitrate",
                "sodium nitrite",
                "sodium sulfate",
                "sodium thiosulfate",
                "zinc dichloride",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium nitrate (KNO3)",
            "Calcium carbonate (CaCO3)",
            "Magnesium sulfate (MgSO4)",
            "Ammonium phosphate ((NH4)3PO4)",
            "Iron(II) sulfate (FeSO4)",
            "Zinc chloride (ZnCl2)",
            "Copper sulfate (CuSO4)",
            "Silver nitrate (AgNO3)",
            "Lead(II) acetate (Pb(C2H3O2)2)",
            "Barium sulfate (BaSO4)",
            "Mercury(II) chloride (HgCl2)",
            "Aluminum sulfate (Al2(SO4)3)",
            "Nickel chloride (NiCl2)",
            "Cobalt nitrate (Co(NO3)2)",
            "Manganese sulfate (MnSO4)",
            "Lithium carbonate (Li2CO3)",
            "Beryllium chloride (BeCl2)",
            "Strontium bromide (SrBr2)",
            "Cadmium iodide (CdI2)",
            "Gallium nitrate (Ga(NO3)3)",
            "Thallium sulfate (Tl2SO4)",
            "Indium chloride (InCl3)",
            "Tin(II) chloride (SnCl2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium nitrate (KNO3)",
                "Calcium carbonate (CaCO3)",
                "Magnesium sulfate (MgSO4)",
                "Barium sulfate (BaSO4)",
                "Aluminum sulfate (Al2(SO4)3)",
                "Cobalt nitrate (Co(NO3)2)",
                "Manganese sulfate (MnSO4)",
                "Beryllium chloride (BeCl2)",
                "Gallium nitrate (Ga(NO3)3)",
                "Thallium sulfate (Tl2SO4)"
            ],
            "mismatches": [
                "Ammonium phosphate ((NH4)3PO4)",
                "Iron(II) sulfate (FeSO4)",
                "Zinc chloride (ZnCl2)",
                "Copper sulfate (CuSO4)",
                "Silver nitrate (AgNO3)",
                "Lead(II) acetate (Pb(C2H3O2)2)",
                "Mercury(II) chloride (HgCl2)",
                "Nickel chloride (NiCl2)",
                "Lithium carbonate (Li2CO3)",
                "Strontium bromide (SrBr2)",
                "Cadmium iodide (CdI2)",
                "Indium chloride (InCl3)",
                "Tin(II) chloride (SnCl2)"
            ],
            "true_referents": [
                "((201)Tl)thallium monochloride",
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium nitrate phosphate",
                "ammonium phosphate sulfate",
                "ammonium polyphosphate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "beryllium dichloride",
                "beryllium sulfate",
                "cadmium nitrate",
                "caesium chloride",
                "calcium carbonate",
                "cobalt dinitrate",
                "cobalt dinitrate hexahydrate",
                "cobalt trinitrate",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "gallium nitrate",
                "indium(III) nitrate",
                "inorganic cadmium salt",
                "inorganic chloride",
                "inorganic mercury salt",
                "inorganic nickel salt",
                "inorganic strontium salt",
                "inorganic sulfate salt",
                "inorganic tin salt",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "lanthanum trichloride",
                "lead arsenate",
                "lead oxide",
                "lead(II) chloride",
                "lithium sulfate",
                "magnesium sulfate",
                "manganese(II) chloride",
                "manganese(II) sulfate",
                "manganese(II) sulfate dihydrate",
                "manganese(II) sulfate tetrahydrate",
                "mercuric amidochloride",
                "nickel sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "scandium nitrate",
                "silver(1+) nitrate",
                "sodium bromide",
                "sodium chloride",
                "sodium iodide",
                "sodium nitrate",
                "sodium sulfate",
                "strontium dichloride",
                "thallium monochloride",
                "thallium sulfate",
                "tin(II) chloride (anhydrous)",
                "zinc dichloride"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium carbonate (CaCO\u2083)",
            "Magnesium sulfate (MgSO\u2084)",
            "Ammonium nitrate (NH\u2084NO\u2083)",
            "Sodium bicarbonate (NaHCO\u2083)",
            "Sodium sulfate (Na\u2082SO\u2084)",
            "Potassium nitrate (KNO\u2083)",
            "Calcium sulfate (CaSO\u2084)",
            "Sodium phosphate (Na\u2083PO\u2084)",
            "Potassium phosphate (K\u2083PO\u2084)",
            "Magnesium chloride (MgCl\u2082)",
            "Aluminum sulfate (Al\u2082(SO\u2084)\u2083)",
            "Copper sulfate (CuSO\u2084)",
            "Zinc chloride (ZnCl\u2082)",
            "Iron(III) chloride (FeCl\u2083)",
            "Silver nitrate (AgNO\u2083)",
            "Sodium hydroxide (NaOH)",
            "Potassium hydroxide (KOH)",
            "Sodium nitrate (NaNO\u2083)",
            "Barium sulfate (BaSO\u2084)",
            "Lithium carbonate (Li\u2082CO\u2083)",
            "Sodium fluoride (NaF)",
            "Calcium nitrate (Ca(NO\u2083)\u2082)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Calcium carbonate (CaCO\u2083)",
                "Magnesium sulfate (MgSO\u2084)",
                "Ammonium nitrate (NH\u2084NO\u2083)",
                "Sodium sulfate (Na\u2082SO\u2084)",
                "Potassium nitrate (KNO\u2083)",
                "Calcium sulfate (CaSO\u2084)",
                "Sodium phosphate (Na\u2083PO\u2084)",
                "Magnesium chloride (MgCl\u2082)",
                "Barium sulfate (BaSO\u2084)",
                "Sodium nitrate (NaNO\u2083)",
                "Calcium nitrate (Ca(NO\u2083)\u2082)"
            ],
            "mismatches": [
                "Sodium bicarbonate (NaHCO\u2083)",
                "Potassium phosphate (K\u2083PO\u2084)",
                "Aluminum sulfate (Al\u2082(SO\u2084)\u2083)",
                "Copper sulfate (CuSO\u2084)",
                "Zinc chloride (ZnCl\u2082)",
                "Iron(III) chloride (FeCl\u2083)",
                "Silver nitrate (AgNO\u2083)",
                "Sodium hydroxide (NaOH)",
                "Potassium hydroxide (KOH)",
                "Lithium carbonate (Li\u2082CO\u2083)",
                "Sodium fluoride (NaF)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "caesium nitrate",
                "calcium carbonate",
                "calcium hydroxide",
                "calcium monohydroxide",
                "calcium nitrate",
                "calcium sulfate",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "disodium hydrogenphosphate",
                "inorganic fluoride salt",
                "inorganic phosphate salt",
                "inorganic sulfate salt",
                "inorganic zinc salt",
                "iron dichloride tetrahydrate",
                "iron trichloride hexahydrate",
                "iron(3+) sulfate",
                "lithium sulfate",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "scandium nitrate",
                "silver(1+) nitrate",
                "sodium chloride",
                "sodium diphosphate",
                "sodium fluorate",
                "sodium fluorophosphate",
                "sodium hypochlorite",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "sodium sulfate",
                "zinc dichloride"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium chloride (CaCl\u2082)",
            "Magnesium sulfate (MgSO\u2084)",
            "Ammonium chloride (NH\u2084Cl)",
            "Sodium bicarbonate (NaHCO\u2083)",
            "Potassium phosphate (K\u2083PO\u2084)",
            "Calcium carbonate (CaCO\u2083)",
            "Sodium nitrate (NaNO\u2083)",
            "Potassium iodide (KI)",
            "Ferric chloride (FeCl\u2083)",
            "Copper sulfate (CuSO\u2084)",
            "Zinc sulfate (ZnSO\u2084)",
            "Sodium fluoride (NaF)",
            "Lithium chloride (LiCl)",
            "Barium sulfate (BaSO\u2084)",
            "Silver nitrate (AgNO\u2083)",
            "Aluminum sulfate (Al\u2082(SO\u2084)\u2083)",
            "Manganese chloride (MnCl\u2082)",
            "Cobalt chloride (CoCl\u2082)",
            "Nickel sulfate (NiSO\u2084)",
            "Ammonium nitrate (NH\u2084NO\u2083)",
            "Potassium permanganate (KMnO\u2084)",
            "Sodium thiosulfate (Na\u2082S\u2082O\u2083)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Calcium chloride (CaCl\u2082)",
                "Magnesium sulfate (MgSO\u2084)",
                "Ammonium chloride (NH\u2084Cl)",
                "Calcium carbonate (CaCO\u2083)",
                "Sodium nitrate (NaNO\u2083)",
                "Lithium chloride (LiCl)",
                "Barium sulfate (BaSO\u2084)",
                "Silver nitrate (AgNO\u2083)",
                "Zinc sulfate (ZnSO\u2084)",
                "Manganese chloride (MnCl\u2082)",
                "Cobalt chloride (CoCl\u2082)",
                "Nickel sulfate (NiSO\u2084)",
                "Ammonium nitrate (NH\u2084NO\u2083)",
                "Sodium thiosulfate (Na\u2082S\u2082O\u2083)"
            ],
            "mismatches": [
                "Sodium bicarbonate (NaHCO\u2083)",
                "Potassium phosphate (K\u2083PO\u2084)",
                "Potassium iodide (KI)",
                "Ferric chloride (FeCl\u2083)",
                "Copper sulfate (CuSO\u2084)",
                "Sodium fluoride (NaF)",
                "Aluminum sulfate (Al\u2082(SO\u2084)\u2083)",
                "Potassium permanganate (KMnO\u2084)"
            ],
            "true_referents": [
                "Kaliumhexachloroantimonat(V)",
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium chloride",
                "ammonium nickel sulfate",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "calcium sulfate",
                "cobalt dichloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "inorganic ammonium salt",
                "inorganic chloride",
                "inorganic cobalt salt",
                "inorganic fluoride salt",
                "inorganic iodine salt",
                "inorganic lithium salt",
                "inorganic manganese salt",
                "inorganic nickel salt",
                "inorganic phosphate salt",
                "inorganic sulfate salt",
                "iron trichloride hexahydrate",
                "iron(3+) phosphate",
                "iron(3+) sulfate",
                "lithium chloride",
                "lithium sulfate",
                "magnesium sulfate",
                "manganese(II) chloride",
                "manganese(II) chloride dihydrate",
                "manganese(II) chloride tetrahydrate",
                "nickel sulfate",
                "potassium chloride",
                "potassium nitrate",
                "scandium nitrate",
                "silver(1+) nitrate",
                "sodium chloride",
                "sodium disulfite",
                "sodium fluorate",
                "sodium fluorophosphate",
                "sodium iodide",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "sodium thiosulfate",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium chloride (KCl)",
            "Calcium chloride (CaCl2)",
            "Magnesium sulfate (MgSO4)",
            "Potassium phosphate (K3PO4)",
            "Ammonium chloride (NH4Cl)",
            "Sodium bicarbonate (NaHCO3)",
            "Calcium carbonate (CaCO3)",
            "Potassium nitrate (KNO3)",
            "Sodium sulfate (Na2SO4)",
            "Magnesium chloride (MgCl2)",
            "Ammonium sulfate ((NH4)2SO4)",
            "Calcium phosphate (Ca3(PO4)2)",
            "Potassium carbonate (K2CO3)",
            "Sodium acetate (CH3COONa)",
            "Magnesium carbonate (MgCO3)",
            "Ammonium nitrate (NH4NO3)",
            "Calcium sulfate (CaSO4)",
            "Potassium sulfate (K2SO4)",
            "Sodium phosphate (Na3PO4)",
            "Magnesium phosphate (Mg3(PO4)2)",
            "Ammonium carbonate ((NH4)2CO3)",
            "Calcium nitrate (Ca(NO3)2)",
            "Potassium acetate (CH3COOK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium chloride (KCl)",
                "Magnesium sulfate (MgSO4)",
                "Ammonium chloride (NH4Cl)",
                "Calcium carbonate (CaCO3)",
                "Potassium nitrate (KNO3)",
                "Sodium sulfate (Na2SO4)",
                "Magnesium chloride (MgCl2)",
                "Ammonium sulfate ((NH4)2SO4)",
                "Calcium phosphate (Ca3(PO4)2)",
                "Ammonium nitrate (NH4NO3)",
                "Calcium sulfate (CaSO4)",
                "Potassium sulfate (K2SO4)",
                "Sodium phosphate (Na3PO4)",
                "Magnesium phosphate (Mg3(PO4)2)",
                "Calcium nitrate (Ca(NO3)2)"
            ],
            "mismatches": [
                "Potassium phosphate (K3PO4)",
                "Sodium bicarbonate (NaHCO3)",
                "Potassium carbonate (K2CO3)",
                "Sodium acetate (CH3COONa)",
                "Magnesium carbonate (MgCO3)",
                "Ammonium carbonate ((NH4)2CO3)",
                "Potassium acetate (CH3COOK)"
            ],
            "true_referents": [
                "ammonium chloride",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium phosphate sulfate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "caesium chloride",
                "caesium nitrate",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "calcium nitrate",
                "calcium nitrate tetrahydrate",
                "calcium phosphate",
                "calcium sulfate",
                "inorganic ammonium salt",
                "inorganic phosphate salt",
                "inorganic sulfate salt",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium nitrate",
                "magnesium phosphate",
                "magnesium sulfate",
                "potassium aluminium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "potassium sulfate",
                "sodium amide",
                "sodium chloride",
                "sodium diphosphate",
                "sodium nitrate",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "tricalcium bis(phosphate)"
            ],
            "TP": 16,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium chloride (NaCl)",
            "Potassium nitrate (KNO3)",
            "Calcium carbonate (CaCO3)",
            "Magnesium sulfate (MgSO4)",
            "Ammonium chloride (NH4Cl)",
            "Copper sulfate (CuSO4)",
            "Iron(III) oxide (Fe2O3)",
            "Aluminum hydroxide (Al(OH)3)",
            "Zinc oxide (ZnO)",
            "Barium sulfate (BaSO4)",
            "Lead(II) nitrate (Pb(NO3)2)",
            "Silver nitrate (AgNO3)",
            "Potassium chloride (KCl)",
            "Sodium bicarbonate (NaHCO3)",
            "Calcium chloride (CaCl2)",
            "Magnesium chloride (MgCl2)",
            "Ammonium sulfate ((NH4)2SO4)",
            "Copper(II) chloride (CuCl2)",
            "Iron(II) sulfate (FeSO4)",
            "Aluminum sulfate (Al2(SO4)3)",
            "Zinc chloride (ZnCl2)",
            "Barium chloride (BaCl2)",
            "Lead(II) oxide (PbO)",
            "Silver chloride (AgCl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium chloride (NaCl)",
                "Potassium nitrate (KNO3)",
                "Calcium carbonate (CaCO3)",
                "Magnesium sulfate (MgSO4)",
                "Ammonium chloride (NH4Cl)",
                "Barium sulfate (BaSO4)",
                "Potassium chloride (KCl)",
                "Calcium chloride (CaCl2)",
                "Magnesium chloride (MgCl2)",
                "Ammonium sulfate ((NH4)2SO4)",
                "Copper(II) chloride (CuCl2)",
                "Aluminum sulfate (Al2(SO4)3)",
                "Barium chloride (BaCl2)"
            ],
            "mismatches": [
                "Copper sulfate (CuSO4)",
                "Iron(III) oxide (Fe2O3)",
                "Aluminum hydroxide (Al(OH)3)",
                "Zinc oxide (ZnO)",
                "Lead(II) nitrate (Pb(NO3)2)",
                "Silver nitrate (AgNO3)",
                "Sodium bicarbonate (NaHCO3)",
                "Iron(II) sulfate (FeSO4)",
                "Zinc chloride (ZnCl2)",
                "Lead(II) oxide (PbO)",
                "Silver chloride (AgCl)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium chloride",
                "ammonium phosphate sulfate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "beryllium dichloride",
                "caesium chloride",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "copper(I) chloride",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "inorganic ammonium salt",
                "inorganic chloride",
                "inorganic sulfate salt",
                "inorganic zinc salt",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) phosphate",
                "iron(3+) sulfate",
                "lead nitrate",
                "lead oxide",
                "lead(II) chloride",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium sulfate",
                "manganese(II) sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "scandium nitrate",
                "silver monochloride",
                "silver(1+) nitrate",
                "sodium chloride",
                "sodium nitrate",
                "sodium sulfate",
                "sodium tetrahydroaluminate",
                "zinc dichloride",
                "zinc nitrate"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Sodium Chloride (NaCl)",
            "Potassium Chloride (KCl)",
            "Calcium Chloride (CaCl2)",
            "Magnesium Sulfate (MgSO4)",
            "Ammonium Nitrate (NH4NO3)",
            "Copper Sulfate (CuSO4)",
            "Iron Sulfate (FeSO4)",
            "Zinc Chloride (ZnCl2)",
            "Aluminum Sulfate (Al2(SO4)3)",
            "Barium Chloride (BaCl2)",
            "Lithium Chloride (LiCl)",
            "Potassium Iodide (KI)",
            "Calcium Carbonate (CaCO3)",
            "Sodium Bicarbonate (NaHCO3)",
            "Sodium Phosphate (Na3PO4)",
            "Calcium Nitrate (Ca(NO3)2)",
            "Magnesium Chloride (MgCl2)",
            "Ferric Chloride (FeCl3)",
            "Zinc Sulfate (ZnSO4)",
            "Copper Chloride (CuCl2)",
            "Ammonium Sulfate ((NH4)2SO4)",
            "Sodium Sulfate (Na2SO4)",
            "Calcium Phosphate (Ca3(PO4)2)",
            "Potassium Nitrate (KNO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium Chloride (NaCl)",
                "Potassium Chloride (KCl)",
                "Calcium Chloride (CaCl2)",
                "Magnesium Sulfate (MgSO4)",
                "Ammonium Nitrate (NH4NO3)",
                "Barium Chloride (BaCl2)",
                "Lithium Chloride (LiCl)",
                "Calcium Carbonate (CaCO3)",
                "Sodium Phosphate (Na3PO4)",
                "Calcium Nitrate (Ca(NO3)2)",
                "Magnesium Chloride (MgCl2)",
                "Zinc Sulfate (ZnSO4)",
                "Copper Chloride (CuCl2)",
                "Ammonium Sulfate ((NH4)2SO4)",
                "Sodium Sulfate (Na2SO4)",
                "Calcium Phosphate (Ca3(PO4)2)",
                "Potassium Nitrate (KNO3)"
            ],
            "mismatches": [
                "Copper Sulfate (CuSO4)",
                "Iron Sulfate (FeSO4)",
                "Zinc Chloride (ZnCl2)",
                "Aluminum Sulfate (Al2(SO4)3)",
                "Potassium Iodide (KI)",
                "Sodium Bicarbonate (NaHCO3)",
                "Ferric Chloride (FeCl3)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium phosphate sulfate",
                "ammonium sulfate",
                "ammonium thiosulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium sulfate",
                "beryllium dichloride",
                "caesium chloride",
                "caesium nitrate",
                "calcium carbonate",
                "calcium dichloride",
                "calcium monohydroxide",
                "calcium nitrate",
                "calcium nitrate tetrahydrate",
                "calcium phosphate",
                "copper(I) chloride",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate hexahydrate",
                "copper(II) sulfate pentahydrate",
                "ferrous ammonium sulfate (anhydrous)",
                "inorganic iodine salt",
                "inorganic lithium salt",
                "inorganic sulfate salt",
                "iron trichloride hexahydrate",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) phosphate",
                "iron(3+) sulfate",
                "lithium chloride",
                "lithium sulfate",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "sodium chloride",
                "sodium diphosphate",
                "sodium iodide",
                "sodium nitrate",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "tricalcium bis(phosphate)",
                "zinc dichloride",
                "zinc sulfate",
                "zinc sulfate heptahydrate",
                "zinc sulfate hexahydrate"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Calcium carbonate (CaCO3)",
            "Magnesium chloride (MgCl2)",
            "Sodium nitrate (NaNO3)",
            "Potassium sulfate (K2SO4)",
            "Calcium phosphate (Ca3(PO4)2)",
            "Magnesium oxide (MgO)",
            "Sodium sulfate (Na2SO4)",
            "Potassium chloride (KCl)",
            "Calcium hydroxide (Ca(OH)2)",
            "Magnesium nitrate (Mg(NO3)2)",
            "Sodium carbonate (Na2CO3)",
            "Potassium nitrate (KNO3)",
            "Calcium acetate (Ca(C2H3O2)2)",
            "Magnesium acetate (Mg(C2H3O2)2)",
            "Sodium citrate (Na3(C6H5O7))",
            "Potassium citrate (K3(C6H5O7))",
            "Calcium gluconate (Ca(C6H11O7))",
            "Magnesium gluconate (Mg(C6H11O7))",
            "Sodium tartrate (Na2(C4H4O6))",
            "Potassium tartrate (K2(C4H4O6))",
            "Calcium lactate (Ca(C3H5O5))",
            "Magnesium lactate (Mg(C3H5O5))",
            "Sodium lactate (NaC3H5O3)",
            "Potassium lactate (KC3H5O3)",
            "Calcium malate (Ca(C4H4O5))",
            "Magnesium malate (Mg(C4H4O5))",
            "Sodium malate (NaC4H4O5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Calcium carbonate (CaCO3)",
                "Sodium nitrate (NaNO3)",
                "Potassium sulfate (K2SO4)",
                "Calcium phosphate (Ca3(PO4)2)",
                "Sodium sulfate (Na2SO4)",
                "Potassium chloride (KCl)",
                "Calcium hydroxide (Ca(OH)2)",
                "Magnesium nitrate (Mg(NO3)2)",
                "Potassium nitrate (KNO3)"
            ],
            "mismatches": [
                "Magnesium chloride (MgCl2)",
                "Magnesium oxide (MgO)",
                "Sodium carbonate (Na2CO3)",
                "Calcium acetate (Ca(C2H3O2)2)",
                "Magnesium acetate (Mg(C2H3O2)2)",
                "Sodium citrate (Na3(C6H5O7))",
                "Potassium citrate (K3(C6H5O7))",
                "Calcium gluconate (Ca(C6H11O7))",
                "Magnesium gluconate (Mg(C6H11O7))",
                "Sodium tartrate (Na2(C4H4O6))",
                "Potassium tartrate (K2(C4H4O6))",
                "Calcium lactate (Ca(C3H5O5))",
                "Magnesium lactate (Mg(C3H5O5))",
                "Sodium lactate (NaC3H5O3)",
                "Potassium lactate (KC3H5O3)",
                "Calcium malate (Ca(C4H4O5))",
                "Magnesium malate (Mg(C4H4O5))",
                "Sodium malate (NaC4H4O5)"
            ],
            "true_referents": [
                "aragonite",
                "barium carbonate",
                "calcium carbonate",
                "calcium dihydroxide",
                "calcium diphosphate",
                "calcium hydrogenphosphate",
                "calcium hydroxide",
                "calcium monohydroxide",
                "calcium phosphate",
                "inorganic magnesium salt",
                "inorganic nitrate salt",
                "inorganic sulfate salt",
                "magnesium dichloride",
                "magnesium dichloride dihydrate",
                "magnesium dichloride monohydrate",
                "magnesium nitrate",
                "magnesium phosphate",
                "magnesium sulfate",
                "potassium aluminium sulfate",
                "potassium chloride",
                "potassium nitrate",
                "potassium nitrite",
                "potassium sulfate",
                "sodium chlorate",
                "sodium chloride",
                "sodium chlorite",
                "sodium diphosphate",
                "sodium fluorate",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "sodium sulfate",
                "sodium thiosulfate",
                "tricalcium bis(phosphate)"
            ],
            "TP": 9,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            "Aluminum sulfate (Al2(SO4)3)",
            "Sodium nitrate (NaNO3)",
            "Copper(II) chloride (CuCl2)",
            "Calcium carbonate (CaCO3)",
            "Potassium bromide (KBr)",
            "Barium sulfate (BaSO4)",
            "Zinc oxide (ZnO)",
            "Magnesium hydroxide (Mg(OH)2)",
            "Iron(II) sulfate (FeSO4)",
            "Silver nitrate (AgNO3)",
            "Ammonium chloride (NH4Cl)",
            "Manganese(II) oxide (MnO)",
            "Cobalt(II) chloride (CoCl2)",
            "Sodium phosphate (Na3PO4)",
            "Nickel(II) sulfate (NiSO4)",
            "Lithium chloride (LiCl)",
            "Strontium carbonate (SrCO3)",
            "Chromium(III) oxide (Cr2O3)",
            "Potassium iodide (KI)",
            "Tin(II) chloride (SnCl2)",
            "Cadmium sulfate (CdSO4)",
            "Mercury(II) chloride (HgCl2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aluminum sulfate (Al2(SO4)3)",
                "Sodium nitrate (NaNO3)",
                "Copper(II) chloride (CuCl2)",
                "Calcium carbonate (CaCO3)",
                "Barium sulfate (BaSO4)",
                "Ammonium chloride (NH4Cl)",
                "Cobalt(II) chloride (CoCl2)",
                "Sodium phosphate (Na3PO4)",
                "Nickel(II) sulfate (NiSO4)",
                "Lithium chloride (LiCl)"
            ],
            "mismatches": [
                "Potassium bromide (KBr)",
                "Zinc oxide (ZnO)",
                "Magnesium hydroxide (Mg(OH)2)",
                "Iron(II) sulfate (FeSO4)",
                "Silver nitrate (AgNO3)",
                "Manganese(II) oxide (MnO)",
                "Strontium carbonate (SrCO3)",
                "Chromium(III) oxide (Cr2O3)",
                "Potassium iodide (KI)",
                "Tin(II) chloride (SnCl2)",
                "Cadmium sulfate (CdSO4)",
                "Mercury(II) chloride (HgCl2)"
            ],
            "true_referents": [
                "aluminium sulfate",
                "aluminium sulfate (anhydrous)",
                "ammonium chloride",
                "ammonium sulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "cadmium nitrate",
                "cadmium nitrate tetrahydrate",
                "calcium carbonate",
                "calcium dihydroxide",
                "chromium(III) sulfate",
                "cobalt dichloride",
                "copper(I) chloride",
                "copper(II) chloride",
                "copper(II) sulfate",
                "disodium hydrogenphosphate",
                "inorganic ammonium salt",
                "inorganic cadmium salt",
                "inorganic chloride",
                "inorganic chromium salt",
                "inorganic iodine salt",
                "inorganic lithium salt",
                "inorganic manganese salt",
                "inorganic mercury salt",
                "inorganic strontium salt",
                "inorganic tin salt",
                "inorganic zinc salt",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "lithium chloride",
                "lithium sulfate",
                "magnesium sulfate",
                "manganese(II) chloride",
                "manganese(II) sulfate",
                "mercuric amidochloride",
                "metal sulfate",
                "nickel sulfate",
                "potassium chloride",
                "scandium nitrate",
                "silver(1+) nitrate",
                "sodium bromide",
                "sodium chromate",
                "sodium diphosphate",
                "sodium iodide",
                "sodium nitrate",
                "sodium nitrite",
                "sodium phosphate",
                "tin(II) chloride (anhydrous)",
                "zinc nitrate"
            ],
            "TP": 10,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "inorganic salt",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Calcium iodide",
                "Canonical name": "(CaI2)"
            },
            {
                "Referent": "Barium sulfate",
                "Canonical name": "(BaSO4)"
            },
            {
                "Referent": "Copper sulfate",
                "Canonical name": "(CuSO4)"
            },
            {
                "Referent": "Silver nitrate",
                "Canonical name": "(AgNO3)"
            },
            {
                "Referent": "Zinc chloride",
                "Canonical name": "(ZnCl2)"
            },
            {
                "Referent": "Sodium chloride",
                "Canonical name": "(NaCl)"
            },
            {
                "Referent": "Magnesium chloride",
                "Canonical name": "(MgCl2)"
            },
            {
                "Referent": "Iron(III) chloride",
                "Canonical name": "(FeCl3)"
            },
            {
                "Referent": "Lead(IV) oxide",
                "Canonical name": "(PbO2)"
            },
            {
                "Referent": "Potassium iodide",
                "Canonical name": "(KI)"
            },
            {
                "Referent": "Ammonium chloride",
                "Canonical name": "(NH4Cl)"
            },
            {
                "Referent": "Sodium bromide",
                "Canonical name": "(NaBr)"
            },
            {
                "Referent": "Silver bromide",
                "Canonical name": "(AgBr)"
            },
            {
                "Referent": "Iron(II) sulfate",
                "Canonical name": "(FeSO4)"
            },
            {
                "Referent": "Sodium carbonate",
                "Canonical name": "(Na2CO3)"
            },
            {
                "Referent": "Calcium carbonate",
                "Canonical name": "(CaCO3)"
            },
            {
                "Referent": "Magnesium carbonate",
                "Canonical name": "(MgCO3)"
            },
            {
                "Referent": "Barium carbonate",
                "Canonical name": "(BaCO3)"
            },
            {
                "Referent": "Potassium carbonate",
                "Canonical name": "(K2CO3)"
            },
            {
                "Referent": "Ammonium carbonate",
                "Canonical name": "(NH4)2CO3)"
            },
            {
                "Referent": "Sodium nitrite",
                "Canonical name": "(NaNO2)"
            },
            {
                "Referent": "Ammonium nitrate",
                "Canonical name": "(NH4NO3)"
            },
            {
                "Referent": "Sodium nitrate",
                "Canonical name": "(NaNO3)"
            },
            {
                "Referent": "Potassium nitrate",
                "Canonical name": "(KNO3)"
            },
            {
                "Referent": "Ammonium sulfate",
                "Canonical name": "(NH4)2SO4)"
            },
            {
                "Referent": "Calcium sulfate",
                "Canonical name": "(CaSO4)"
            },
            {
                "Referent": "Magnesium sulfate",
                "Canonical name": "(MgSO4)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Barium sulfate",
                "Sodium chloride",
                "Ammonium chloride",
                "Sodium bromide",
                "Calcium carbonate",
                "Barium carbonate",
                "Sodium nitrite",
                "Ammonium nitrate",
                "Sodium nitrate",
                "Potassium nitrate",
                "Ammonium sulfate",
                "Magnesium sulfate"
            ],
            "mismatches": [
                "Calcium iodide",
                "Copper sulfate",
                "Silver nitrate",
                "Zinc chloride",
                "Magnesium chloride",
                "Iron(III) chloride",
                "Lead(IV) oxide",
                "Potassium iodide",
                "Silver bromide",
                "Iron(II) sulfate",
                "Sodium carbonate",
                "Magnesium carbonate",
                "Potassium carbonate",
                "Ammonium carbonate",
                "Calcium sulfate"
            ],
            "true_referents": [
                "ammonium chloride",
                "ammonium nitrate",
                "ammonium nitrate phosphate",
                "ammonium sulfate",
                "aragonite",
                "barium carbonate",
                "barium chloride",
                "barium nitrate",
                "barium sulfate",
                "caesium chloride",
                "calcium carbonate",
                "copper(II) chloride",
                "copper(II) sulfate",
                "copper(II) sulfate pentahydrate",
                "inorganic ammonium salt",
                "inorganic caesium salt",
                "inorganic chloride",
                "inorganic copper salt",
                "inorganic iodine salt",
                "inorganic magnesium salt",
                "inorganic nitrate salt",
                "inorganic potassium salt",
                "inorganic sodium salt",
                "inorganic sulfate salt",
                "iron dichloride tetrahydrate",
                "iron(2+) sulfate (anhydrous)",
                "iron(3+) sulfate",
                "lead nitrate",
                "lead oxide",
                "lead(II) chloride",
                "magnesium dichloride",
                "magnesium sulfate",
                "potassium nitrate",
                "potassium nitrite",
                "silver(1+) nitrate",
                "sodium bromide",
                "sodium chloride",
                "sodium iodide",
                "sodium nitrate",
                "sodium nitrite",
                "zinc dichloride"
            ],
            "TP": 12,
            "FP": 15,
            "FN": 0
        }
    }
]