[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Hydroxide (OH\u207b)",
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Astatide (At\u207b)",
            "Nitride (N\u00b3\u207b)",
            "Phosphide (P\u00b3\u207b)",
            "Arsenide (As\u00b3\u207b)",
            "Antimonide (Sb\u00b3\u207b)",
            "Bismuthide (Bi\u00b3\u207b)",
            "Sulfide (S\u00b2\u207b)",
            "Selenide (Se\u00b2\u207b)",
            "Telluride (Te\u00b2\u207b)",
            "Polonium hydride (PoH\u207b)",
            "Oxide (O\u00b2\u207b)",
            "Peroxide (O\u2082\u00b2\u207b)",
            "Azide (N\u2083\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Thiocyanate (NCS\u207b)",
            "Formate (HCOO\u207b)",
            "Acetate (CH\u2083COO\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Nitrite (NO\u2082\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxide (OH\u207b)",
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Astatide (At\u207b)",
                "Nitride (N\u00b3\u207b)",
                "Phosphide (P\u00b3\u207b)",
                "Arsenide (As\u00b3\u207b)",
                "Antimonide (Sb\u00b3\u207b)",
                "Bismuthide (Bi\u00b3\u207b)",
                "Sulfide (S\u00b2\u207b)",
                "Selenide (Se\u00b2\u207b)",
                "Telluride (Te\u00b2\u207b)",
                "Polonium hydride (PoH\u207b)",
                "Oxide (O\u00b2\u207b)",
                "Peroxide (O\u2082\u00b2\u207b)",
                "Azide (N\u2083\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Thiocyanate (NCS\u207b)",
                "Formate (HCOO\u207b)",
                "Acetate (CH\u2083COO\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH\u2083COO\u207b)",
                "Antimonide (Sb\u00b3\u207b)",
                "Arsenide (As\u00b3\u207b)",
                "Astatide (At\u207b)",
                "Azide (N\u2083\u207b)",
                "Bismuthide (Bi\u00b3\u207b)",
                "Bromide (Br\u207b)",
                "Chloride (Cl\u207b)",
                "Fluoride (F\u207b)",
                "Formate (HCOO\u207b)",
                "Hydroxide (OH\u207b)",
                "Iodide (I\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitride (N\u00b3\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Oxide (O\u00b2\u207b)",
                "Peroxide (O\u2082\u00b2\u207b)",
                "Phosphide (P\u00b3\u207b)",
                "Polonium hydride (PoH\u207b)",
                "Selenide (Se\u00b2\u207b)",
                "Sulfide (S\u00b2\u207b)",
                "Telluride (Te\u00b2\u207b)",
                "Thiocyanate (NCS\u207b)",
                "Thiocyanate (SCN\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl\u207b)",
            "Fluoride (F\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Hydroxide (OH\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Phosphate (PO\u2084\u00b3\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Bicarbonate (HCO\u2083\u207b)",
            "Acetate (C\u2082H\u2083O\u2082\u207b)",
            "Formate (HCOO\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Cyanide (CN\u207b)",
            "Phenolate (C\u2086H\u2085O\u207b)",
            "Oxalate (C\u2082O\u2084\u00b2\u207b)",
            "Permanganate (MnO\u2084\u207b)",
            "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
            "Molybdate (MoO\u2084\u00b2\u207b)",
            "Chromate (CrO\u2084\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl\u207b)",
                "Fluoride (F\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Hydroxide (OH\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Acetate (C\u2082H\u2083O\u2082\u207b)",
                "Formate (HCOO\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Cyanide (CN\u207b)",
                "Phenolate (C\u2086H\u2085O\u207b)",
                "Oxalate (C\u2082O\u2084\u00b2\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
                "Molybdate (MoO\u2084\u00b2\u207b)",
                "Chromate (CrO\u2084\u00b2\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (C\u2082H\u2083O\u2082\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Chloride (Cl\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Chromate (CrO\u2084\u00b2\u207b)",
                "Cyanide (CN\u207b)",
                "Dichromate (Cr\u2082O\u2087\u00b2\u207b)",
                "Fluoride (F\u207b)",
                "Formate (HCOO\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodide (I\u207b)",
                "Molybdate (MoO\u2084\u00b2\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Oxalate (C\u2082O\u2084\u00b2\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Phenolate (C\u2086H\u2085O\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Thiocyanate (SCN\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Hydroxide (OH\u207b)",
            "Cyanide (CN\u207b)",
            "Azide (N\u2083\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Hypobromite (BrO\u207b)",
            "Hypoiodite (IO\u207b)",
            "Chlorate (ClO\u2083\u207b)",
            "Bromate (BrO\u2083\u207b)",
            "Iodate (IO\u2083\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Perbromate (BrO\u2084\u207b)",
            "Periodate (IO\u2084\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Permanganate (MnO\u2084\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Bicarbonate (HCO\u2083\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Sulfate (SO\u2084\u00b2\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Hydroxide (OH\u207b)",
                "Cyanide (CN\u207b)",
                "Azide (N\u2083\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Hypobromite (BrO\u207b)",
                "Hypoiodite (IO\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Iodate (IO\u2083\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Perbromate (BrO\u2084\u207b)",
                "Periodate (IO\u2084\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Azide (N\u2083\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chloride (Cl\u207b)",
                "Cyanide (CN\u207b)",
                "Fluoride (F\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypobromite (BrO\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Hypoiodite (IO\u207b)",
                "Iodate (IO\u2083\u207b)",
                "Iodide (I\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Perbromate (BrO\u2084\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Periodate (IO\u2084\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Thiocyanate (SCN\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Hydroxide (OH\u207b)",
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Cyanide (CN\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Chlorate (ClO\u2083\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Bisulfite/Hydrogen Sulfite (HSO\u2083\u207b)",
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Hydrogen Sulfate/Bisulfate (HSO\u2084\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Bicarbonate/Hydrogen Carbonate (HCO\u2083\u207b)",
            "Phosphate (PO\u2084\u00b3\u207b)",
            "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
            "Dihydrogen Phosphate (H\u2082PO\u2084\u207b)",
            "Silicate (SiO\u2084\u2074\u207b)",
            "Metasilicate (SiO\u2083\u00b2\u207b)",
            "Arsenite (AsO\u2082\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxide (OH\u207b)",
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Cyanide (CN\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Bisulfite/Hydrogen Sulfite (HSO\u2083\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Hydrogen Sulfate/Bisulfate (HSO\u2084\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Bicarbonate/Hydrogen Carbonate (HCO\u2083\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)",
                "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
                "Dihydrogen Phosphate (H\u2082PO\u2084\u207b)",
                "Silicate (SiO\u2084\u2074\u207b)",
                "Metasilicate (SiO\u2083\u00b2\u207b)",
                "Arsenite (AsO\u2082\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arsenite (AsO\u2082\u207b)",
                "Bicarbonate/Hydrogen Carbonate (HCO\u2083\u207b)",
                "Bisulfite/Hydrogen Sulfite (HSO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chloride (Cl\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Cyanide (CN\u207b)",
                "Dihydrogen Phosphate (H\u2082PO\u2084\u207b)",
                "Fluoride (F\u207b)",
                "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
                "Hydrogen Sulfate/Bisulfate (HSO\u2084\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodide (I\u207b)",
                "Metasilicate (SiO\u2083\u00b2\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)",
                "Silicate (SiO\u2084\u2074\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Fluoride (F-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Hydroxide (OH-)",
            "Cyanide (CN-)",
            "Nitrite (NO2-)",
            "Nitrate (NO3-)",
            "Hydrogen sulfate (HSO4-)",
            "Hydrogen carbonate (HCO3-)",
            "Acetate (CH3COO-)",
            "Perchlorate (ClO4-)",
            "Hypochlorite (ClO-)",
            "Dihydrogen phosphate (H2PO4-)",
            "Hydrogen sulfide (HS-)",
            "Thiocyanate (SCN-)",
            "Azide (N3-)",
            "Hydrogen fluoride (HF2-)",
            "Formate (HCOO-)",
            "Hydrogen sulfite (HSO3-)",
            "Hydrogen oxalate (HC2O4-)",
            "Hydrogen arsenate (HAsO4-)",
            "Hydrogen silicate (HSiO3-)",
            "Hydrogen borate (HB4O7-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Fluoride (F-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Hydroxide (OH-)",
                "Cyanide (CN-)",
                "Nitrite (NO2-)",
                "Nitrate (NO3-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen carbonate (HCO3-)",
                "Acetate (CH3COO-)",
                "Perchlorate (ClO4-)",
                "Hypochlorite (ClO-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Hydrogen sulfide (HS-)",
                "Thiocyanate (SCN-)",
                "Azide (N3-)",
                "Hydrogen fluoride (HF2-)",
                "Formate (HCOO-)",
                "Hydrogen sulfite (HSO3-)",
                "Hydrogen oxalate (HC2O4-)",
                "Hydrogen arsenate (HAsO4-)",
                "Hydrogen silicate (HSiO3-)",
                "Hydrogen borate (HB4O7-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Azide (N3-)",
                "Bromide (Br-)",
                "Chloride (Cl-)",
                "Cyanide (CN-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydrogen arsenate (HAsO4-)",
                "Hydrogen borate (HB4O7-)",
                "Hydrogen carbonate (HCO3-)",
                "Hydrogen fluoride (HF2-)",
                "Hydrogen oxalate (HC2O4-)",
                "Hydrogen silicate (HSiO3-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen sulfide (HS-)",
                "Hydrogen sulfite (HSO3-)",
                "Hydroxide (OH-)",
                "Hypochlorite (ClO-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Perchlorate (ClO4-)",
                "Thiocyanate (SCN-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Fluoride (F\u207b)",
            "Nitrate (NO3\u207b)",
            "Nitrite (NO2\u207b)",
            "Sulfate (SO4\u00b2\u207b)",
            "Sulfite (SO3\u00b2\u207b)",
            "Phosphate (PO4\u00b3\u207b)",
            "Carbonate (CO3\u00b2\u207b)",
            "Hydroxide (OH\u207b)",
            "Cyanide (CN\u207b)",
            "Acetate (C2H3O2\u207b)",
            "Formate (HCOO\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Perchlorate (ClO4\u207b)",
            "Chlorate (ClO3\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Bicarbonate (HCO3\u207b)",
            "Arsenate (AsO4\u00b3\u207b)",
            "Arsenite (AsO3\u00b3\u207b)",
            "Molybdate (MoO4\u00b2\u207b)",
            "Tungstate (WO4\u00b2\u207b)",
            "Vanadate (VO4\u00b3\u207b)",
            "Silicate (SiO4\u2074\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Fluoride (F\u207b)",
                "Nitrate (NO3\u207b)",
                "Nitrite (NO2\u207b)",
                "Sulfate (SO4\u00b2\u207b)",
                "Sulfite (SO3\u00b2\u207b)",
                "Phosphate (PO4\u00b3\u207b)",
                "Carbonate (CO3\u00b2\u207b)",
                "Hydroxide (OH\u207b)",
                "Cyanide (CN\u207b)",
                "Acetate (C2H3O2\u207b)",
                "Formate (HCOO\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Perchlorate (ClO4\u207b)",
                "Chlorate (ClO3\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Bicarbonate (HCO3\u207b)",
                "Arsenate (AsO4\u00b3\u207b)",
                "Arsenite (AsO3\u00b3\u207b)",
                "Molybdate (MoO4\u00b2\u207b)",
                "Tungstate (WO4\u00b2\u207b)",
                "Vanadate (VO4\u00b3\u207b)"
            ],
            "mismatches": [
                "Silicate (SiO4\u2074\u207b)"
            ],
            "true_referents": [
                "Acetate (C2H3O2\u207b)",
                "Arsenate (AsO4\u00b3\u207b)",
                "Arsenite (AsO3\u00b3\u207b)",
                "Bicarbonate (HCO3\u207b)",
                "Bromide (Br\u207b)",
                "Carbonate (CO3\u00b2\u207b)",
                "Chlorate (ClO3\u207b)",
                "Chloride (Cl\u207b)",
                "Cyanide (CN\u207b)",
                "Fluoride (F\u207b)",
                "Formate (HCOO\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodide (I\u207b)",
                "Molybdate (MoO4\u00b2\u207b)",
                "Nitrate (NO3\u207b)",
                "Nitrite (NO2\u207b)",
                "Perchlorate (ClO4\u207b)",
                "Phosphate (PO4\u00b3\u207b)",
                "Sulfate (SO4\u00b2\u207b)",
                "Sulfite (SO3\u00b2\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Tungstate (WO4\u00b2\u207b)",
                "Vanadate (VO4\u00b3\u207b)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Fluoride (F-)",
            "Nitrate (NO3-)",
            "Hydroxide (OH-)",
            "Perchlorate (ClO4-)",
            "Hypochlorite (ClO-)",
            "Cyanide (CN-)",
            "Thiocyanate (SCN-)",
            "Azide (N3-)",
            "Acetate (CH3COO-)",
            "Bicarbonate (HCO3-)",
            "Dihydrogen phosphate (H2PO4-)",
            "Nitrite (NO2-)",
            "Hydrogen sulfate (HSO4-)",
            "Chromate (CrO4-)",
            "Dichromate (Cr2O7-)",
            "Permanganate (MnO4-)",
            "Thiosulfate (S2O3-)",
            "Hydrogen carbonate (HCO3-)",
            "Hydrogen sulfide (HS-)",
            "Peroxynitrite (ONOO-)",
            "Hypobromite (BrO-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Fluoride (F-)",
                "Nitrate (NO3-)",
                "Hydroxide (OH-)",
                "Perchlorate (ClO4-)",
                "Hypochlorite (ClO-)",
                "Cyanide (CN-)",
                "Thiocyanate (SCN-)",
                "Azide (N3-)",
                "Acetate (CH3COO-)",
                "Bicarbonate (HCO3-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Nitrite (NO2-)",
                "Hydrogen sulfate (HSO4-)",
                "Chromate (CrO4-)",
                "Dichromate (Cr2O7-)",
                "Permanganate (MnO4-)",
                "Thiosulfate (S2O3-)",
                "Hydrogen carbonate (HCO3-)",
                "Hydrogen sulfide (HS-)",
                "Peroxynitrite (ONOO-)",
                "Hypobromite (BrO-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Azide (N3-)",
                "Bicarbonate (HCO3-)",
                "Bromide (Br-)",
                "Chloride (Cl-)",
                "Chromate (CrO4-)",
                "Cyanide (CN-)",
                "Dichromate (Cr2O7-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Hydrogen carbonate (HCO3-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen sulfide (HS-)",
                "Hydroxide (OH-)",
                "Hypobromite (BrO-)",
                "Hypochlorite (ClO-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Peroxynitrite (ONOO-)",
                "Thiocyanate (SCN-)",
                "Thiosulfate (S2O3-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride ion (Cl-)",
            "Bromide ion (Br-)",
            "Iodide ion (I-)",
            "Fluoride ion (F-)",
            "Hydroxide ion (OH-)",
            "Nitrate ion (NO3-)",
            "Nitrite ion (NO2-)",
            "Sulfate ion (SO4^2-)",
            "Sulfite ion (SO3^2-)",
            "Carbonate ion (CO3^2-)",
            "Bicarbonate ion (HCO3-)",
            "Phosphate ion (PO4^3-)",
            "Acetate ion (CH3COO-)",
            "Cyanide ion (CN-)",
            "Permanganate ion (MnO4-)",
            "Chromate ion (CrO4^2-)",
            "Dichromate ion (Cr2O7^2-)",
            "Oxalate ion (C2O4^2-)",
            "Thiosulfate ion (S2O3^2-)",
            "Peroxide ion (O2^2-)",
            "Hypochlorite ion (ClO-)",
            "Chlorate ion (ClO3-)",
            "Chlorite ion (ClO2-)",
            "Perchlorate ion (ClO4-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride ion (Cl-)",
                "Bromide ion (Br-)",
                "Iodide ion (I-)",
                "Fluoride ion (F-)",
                "Hydroxide ion (OH-)",
                "Nitrate ion (NO3-)",
                "Nitrite ion (NO2-)",
                "Sulfate ion (SO4^2-)",
                "Sulfite ion (SO3^2-)",
                "Carbonate ion (CO3^2-)",
                "Bicarbonate ion (HCO3-)",
                "Phosphate ion (PO4^3-)",
                "Acetate ion (CH3COO-)",
                "Cyanide ion (CN-)",
                "Permanganate ion (MnO4-)",
                "Chromate ion (CrO4^2-)",
                "Dichromate ion (Cr2O7^2-)",
                "Oxalate ion (C2O4^2-)",
                "Thiosulfate ion (S2O3^2-)",
                "Peroxide ion (O2^2-)",
                "Hypochlorite ion (ClO-)",
                "Chlorate ion (ClO3-)",
                "Chlorite ion (ClO2-)",
                "Perchlorate ion (ClO4-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate ion (CH3COO-)",
                "Bicarbonate ion (HCO3-)",
                "Bromide ion (Br-)",
                "Carbonate ion (CO3^2-)",
                "Chlorate ion (ClO3-)",
                "Chloride ion (Cl-)",
                "Chlorite ion (ClO2-)",
                "Chromate ion (CrO4^2-)",
                "Cyanide ion (CN-)",
                "Dichromate ion (Cr2O7^2-)",
                "Fluoride ion (F-)",
                "Hydroxide ion (OH-)",
                "Hypochlorite ion (ClO-)",
                "Iodide ion (I-)",
                "Nitrate ion (NO3-)",
                "Nitrite ion (NO2-)",
                "Oxalate ion (C2O4^2-)",
                "Perchlorate ion (ClO4-)",
                "Permanganate ion (MnO4-)",
                "Peroxide ion (O2^2-)",
                "Phosphate ion (PO4^3-)",
                "Sulfate ion (SO4^2-)",
                "Sulfite ion (SO3^2-)",
                "Thiosulfate ion (S2O3^2-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl^-)",
            "Bromide (Br^-)",
            "Iodide (I^-)",
            "Fluoride (F^-)",
            "Nitrite (NO\u2082^-)",
            "Nitrate (NO\u2083^-)",
            "Perchlorate (ClO\u2084^-)",
            "Chlorate (ClO\u2083^-)",
            "Bromate (BrO\u2083^-)",
            "Iodate (IO\u2083^-)",
            "Perbromate (BrO\u2084^-)",
            "Hypochlorite (ClO^-)",
            "Chlorite (ClO\u2082^-)",
            "Bromite (BrO\u2082^-)",
            "Cyanide (CN^-)",
            "Thiocyanate (SCN^-)",
            "Azide (N\u2083^-)",
            "Hydroxide (OH^-)",
            "Permanganate (MnO\u2084^-)",
            "Hydrogen carbonate (HCO\u2083^-)",
            "Hydrosulfide (HS^-)",
            "Hypobromite (BrO^-)",
            "Hypoiodite (IO^-)",
            "Hypothiocyanite (OSCN^-)",
            "Hydrogensulfide (HS^-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl^-)",
                "Bromide (Br^-)",
                "Iodide (I^-)",
                "Fluoride (F^-)",
                "Nitrite (NO\u2082^-)",
                "Nitrate (NO\u2083^-)",
                "Perchlorate (ClO\u2084^-)",
                "Chlorate (ClO\u2083^-)",
                "Bromate (BrO\u2083^-)",
                "Iodate (IO\u2083^-)",
                "Perbromate (BrO\u2084^-)",
                "Hypochlorite (ClO^-)",
                "Chlorite (ClO\u2082^-)",
                "Bromite (BrO\u2082^-)",
                "Cyanide (CN^-)",
                "Thiocyanate (SCN^-)",
                "Azide (N\u2083^-)",
                "Hydroxide (OH^-)",
                "Permanganate (MnO\u2084^-)",
                "Hydrogen carbonate (HCO\u2083^-)",
                "Hydrosulfide (HS^-)",
                "Hypobromite (BrO^-)",
                "Hypoiodite (IO^-)",
                "Hypothiocyanite (OSCN^-)"
            ],
            "mismatches": [
                "Hydrogensulfide (HS^-)"
            ],
            "true_referents": [
                "Azide (N\u2083^-)",
                "Bromate (BrO\u2083^-)",
                "Bromide (Br^-)",
                "Bromite (BrO\u2082^-)",
                "Chlorate (ClO\u2083^-)",
                "Chloride (Cl^-)",
                "Chlorite (ClO\u2082^-)",
                "Cyanide (CN^-)",
                "Fluoride (F^-)",
                "Hydrogen carbonate (HCO\u2083^-)",
                "Hydrosulfide (HS^-)",
                "Hydroxide (OH^-)",
                "Hypobromite (BrO^-)",
                "Hypochlorite (ClO^-)",
                "Hypoiodite (IO^-)",
                "Hypothiocyanite (OSCN^-)",
                "Iodate (IO\u2083^-)",
                "Iodide (I^-)",
                "Nitrate (NO\u2083^-)",
                "Nitrite (NO\u2082^-)",
                "Perbromate (BrO\u2084^-)",
                "Perchlorate (ClO\u2084^-)",
                "Permanganate (MnO\u2084^-)",
                "Thiocyanate (SCN^-)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Fluoride (F-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Hydroxide (OH-)",
            "Nitrate (NO3-)",
            "Bicarbonate (HCO3-)",
            "Cyanide (CN-)",
            "Thiocyanate (SCN-)",
            "Hypochlorite (ClO-)",
            "Perchlorate (ClO4-)",
            "Permanganate (MnO4-)",
            "Azide (N3-)",
            "Hydride (H-)",
            "Nitrite (NO2-)",
            "Bisulfite (HSO3-)",
            "Hydrogen sulfide (HS-)",
            "Dihydrogen phosphate (H2PO4-)",
            "Formate (HCOO-)",
            "Acetate (CH3COO-)",
            "Hydrogen carbonate (HCO3-)",
            "Hydrogen sulfate (HSO4-)",
            "Hypobromite (BrO-)",
            "Hypoiodite (IO-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Fluoride (F-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Hydroxide (OH-)",
                "Nitrate (NO3-)",
                "Bicarbonate (HCO3-)",
                "Cyanide (CN-)",
                "Thiocyanate (SCN-)",
                "Hypochlorite (ClO-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Azide (N3-)",
                "Hydride (H-)",
                "Nitrite (NO2-)",
                "Bisulfite (HSO3-)",
                "Hydrogen sulfide (HS-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Formate (HCOO-)",
                "Acetate (CH3COO-)",
                "Hydrogen sulfate (HSO4-)",
                "Hypobromite (BrO-)",
                "Hypoiodite (IO-)"
            ],
            "mismatches": [
                "Hydrogen carbonate (HCO3-)"
            ],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Azide (N3-)",
                "Bicarbonate (HCO3-)",
                "Bisulfite (HSO3-)",
                "Bromide (Br-)",
                "Chloride (Cl-)",
                "Cyanide (CN-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydride (H-)",
                "Hydrogen carbonate (HCO3-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen sulfide (HS-)",
                "Hydroxide (OH-)",
                "Hypobromite (BrO-)",
                "Hypochlorite (ClO-)",
                "Hypoiodite (IO-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Thiocyanate (SCN-)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "fluoride (F\u207b)",
            "chloride (Cl\u207b)",
            "bromide (Br\u207b)",
            "iodide (I\u207b)",
            "hydride (H\u207b)",
            "hydroxide (OH\u207b)",
            "cyanide (CN\u207b)",
            "nitrate (NO\u2083\u207b)",
            "nitrite (NO\u2082\u207b)",
            "hypochlorite (ClO\u207b)",
            "chlorite (ClO\u2082\u207b)",
            "chlorate (ClO\u2083\u207b)",
            "perchlorate (ClO\u2084\u207b)",
            "hypobromite (BrO\u207b)",
            "bromite (BrO\u2082\u207b)",
            "bromate (BrO\u2083\u207b)",
            "perbromate (BrO\u2084\u207b)",
            "hypoiodite (IO\u207b)",
            "iodite (IO\u2082\u207b)",
            "iodate (IO\u2083\u207b)",
            "periodate (IO\u2084\u207b)",
            "hydrogen sulfide (HS\u207b)",
            "bisulfide (HSO\u2083\u207b)",
            "hydrogen selenide (HSe\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "fluoride (F\u207b)",
                "chloride (Cl\u207b)",
                "bromide (Br\u207b)",
                "iodide (I\u207b)",
                "hydride (H\u207b)",
                "hydroxide (OH\u207b)",
                "cyanide (CN\u207b)",
                "nitrate (NO\u2083\u207b)",
                "nitrite (NO\u2082\u207b)",
                "hypochlorite (ClO\u207b)",
                "chlorite (ClO\u2082\u207b)",
                "chlorate (ClO\u2083\u207b)",
                "perchlorate (ClO\u2084\u207b)",
                "hypobromite (BrO\u207b)",
                "bromite (BrO\u2082\u207b)",
                "bromate (BrO\u2083\u207b)",
                "perbromate (BrO\u2084\u207b)",
                "hypoiodite (IO\u207b)",
                "iodite (IO\u2082\u207b)",
                "iodate (IO\u2083\u207b)",
                "periodate (IO\u2084\u207b)",
                "hydrogen sulfide (HS\u207b)",
                "bisulfide (HSO\u2083\u207b)",
                "hydrogen selenide (HSe\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "bisulfide (HSO\u2083\u207b)",
                "bromate (BrO\u2083\u207b)",
                "bromide (Br\u207b)",
                "bromite (BrO\u2082\u207b)",
                "chlorate (ClO\u2083\u207b)",
                "chloride (Cl\u207b)",
                "chlorite (ClO\u2082\u207b)",
                "cyanide (CN\u207b)",
                "fluoride (F\u207b)",
                "hydride (H\u207b)",
                "hydrogen selenide (HSe\u207b)",
                "hydrogen sulfide (HS\u207b)",
                "hydroxide (OH\u207b)",
                "hypobromite (BrO\u207b)",
                "hypochlorite (ClO\u207b)",
                "hypoiodite (IO\u207b)",
                "iodate (IO\u2083\u207b)",
                "iodide (I\u207b)",
                "iodite (IO\u2082\u207b)",
                "nitrate (NO\u2083\u207b)",
                "nitrite (NO\u2082\u207b)",
                "perbromate (BrO\u2084\u207b)",
                "perchlorate (ClO\u2084\u207b)",
                "periodate (IO\u2084\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Nitride (N\u00b3\u207b)",
            "Hydride (H\u207b)",
            "Cyanide (CN\u207b)",
            "Hydroxide (OH\u207b)",
            "Amide (NH\u2082\u207b)",
            "Azide (N\u2083\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Chlorate (ClO\u2083\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b)",
            "Bicarbonate (HCO\u2083\u207b)",
            "Sulfite (SO\u2083\u00b2\u207b)",
            "Bisulfite (HSO\u2083\u207b)",
            "Sulfate (SO\u2084\u00b2\u207b)",
            "Hydrogen Sulfate (HSO\u2084\u207b)",
            "Phosphate (PO\u2084\u00b3\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Nitride (N\u00b3\u207b)",
                "Hydride (H\u207b)",
                "Cyanide (CN\u207b)",
                "Hydroxide (OH\u207b)",
                "Amide (NH\u2082\u207b)",
                "Azide (N\u2083\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Bisulfite (HSO\u2083\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Hydrogen Sulfate (HSO\u2084\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Amide (NH\u2082\u207b)",
                "Azide (N\u2083\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Bisulfite (HSO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chloride (Cl\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Cyanide (CN\u207b)",
                "Fluoride (F\u207b)",
                "Hydride (H\u207b)",
                "Hydrogen Sulfate (HSO\u2084\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodide (I\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitride (N\u00b3\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b)",
                "Sulfite (SO\u2083\u00b2\u207b)",
                "Thiocyanate (SCN\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Fluoride (F-)",
            "Cyanide (CN-)",
            "Hydroxide (OH-)",
            "Nitrite (NO2-)",
            "Nitrate (NO3-)",
            "Sulfite (SO3-)",
            "Bisulfite (HSO3-)",
            "Phosphate (PO4-)",
            "Hydrogen phosphate (HPO4-)",
            "Dihydrogen phosphate (H2PO4-)",
            "Acetate (CH3COO-)",
            "Formate (HCOO-)",
            "Oxalate (C2O4-)",
            "Permanganate (MnO4-)",
            "Perchlorate (ClO4-)",
            "Hypochlorite (ClO-)",
            "Chlorite (ClO2-)",
            "Chlorate (ClO3-)",
            "Bicarbonate (HCO3-)",
            "Carbonate (CO3-)",
            "Thiosulfate (S2O3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Fluoride (F-)",
                "Cyanide (CN-)",
                "Hydroxide (OH-)",
                "Nitrite (NO2-)",
                "Nitrate (NO3-)",
                "Sulfite (SO3-)",
                "Bisulfite (HSO3-)",
                "Phosphate (PO4-)",
                "Hydrogen phosphate (HPO4-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Acetate (CH3COO-)",
                "Formate (HCOO-)",
                "Oxalate (C2O4-)",
                "Permanganate (MnO4-)",
                "Perchlorate (ClO4-)",
                "Hypochlorite (ClO-)",
                "Chlorite (ClO2-)",
                "Chlorate (ClO3-)",
                "Bicarbonate (HCO3-)",
                "Carbonate (CO3-)",
                "Thiosulfate (S2O3-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Bicarbonate (HCO3-)",
                "Bisulfite (HSO3-)",
                "Bromide (Br-)",
                "Carbonate (CO3-)",
                "Chlorate (ClO3-)",
                "Chloride (Cl-)",
                "Chlorite (ClO2-)",
                "Cyanide (CN-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydrogen phosphate (HPO4-)",
                "Hydroxide (OH-)",
                "Hypochlorite (ClO-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Oxalate (C2O4-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Phosphate (PO4-)",
                "Sulfite (SO3-)",
                "Thiosulfate (S2O3-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": "[\n\"Chloride ion (Cl-)\" ,\n\"Bromide ion (Br-)\" ,\n\"Iodide ion (I-)\" ,\n\"Fluoride ion (F-)\" ,\n\"Hydroxide ion (OH-)\" ,\n\"Hydrogen carbonate ion (HCO3-)\" ,\n\"Carbonate ion (CO32-)\" ,\n\"Sulfide ion (S2-)\" ,\n\"Thiosulfate ion (S2O32-)\" ,\n\"Phosphate ion (PO43-)\" ,\n\"Arsenate ion (AsO43-)\" ,\n\"Silicate ion (SiO43-)\" ,\n\"Phosphite ion (PO33-)\" ,\n\"Arsonate ion (AsO33-)\" ,\n\"Chromate ion (CrO42-)\" ,\n\"Molybdate ion (MoO42-)\" ,\n\"Tungstate ion (WO42-)\" ,\n\"Perchlorate ion (ClO4-)\" ,\n\"Borate ion (BO33-)\" ,\n\"Metaphosphate ion (PO33-)\" ,\n\"Pyrophosphate ion (P2O74-)\" ,\n\"Polyphosphate ion (PnO3n-)\" ,\n\"Silicofluoride ion (SiF6-)\" ,\n\"Aluminate ion (AlO2-)\" ,\n\"Oxalate ion (C2O42-)\" ,\n\"Tartrate ion (C4H4O63-)\"",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F-)",
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Hydride (H-)",
            "Oxide (O2-)",
            "Hydroxide (OH-)",
            "Nitride (N3-)",
            "Phosphide (P3-)",
            "Carbonate (CO32-)",
            "Bicarbonate (HCO3-)",
            "Cyanide (CN-)",
            "Thiocyanate (SCN-)",
            "Permanganate (MnO4-)",
            "Chromate (CrO42-)",
            "Dichromate (Cr2O72-)",
            "Sulfide (S2-)",
            "Sulfite (SO32-)",
            "Bisulfite (HSO3-)",
            "Thiosulfate (S2O32-)",
            "Metabisulfite (S2O52-)",
            "Phosphate (PO43-)",
            "Hydrogen phosphate (HPO42-)",
            "Dihydrogen phosphate (H2PO4-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F-)",
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Hydride (H-)",
                "Oxide (O2-)",
                "Hydroxide (OH-)",
                "Nitride (N3-)",
                "Phosphide (P3-)",
                "Carbonate (CO32-)",
                "Bicarbonate (HCO3-)",
                "Cyanide (CN-)",
                "Thiocyanate (SCN-)",
                "Permanganate (MnO4-)",
                "Chromate (CrO42-)",
                "Dichromate (Cr2O72-)",
                "Sulfide (S2-)",
                "Sulfite (SO32-)",
                "Bisulfite (HSO3-)",
                "Thiosulfate (S2O32-)",
                "Metabisulfite (S2O52-)",
                "Phosphate (PO43-)",
                "Hydrogen phosphate (HPO42-)",
                "Dihydrogen phosphate (H2PO4-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bicarbonate (HCO3-)",
                "Bisulfite (HSO3-)",
                "Bromide (Br-)",
                "Carbonate (CO32-)",
                "Chloride (Cl-)",
                "Chromate (CrO42-)",
                "Cyanide (CN-)",
                "Dichromate (Cr2O72-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Hydride (H-)",
                "Hydrogen phosphate (HPO42-)",
                "Hydroxide (OH-)",
                "Iodide (I-)",
                "Metabisulfite (S2O52-)",
                "Nitride (N3-)",
                "Oxide (O2-)",
                "Permanganate (MnO4-)",
                "Phosphate (PO43-)",
                "Phosphide (P3-)",
                "Sulfide (S2-)",
                "Sulfite (SO32-)",
                "Thiocyanate (SCN-)",
                "Thiosulfate (S2O32-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            {
                "Canonical name": "acetate (CH3COO-)",
                "Abbreviated identifier": "(CH3COO-)"
            },
            {
                "Canonical name": "bromide (Br-)",
                "Abbreviated identifier": "(Br-)"
            },
            {
                "Canonical name": "chloride (Cl-)",
                "Abbreviated identifier": "(Cl-)"
            },
            {
                "Canonical name": "dichromate (Cr2O72-)",
                "Abbreviated identifier": "(Cr2O72-)"
            },
            {
                "Canonical name": "hydrogen carbonate (HCO3-)",
                "Abbreviated identifier": "(HCO3-)"
            },
            {
                "Canonical name": "iodide (I-)",
                "Abbreviated identifier": "(I-)"
            },
            {
                "Canonical name": "nitrate (NO3-)",
                "Abbreviated identifier": "(NO3-)"
            },
            {
                "Canonical name": "phosphate (PO43-)",
                "Abbreviated identifier": "(PO43-)"
            },
            {
                "Canonical name": "sulfate (SO42-)",
                "Abbreviated identifier": "(SO42-)"
            },
            {
                "Canonical name": "sulfide (S2-)",
                "Abbreviated identifier": "(S2-)"
            },
            {
                "Canonical name": "sulfite (SO32-)",
                "Abbreviated identifier": "(SO32-)"
            },
            {
                "Canonical name": "thiocyanate (SCN-)",
                "Abbreviated identifier": "(SCN-)"
            },
            {
                "Canonical name": "trifluoromethanesulfonate (CF3SO3-)",
                "Abbreviated identifier": "(CF3SO3-)"
            },
            {
                "Canonical name": "hydrogen phosphate (HPO42-)",
                "Abbreviated identifier": "(HPO42-)"
            },
            {
                "Canonical name": "hydrogen sulfate (HSO4-)",
                "Abbreviated identifier": "(HSO4-)"
            },
            {
                "Canonical name": "perchlorate (ClO4-)",
                "Abbreviated identifier": "(ClO4-)"
            },
            {
                "Canonical name": "peroxodisulfate (S2O82-)",
                "Abbreviated identifier": "(S2O82-)"
            },
            {
                "Canonical name": "cyanide (CN-)",
                "Abbreviated identifier": "(CN-)"
            },
            {
                "Canonical name": "nitrite (NO2-)",
                "Abbreviated identifier": "(NO2-)"
            },
            {
                "Canonical name": "hydrogen sulfide (H2S)",
                "Abbreviated identifier": "(H2S)"
            },
            {
                "Canonical name": "sulfur dioxide (SO2)",
                "Abbreviated identifier": "(SO2)"
            },
            {
                "Canonical name": "dithionite (S2O22-)",
                "Abbreviated identifier": "(S2O22-)"
            },
            {
                "Canonical name": "hypochlorite (ClO2-)",
                "Abbreviated identifier": "(ClO2-)"
            },
            {
                "Canonical name": "chlorite (ClO2-)",
                "Abbreviated identifier": "(ClO2-)"
            },
            {
                "Canonical name": "hypoiodite (IO2-)",
                "Abbreviated identifier": "(IO2-)"
            },
            {
                "Canonical name": "iodite (IO3-)",
                "Abbreviated identifier": "(IO3-)"
            },
            {
                "Canonical name": "periodate (IO4-)",
                "Abbreviated identifier": "(IO4-)"
            },
            {
                "Canonical name": "chlorate (ClO3-)",
                "Abbreviated identifier": "(ClO3-)"
            },
            {
                "Canonical name": "peroxocyanate (OClO2-)",
                "Abbreviated identifier": "(OClO2-)"
            },
            {
                "Canonical name": "chlorite (ClO2-)",
                "Abbreviated identifier": "(ClO2-)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetate (CH3COO-)",
                "bromide (Br-)",
                "chloride (Cl-)",
                "dichromate (Cr2O72-)",
                "hydrogen carbonate (HCO3-)",
                "iodide (I-)",
                "nitrate (NO3-)",
                "phosphate (PO43-)",
                "sulfate (SO42-)",
                "sulfide (S2-)",
                "sulfite (SO32-)",
                "thiocyanate (SCN-)",
                "trifluoromethanesulfonate (CF3SO3-)",
                "hydrogen phosphate (HPO42-)",
                "hydrogen sulfate (HSO4-)",
                "perchlorate (ClO4-)",
                "peroxodisulfate (S2O82-)",
                "cyanide (CN-)",
                "nitrite (NO2-)",
                "hydrogen sulfide (H2S)",
                "sulfur dioxide (SO2)",
                "dithionite (S2O22-)",
                "chlorite (ClO2-)"
            ],
            "mismatches": [
                "hypoiodite (IO2-)",
                "iodite (IO3-)",
                "periodate (IO4-)",
                "chlorate (ClO3-)",
                "peroxocyanate (OClO2-)"
            ],
            "true_referents": [
                "{\"Canonical name\": \"acetate (CH3COO-)\", \"Abbreviated identifier\": \"(CH3COO-)\"}",
                "{\"Canonical name\": \"bromide (Br-)\", \"Abbreviated identifier\": \"(Br-)\"}",
                "{\"Canonical name\": \"chloride (Cl-)\", \"Abbreviated identifier\": \"(Cl-)\"}",
                "{\"Canonical name\": \"chlorite (ClO2-)\", \"Abbreviated identifier\": \"(ClO2-)\"}",
                "{\"Canonical name\": \"cyanide (CN-)\", \"Abbreviated identifier\": \"(CN-)\"}",
                "{\"Canonical name\": \"dichromate (Cr2O72-)\", \"Abbreviated identifier\": \"(Cr2O72-)\"}",
                "{\"Canonical name\": \"dithionite (S2O22-)\", \"Abbreviated identifier\": \"(S2O22-)\"}",
                "{\"Canonical name\": \"hydrogen carbonate (HCO3-)\", \"Abbreviated identifier\": \"(HCO3-)\"}",
                "{\"Canonical name\": \"hydrogen phosphate (HPO42-)\", \"Abbreviated identifier\": \"(HPO42-)\"}",
                "{\"Canonical name\": \"hydrogen sulfate (HSO4-)\", \"Abbreviated identifier\": \"(HSO4-)\"}",
                "{\"Canonical name\": \"hydrogen sulfide (H2S)\", \"Abbreviated identifier\": \"(H2S)\"}",
                "{\"Canonical name\": \"hypochlorite (ClO2-)\", \"Abbreviated identifier\": \"(ClO2-)\"}",
                "{\"Canonical name\": \"iodide (I-)\", \"Abbreviated identifier\": \"(I-)\"}",
                "{\"Canonical name\": \"nitrate (NO3-)\", \"Abbreviated identifier\": \"(NO3-)\"}",
                "{\"Canonical name\": \"nitrite (NO2-)\", \"Abbreviated identifier\": \"(NO2-)\"}",
                "{\"Canonical name\": \"perchlorate (ClO4-)\", \"Abbreviated identifier\": \"(ClO4-)\"}",
                "{\"Canonical name\": \"peroxodisulfate (S2O82-)\", \"Abbreviated identifier\": \"(S2O82-)\"}",
                "{\"Canonical name\": \"phosphate (PO43-)\", \"Abbreviated identifier\": \"(PO43-)\"}",
                "{\"Canonical name\": \"sulfate (SO42-)\", \"Abbreviated identifier\": \"(SO42-)\"}",
                "{\"Canonical name\": \"sulfide (S2-)\", \"Abbreviated identifier\": \"(S2-)\"}",
                "{\"Canonical name\": \"sulfite (SO32-)\", \"Abbreviated identifier\": \"(SO32-)\"}",
                "{\"Canonical name\": \"sulfur dioxide (SO2)\", \"Abbreviated identifier\": \"(SO2)\"}",
                "{\"Canonical name\": \"thiocyanate (SCN-)\", \"Abbreviated identifier\": \"(SCN-)\"}",
                "{\"Canonical name\": \"trifluoromethanesulfonate (CF3SO3-)\", \"Abbreviated identifier\": \"(CF3SO3-)\"}"
            ],
            "TP": 23,
            "FP": 5,
            "FN": 0
        }
    }
]