[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "chloride (Cl-)",
            "bromide (Br-)",
            "iodide (I-)",
            "fluoride (F-)",
            "sulfide (S2-)",
            "cyanide (CN-)",
            "nitrate (NO3-)",
            "bicarbonate (HCO3-)",
            "sulfite (SO32-)",
            "phosphate (PO43-)",
            "hydroxide (OH-)",
            "permanganate (MnO4-)",
            "perchlorate (ClO4-)",
            "chlorite (ClO2-)",
            "hypochlorite (ClO-)",
            "sulfate (SO42-)",
            "thiocyanate (SCN-)",
            "arsenite (AsO33-)",
            "arsenate (AsO43-)",
            "borate (BO33-)",
            "chromate (CrO42-)",
            "dichromate (Cr2O72-)",
            "nitrite (NO2-)",
            "carbonate (CO32-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "chloride (Cl-)",
                "bromide (Br-)",
                "iodide (I-)",
                "fluoride (F-)",
                "sulfide (S2-)",
                "cyanide (CN-)",
                "nitrate (NO3-)",
                "bicarbonate (HCO3-)",
                "sulfite (SO32-)",
                "phosphate (PO43-)",
                "hydroxide (OH-)",
                "permanganate (MnO4-)",
                "perchlorate (ClO4-)",
                "chlorite (ClO2-)",
                "hypochlorite (ClO-)",
                "sulfate (SO42-)",
                "thiocyanate (SCN-)",
                "arsenite (AsO33-)",
                "arsenate (AsO43-)",
                "borate (BO33-)",
                "chromate (CrO42-)",
                "dichromate (Cr2O72-)",
                "nitrite (NO2-)",
                "carbonate (CO32-)"
            ],
            "mismatches": [],
            "true_referents": [
                "arsenate (AsO43-)",
                "arsenite (AsO33-)",
                "bicarbonate (HCO3-)",
                "borate (BO33-)",
                "bromide (Br-)",
                "carbonate (CO32-)",
                "chloride (Cl-)",
                "chlorite (ClO2-)",
                "chromate (CrO42-)",
                "cyanide (CN-)",
                "dichromate (Cr2O72-)",
                "fluoride (F-)",
                "hydroxide (OH-)",
                "hypochlorite (ClO-)",
                "iodide (I-)",
                "nitrate (NO3-)",
                "nitrite (NO2-)",
                "perchlorate (ClO4-)",
                "permanganate (MnO4-)",
                "phosphate (PO43-)",
                "sulfate (SO42-)",
                "sulfide (S2-)",
                "sulfite (SO32-)",
                "thiocyanate (SCN-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F-)",
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Hydroxide (OH-)",
            "Nitrate (NO3-)",
            "Acetate (C2H3O2-)",
            "Carbonate (CO3^2-)",
            "Sulfate (SO4^2-)",
            "Phosphate (PO4^3-)",
            "Permanganate (MnO4-)",
            "Dichromate (Cr2O7^2-)",
            "Thiocyanate (SCN-)",
            "Cyanide (CN-)",
            "Azide (N3-)",
            "Perchlorate (ClO4-)",
            "Bisulfate (HSO4-)",
            "Oxalate (C2O4^2-)",
            "Aluminate (AlO2-)",
            "Silicate (SiO3^2-)",
            "Chromate (CrO4^2-)",
            "Molybdate (MoO4^2-)",
            "Tungstate (WO4^2-)",
            "Vanadate (VO4^3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F-)",
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Hydroxide (OH-)",
                "Nitrate (NO3-)",
                "Acetate (C2H3O2-)",
                "Carbonate (CO3^2-)",
                "Sulfate (SO4^2-)",
                "Phosphate (PO4^3-)",
                "Permanganate (MnO4-)",
                "Dichromate (Cr2O7^2-)",
                "Thiocyanate (SCN-)",
                "Cyanide (CN-)",
                "Azide (N3-)",
                "Perchlorate (ClO4-)",
                "Bisulfate (HSO4-)",
                "Oxalate (C2O4^2-)",
                "Aluminate (AlO2-)",
                "Silicate (SiO3^2-)",
                "Chromate (CrO4^2-)",
                "Molybdate (MoO4^2-)",
                "Tungstate (WO4^2-)",
                "Vanadate (VO4^3-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (C2H3O2-)",
                "Aluminate (AlO2-)",
                "Azide (N3-)",
                "Bisulfate (HSO4-)",
                "Bromide (Br-)",
                "Carbonate (CO3^2-)",
                "Chloride (Cl-)",
                "Chromate (CrO4^2-)",
                "Cyanide (CN-)",
                "Dichromate (Cr2O7^2-)",
                "Fluoride (F-)",
                "Hydroxide (OH-)",
                "Iodide (I-)",
                "Molybdate (MoO4^2-)",
                "Nitrate (NO3-)",
                "Oxalate (C2O4^2-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Phosphate (PO4^3-)",
                "Silicate (SiO3^2-)",
                "Sulfate (SO4^2-)",
                "Thiocyanate (SCN-)",
                "Tungstate (WO4^2-)",
                "Vanadate (VO4^3-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Hydroxide (OH\u207b)",
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Cyanide (CN\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Hydrogen Carbonate (HCO\u2083\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Permanganate (MnO\u2084\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Bicarbonate (HCO\u2083\u207b)",
            "Hydrogensulfite (HSO\u2083\u207b)",
            "Hydrogensulfate (HSO\u2084\u207b)",
            "Hydrogenphosphate (HPO\u2084\u00b2\u207b)",
            "Dihydrogenphosphate (H\u2082PO\u2084\u207b)",
            "Hydrogenpyrophosphate (H\u2082P\u2082O\u2087\u207b)",
            "Hydrogenarsenate (HAsO\u2084\u00b2\u207b)",
            "Hydrogenselenate (HSeO\u2084\u207b)",
            "Hydrogenchromate (HCrO\u2084\u207b)",
            "Hydrogentellurate (HTeO\u2084\u207b)",
            "Hydrogenperoxide (HO\u2082\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxide (OH\u207b)",
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Cyanide (CN\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Hydrogen Carbonate (HCO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Hydrogensulfite (HSO\u2083\u207b)",
                "Hydrogensulfate (HSO\u2084\u207b)",
                "Hydrogenphosphate (HPO\u2084\u00b2\u207b)",
                "Dihydrogenphosphate (H\u2082PO\u2084\u207b)",
                "Hydrogenpyrophosphate (H\u2082P\u2082O\u2087\u207b)",
                "Hydrogenarsenate (HAsO\u2084\u00b2\u207b)",
                "Hydrogenselenate (HSeO\u2084\u207b)",
                "Hydrogenchromate (HCrO\u2084\u207b)",
                "Hydrogentellurate (HTeO\u2084\u207b)",
                "Hydrogenperoxide (HO\u2082\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bicarbonate (HCO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Chloride (Cl\u207b)",
                "Cyanide (CN\u207b)",
                "Dihydrogenphosphate (H\u2082PO\u2084\u207b)",
                "Fluoride (F\u207b)",
                "Hydrogen Carbonate (HCO\u2083\u207b)",
                "Hydrogenarsenate (HAsO\u2084\u00b2\u207b)",
                "Hydrogenchromate (HCrO\u2084\u207b)",
                "Hydrogenperoxide (HO\u2082\u207b)",
                "Hydrogenphosphate (HPO\u2084\u00b2\u207b)",
                "Hydrogenpyrophosphate (H\u2082P\u2082O\u2087\u207b)",
                "Hydrogenselenate (HSeO\u2084\u207b)",
                "Hydrogensulfate (HSO\u2084\u207b)",
                "Hydrogensulfite (HSO\u2083\u207b)",
                "Hydrogentellurate (HTeO\u2084\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodide (I\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Thiocyanate (SCN\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Hydroxide (OH\u207b)",
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Cyanide (CN\u207b)",
            "Oxide (O\u00b2\u207b) - as a component of complex anions",
            "Nitride (N\u00b3\u207b) - as a component of complex anions",
            "Sulfide (S\u00b2\u207b) - as a component of complex anions",
            "Phosphide (P\u00b3\u207b) - as a component of complex anions",
            "Perchlorate (ClO\u2084\u207b)",
            "Chlorate (ClO\u2083\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Bromate (BrO\u2083\u207b)",
            "Iodate (IO\u2083\u207b)",
            "Sulfate (SO\u2084\u00b2\u207b) - as a component of complex anions",
            "Nitrate (NO\u2083\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Carbonate (CO\u2083\u00b2\u207b) - as a component of complex anions",
            "Bicarbonate (HCO\u2083\u207b)",
            "Phosphate (PO\u2084\u00b3\u207b) - as a component of complex anions",
            "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
            "Dihydrogen Phosphate (H\u2082PO\u2084\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxide (OH\u207b)",
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Cyanide (CN\u207b)",
                "Oxide (O\u00b2\u207b) - as a component of complex anions",
                "Nitride (N\u00b3\u207b) - as a component of complex anions",
                "Sulfide (S\u00b2\u207b) - as a component of complex anions",
                "Phosphide (P\u00b3\u207b) - as a component of complex anions",
                "Perchlorate (ClO\u2084\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Iodate (IO\u2083\u207b)",
                "Sulfate (SO\u2084\u00b2\u207b) - as a component of complex anions",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b) - as a component of complex anions",
                "Bicarbonate (HCO\u2083\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b) - as a component of complex anions",
                "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
                "Dihydrogen Phosphate (H\u2082PO\u2084\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bicarbonate (HCO\u2083\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Carbonate (CO\u2083\u00b2\u207b) - as a component of complex anions",
                "Chlorate (ClO\u2083\u207b)",
                "Chloride (Cl\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Cyanide (CN\u207b)",
                "Dihydrogen Phosphate (H\u2082PO\u2084\u207b)",
                "Fluoride (F\u207b)",
                "Hydrogen Phosphate (HPO\u2084\u00b2\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodate (IO\u2083\u207b)",
                "Iodide (I\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitride (N\u00b3\u207b) - as a component of complex anions",
                "Nitrite (NO\u2082\u207b)",
                "Oxide (O\u00b2\u207b) - as a component of complex anions",
                "Perchlorate (ClO\u2084\u207b)",
                "Phosphate (PO\u2084\u00b3\u207b) - as a component of complex anions",
                "Phosphide (P\u00b3\u207b) - as a component of complex anions",
                "Sulfate (SO\u2084\u00b2\u207b) - as a component of complex anions",
                "Sulfide (S\u00b2\u207b) - as a component of complex anions"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Fluoride (F-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Hydroxide (OH-)",
            "Nitrate (NO3-)",
            "Nitrite (NO2-)",
            "Bicarbonate (HCO3-)",
            "Bisulfate (HSO4-)",
            "Permanganate (MnO4-)",
            "Hydrosulfide (HS-)",
            "Cyanide (CN-)",
            "Acetate (CH3COO-)",
            "Formate (HCOO-)",
            "Hypochlorite (ClO-)",
            "Chlorate (ClO3-)",
            "Perchlorate (ClO4-)",
            "Bromate (BrO3-)",
            "Iodate (IO3-)",
            "Dihydrogen phosphate (H2PO4-)",
            "Hydrogen sulfate (HSO4-)",
            "Hydrogen sulfide (HS-)",
            "Thiocyanate (SCN-)",
            "Azide (N3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Fluoride (F-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Hydroxide (OH-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Bicarbonate (HCO3-)",
                "Bisulfate (HSO4-)",
                "Permanganate (MnO4-)",
                "Hydrosulfide (HS-)",
                "Cyanide (CN-)",
                "Acetate (CH3COO-)",
                "Formate (HCOO-)",
                "Hypochlorite (ClO-)",
                "Chlorate (ClO3-)",
                "Perchlorate (ClO4-)",
                "Bromate (BrO3-)",
                "Iodate (IO3-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen sulfide (HS-)",
                "Thiocyanate (SCN-)",
                "Azide (N3-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Azide (N3-)",
                "Bicarbonate (HCO3-)",
                "Bisulfate (HSO4-)",
                "Bromate (BrO3-)",
                "Bromide (Br-)",
                "Chlorate (ClO3-)",
                "Chloride (Cl-)",
                "Cyanide (CN-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen sulfide (HS-)",
                "Hydrosulfide (HS-)",
                "Hydroxide (OH-)",
                "Hypochlorite (ClO-)",
                "Iodate (IO3-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Thiocyanate (SCN-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Fluoride (F-)",
            "Hydroxide (OH-)",
            "Nitrate (NO3-)",
            "Nitrite (NO2-)",
            "Acetate (C2H3O2-)",
            "Permanganate (MnO4-)",
            "Cyanide (CN-)",
            "Sulfide (S2-)",
            "Phosphate (PO4^3-)",
            "Carbonate (CO3^2-)",
            "Chlorate (ClO3-)",
            "Perchlorate (ClO4-)",
            "Thiocyanate (SCN-)",
            "Arsenate (AsO4^3-)",
            "Bicarbonate (HCO3-)",
            "Hydrogen phosphate (H2PO4-)",
            "Dichromate (Cr2O7^2-)",
            "Selenate (SeO4^2-)",
            "Borate (BO3^3-)",
            "Formate (HCOO-)",
            "Oxalate (C2O4^2-)",
            "Tartrate (C4H4O6^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Fluoride (F-)",
                "Hydroxide (OH-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Acetate (C2H3O2-)",
                "Permanganate (MnO4-)",
                "Cyanide (CN-)",
                "Sulfide (S2-)",
                "Phosphate (PO4^3-)",
                "Carbonate (CO3^2-)",
                "Chlorate (ClO3-)",
                "Perchlorate (ClO4-)",
                "Thiocyanate (SCN-)",
                "Arsenate (AsO4^3-)",
                "Bicarbonate (HCO3-)",
                "Hydrogen phosphate (H2PO4-)",
                "Dichromate (Cr2O7^2-)",
                "Selenate (SeO4^2-)",
                "Borate (BO3^3-)",
                "Formate (HCOO-)",
                "Oxalate (C2O4^2-)"
            ],
            "mismatches": [
                "Tartrate (C4H4O6^2-)"
            ],
            "true_referents": [
                "Acetate (C2H3O2-)",
                "Arsenate (AsO4^3-)",
                "Bicarbonate (HCO3-)",
                "Borate (BO3^3-)",
                "Bromide (Br-)",
                "Carbonate (CO3^2-)",
                "Chlorate (ClO3-)",
                "Chloride (Cl-)",
                "Cyanide (CN-)",
                "Dichromate (Cr2O7^2-)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydrogen phosphate (H2PO4-)",
                "Hydroxide (OH-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Oxalate (C2O4^2-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Phosphate (PO4^3-)",
                "Selenate (SeO4^2-)",
                "Sulfide (S2-)",
                "Thiocyanate (SCN-)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride ion (Cl-)",
            "Bromide ion (Br-)",
            "Iodide ion (I-)",
            "Fluoride ion (F-)",
            "Hydroxide ion (OH-)",
            "Cyanide ion (CN-)",
            "Hydrosulfide ion (HS-)",
            "Hydrogen carbonate ion (HCO3-)",
            "Hydrogen sulfate ion (HSO4-)",
            "Perchlorate ion (ClO4-)",
            "Permanganate ion (MnO4-)",
            "Hydrogen phosphate ion (HPO4 2-)",
            "Dihydrogen phosphate ion (H2PO4-)",
            "Nitrate ion (NO3-)",
            "Hydrogen nitrate ion (HNO3-)",
            "Thiocyanate ion (SCN-)",
            "Azide ion (N3-)",
            "Amide ion (NH2-)",
            "Hydrogen sulfite ion (HSO3-)",
            "Hydrogen peroxide ion (HO2-)",
            "Superoxide ion (O2-)",
            "Peroxide ion (O2 2-)",
            "Oxide ion (O2-)",
            "Hydrogen oxalate ion (HC2O4-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride ion (Cl-)",
                "Bromide ion (Br-)",
                "Iodide ion (I-)",
                "Fluoride ion (F-)",
                "Hydroxide ion (OH-)",
                "Cyanide ion (CN-)",
                "Hydrosulfide ion (HS-)",
                "Hydrogen carbonate ion (HCO3-)",
                "Hydrogen sulfate ion (HSO4-)",
                "Perchlorate ion (ClO4-)",
                "Permanganate ion (MnO4-)",
                "Hydrogen phosphate ion (HPO4 2-)",
                "Dihydrogen phosphate ion (H2PO4-)",
                "Nitrate ion (NO3-)",
                "Hydrogen nitrate ion (HNO3-)",
                "Thiocyanate ion (SCN-)",
                "Azide ion (N3-)",
                "Amide ion (NH2-)",
                "Hydrogen sulfite ion (HSO3-)",
                "Hydrogen peroxide ion (HO2-)",
                "Superoxide ion (O2-)",
                "Peroxide ion (O2 2-)",
                "Oxide ion (O2-)",
                "Hydrogen oxalate ion (HC2O4-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Amide ion (NH2-)",
                "Azide ion (N3-)",
                "Bromide ion (Br-)",
                "Chloride ion (Cl-)",
                "Cyanide ion (CN-)",
                "Dihydrogen phosphate ion (H2PO4-)",
                "Fluoride ion (F-)",
                "Hydrogen carbonate ion (HCO3-)",
                "Hydrogen nitrate ion (HNO3-)",
                "Hydrogen oxalate ion (HC2O4-)",
                "Hydrogen peroxide ion (HO2-)",
                "Hydrogen phosphate ion (HPO4 2-)",
                "Hydrogen sulfate ion (HSO4-)",
                "Hydrogen sulfite ion (HSO3-)",
                "Hydrosulfide ion (HS-)",
                "Hydroxide ion (OH-)",
                "Iodide ion (I-)",
                "Nitrate ion (NO3-)",
                "Oxide ion (O2-)",
                "Perchlorate ion (ClO4-)",
                "Permanganate ion (MnO4-)",
                "Peroxide ion (O2 2-)",
                "Superoxide ion (O2-)",
                "Thiocyanate ion (SCN-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Hydroxide ion (OH-)",
            "Chloride ion (Cl-)",
            "Fluoride ion (F-)",
            "Bromide ion (Br-)",
            "Iodide ion (I-)",
            "Nitrate ion (NO3-)",
            "Nitrite ion (NO2-)",
            "Sulfate ion (SO4^2-)",
            "Sulfite ion (SO3^2-)",
            "Phosphate ion (PO4^3-)",
            "Carbonate ion (CO3^2-)",
            "Bicarbonate ion (HCO3-)",
            "Ammonium ion (NH4+)",
            "Cyanide ion (CN-)",
            "Hypochlorite ion (ClO-)",
            "Chlorate ion (ClO3-)",
            "Perchlorate ion (ClO4-)",
            "Permanganate ion (MnO4-)",
            "Chromate ion (CrO4^2-)",
            "Dichromate ion (Cr2O7^2-)",
            "Oxalate ion (C2O4^2-)",
            "Acetate ion (C2H3O2-)",
            "Selenate ion (SeO4^2-)",
            "Tellurate ion (TeO4^2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hydroxide ion (OH-)",
                "Chloride ion (Cl-)",
                "Fluoride ion (F-)",
                "Bromide ion (Br-)",
                "Iodide ion (I-)",
                "Nitrate ion (NO3-)",
                "Nitrite ion (NO2-)",
                "Sulfate ion (SO4^2-)",
                "Sulfite ion (SO3^2-)",
                "Phosphate ion (PO4^3-)",
                "Carbonate ion (CO3^2-)",
                "Bicarbonate ion (HCO3-)",
                "Ammonium ion (NH4+)",
                "Cyanide ion (CN-)",
                "Hypochlorite ion (ClO-)",
                "Chlorate ion (ClO3-)",
                "Perchlorate ion (ClO4-)",
                "Permanganate ion (MnO4-)",
                "Chromate ion (CrO4^2-)",
                "Dichromate ion (Cr2O7^2-)",
                "Oxalate ion (C2O4^2-)",
                "Acetate ion (C2H3O2-)",
                "Selenate ion (SeO4^2-)",
                "Tellurate ion (TeO4^2-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate ion (C2H3O2-)",
                "Ammonium ion (NH4+)",
                "Bicarbonate ion (HCO3-)",
                "Bromide ion (Br-)",
                "Carbonate ion (CO3^2-)",
                "Chlorate ion (ClO3-)",
                "Chloride ion (Cl-)",
                "Chromate ion (CrO4^2-)",
                "Cyanide ion (CN-)",
                "Dichromate ion (Cr2O7^2-)",
                "Fluoride ion (F-)",
                "Hydroxide ion (OH-)",
                "Hypochlorite ion (ClO-)",
                "Iodide ion (I-)",
                "Nitrate ion (NO3-)",
                "Nitrite ion (NO2-)",
                "Oxalate ion (C2O4^2-)",
                "Perchlorate ion (ClO4-)",
                "Permanganate ion (MnO4-)",
                "Phosphate ion (PO4^3-)",
                "Selenate ion (SeO4^2-)",
                "Sulfate ion (SO4^2-)",
                "Sulfite ion (SO3^2-)",
                "Tellurate ion (TeO4^2-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F\u2013)",
            "Chloride (Cl\u2013)",
            "Bromide (Br\u2013)",
            "Iodide (I\u2013)",
            "Hydroxide (OH\u2013)",
            "Cyanide (CN\u2013)",
            "Nitrite (NO\u2082\u2013)",
            "Nitrate (NO\u2083\u2013)",
            "Hydrogen Carbonate (HCO\u2083\u2013)",
            "Hydrogen Sulfate (HSO\u2084\u2013)",
            "Hydrogen Sulfite (HSO\u2083\u2013)",
            "Perchlorate (ClO\u2084\u2013)",
            "Chlorate (ClO\u2083\u2013)",
            "Hypochlorite (ClO\u2013)",
            "Thiocyanate (SCN\u2013)",
            "Hydrogen Phosphate (H\u2082PO\u2084\u2013)",
            "Hydrogen Arsenate (H\u2082AsO\u2084\u2013)",
            "Hydrogen Selenite (HSeO\u2083\u2013)",
            "Hypophosphite (H\u2082PO\u2082\u2013)",
            "Permanganate (MnO\u2084\u2013)",
            "Hydrogen Chromate (HCrO\u2084\u2013)",
            "Hydrogen Manganate (HMnO\u2084\u2013)",
            "Hydrogen Tellurite (HTeO\u2083\u2013)",
            "Hydrogen Peroxide (H\u2082O\u2082\u2013)",
            "Mercaptide (RS\u2013)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F\u2013)",
                "Chloride (Cl\u2013)",
                "Bromide (Br\u2013)",
                "Iodide (I\u2013)",
                "Hydroxide (OH\u2013)",
                "Cyanide (CN\u2013)",
                "Nitrite (NO\u2082\u2013)",
                "Nitrate (NO\u2083\u2013)",
                "Hydrogen Carbonate (HCO\u2083\u2013)",
                "Hydrogen Sulfate (HSO\u2084\u2013)",
                "Hydrogen Sulfite (HSO\u2083\u2013)",
                "Perchlorate (ClO\u2084\u2013)",
                "Chlorate (ClO\u2083\u2013)",
                "Hypochlorite (ClO\u2013)",
                "Thiocyanate (SCN\u2013)",
                "Hydrogen Phosphate (H\u2082PO\u2084\u2013)",
                "Hydrogen Arsenate (H\u2082AsO\u2084\u2013)",
                "Hydrogen Selenite (HSeO\u2083\u2013)",
                "Hypophosphite (H\u2082PO\u2082\u2013)",
                "Permanganate (MnO\u2084\u2013)",
                "Hydrogen Chromate (HCrO\u2084\u2013)",
                "Hydrogen Manganate (HMnO\u2084\u2013)",
                "Hydrogen Tellurite (HTeO\u2083\u2013)",
                "Hydrogen Peroxide (H\u2082O\u2082\u2013)"
            ],
            "mismatches": [
                "Mercaptide (RS\u2013)"
            ],
            "true_referents": [
                "Bromide (Br\u2013)",
                "Chlorate (ClO\u2083\u2013)",
                "Chloride (Cl\u2013)",
                "Cyanide (CN\u2013)",
                "Fluoride (F\u2013)",
                "Hydrogen Arsenate (H\u2082AsO\u2084\u2013)",
                "Hydrogen Carbonate (HCO\u2083\u2013)",
                "Hydrogen Chromate (HCrO\u2084\u2013)",
                "Hydrogen Manganate (HMnO\u2084\u2013)",
                "Hydrogen Peroxide (H\u2082O\u2082\u2013)",
                "Hydrogen Phosphate (H\u2082PO\u2084\u2013)",
                "Hydrogen Selenite (HSeO\u2083\u2013)",
                "Hydrogen Sulfate (HSO\u2084\u2013)",
                "Hydrogen Sulfite (HSO\u2083\u2013)",
                "Hydrogen Tellurite (HTeO\u2083\u2013)",
                "Hydroxide (OH\u2013)",
                "Hypochlorite (ClO\u2013)",
                "Hypophosphite (H\u2082PO\u2082\u2013)",
                "Iodide (I\u2013)",
                "Nitrate (NO\u2083\u2013)",
                "Nitrite (NO\u2082\u2013)",
                "Perchlorate (ClO\u2084\u2013)",
                "Permanganate (MnO\u2084\u2013)",
                "Thiocyanate (SCN\u2013)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Fluoride (F-)",
            "Hydroxide (OH-)",
            "Cyanide (CN-)",
            "Nitrite (NO2-)",
            "Hypochlorite (ClO-)",
            "Perchlorate (ClO4-)",
            "Permanganate (MnO4-)",
            "Thiocyanate (SCN-)",
            "Azide (N3-)",
            "Hydride (H-)",
            "Bicarbonate (HCO3-)",
            "Bisulfite (HSO3-)",
            "Hydrogen sulfide (HS-)",
            "Dihydrogen phosphate (H2PO4-)",
            "Nitrate (NO3-)",
            "Acetate (CH3COO-)",
            "Formate (HCOO-)",
            "Hydrogen sulfate (HSO4-)",
            "Bromate (BrO3-)",
            "Iodate (IO3-)",
            "Hypobromite (BrO-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Fluoride (F-)",
                "Hydroxide (OH-)",
                "Cyanide (CN-)",
                "Nitrite (NO2-)",
                "Hypochlorite (ClO-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Thiocyanate (SCN-)",
                "Azide (N3-)",
                "Hydride (H-)",
                "Bicarbonate (HCO3-)",
                "Bisulfite (HSO3-)",
                "Hydrogen sulfide (HS-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Nitrate (NO3-)",
                "Acetate (CH3COO-)",
                "Formate (HCOO-)",
                "Hydrogen sulfate (HSO4-)",
                "Bromate (BrO3-)",
                "Iodate (IO3-)",
                "Hypobromite (BrO-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Azide (N3-)",
                "Bicarbonate (HCO3-)",
                "Bisulfite (HSO3-)",
                "Bromate (BrO3-)",
                "Bromide (Br-)",
                "Chloride (Cl-)",
                "Cyanide (CN-)",
                "Dihydrogen phosphate (H2PO4-)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydride (H-)",
                "Hydrogen sulfate (HSO4-)",
                "Hydrogen sulfide (HS-)",
                "Hydroxide (OH-)",
                "Hypobromite (BrO-)",
                "Hypochlorite (ClO-)",
                "Iodate (IO3-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Thiocyanate (SCN-)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Hydroxide (OH\u207b)",
            "Cyanide (CN\u207b)",
            "Azide (N\u2083\u207b)",
            "Nitrate (NO\u2083\u207b)",
            "Nitrite (NO\u2082\u207b)",
            "Hydrogen sulfate (HSO\u2084\u207b)",
            "Dihydrogen phosphate (H\u2082PO\u2084\u207b)",
            "Bicarbonate (HCO\u2083\u207b)",
            "Permanganate (MnO\u2084\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Chlorate (ClO\u2083\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Bromate (BrO\u2083\u207b)",
            "Iodate (IO\u2083\u207b)",
            "Thiocyanate (SCN\u207b)",
            "Hydrogen sulfite (HSO\u2083\u207b)",
            "Methanesulfonate (CH\u2083SO\u2083\u207b)",
            "Trifluoromethanesulfonate (CF\u2083SO\u2083\u207b)",
            "Tetrafluoroborate (BF\u2084\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Hydroxide (OH\u207b)",
                "Cyanide (CN\u207b)",
                "Azide (N\u2083\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Hydrogen sulfate (HSO\u2084\u207b)",
                "Dihydrogen phosphate (H\u2082PO\u2084\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Iodate (IO\u2083\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Hydrogen sulfite (HSO\u2083\u207b)",
                "Methanesulfonate (CH\u2083SO\u2083\u207b)",
                "Trifluoromethanesulfonate (CF\u2083SO\u2083\u207b)",
                "Tetrafluoroborate (BF\u2084\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Azide (N\u2083\u207b)",
                "Bicarbonate (HCO\u2083\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chloride (Cl\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Cyanide (CN\u207b)",
                "Dihydrogen phosphate (H\u2082PO\u2084\u207b)",
                "Fluoride (F\u207b)",
                "Hydrogen sulfate (HSO\u2084\u207b)",
                "Hydrogen sulfite (HSO\u2083\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodate (IO\u2083\u207b)",
                "Iodide (I\u207b)",
                "Methanesulfonate (CH\u2083SO\u2083\u207b)",
                "Nitrate (NO\u2083\u207b)",
                "Nitrite (NO\u2082\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Permanganate (MnO\u2084\u207b)",
                "Tetrafluoroborate (BF\u2084\u207b)",
                "Thiocyanate (SCN\u207b)",
                "Trifluoromethanesulfonate (CF\u2083SO\u2083\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F\u207b)",
            "Chloride (Cl\u207b)",
            "Bromide (Br\u207b)",
            "Iodide (I\u207b)",
            "Astatide (At\u207b)",
            "Cyanide (CN\u207b)",
            "Hydroxide (OH\u207b)",
            "Nitride (N\u00b3\u207b)",
            "Phosphide (P\u00b3\u207b)",
            "Arsenide (As\u00b3\u207b)",
            "Hydride (H\u207b)",
            "Amide (NH\u2082\u207b)",
            "Azide (N\u2083\u207b)",
            "Peroxide (O\u2082\u00b2\u207b)",
            "Superoxide (O\u2082\u207b)",
            "Ozonide (O\u2083\u207b)",
            "Hypochlorite (ClO\u207b)",
            "Chlorite (ClO\u2082\u207b)",
            "Chlorate (ClO\u2083\u207b)",
            "Perchlorate (ClO\u2084\u207b)",
            "Hypobromite (BrO\u207b)",
            "Bromite (BrO\u2082\u207b)",
            "Bromate (BrO\u2083\u207b)",
            "Perbromate (BrO\u2084\u207b)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F\u207b)",
                "Chloride (Cl\u207b)",
                "Bromide (Br\u207b)",
                "Iodide (I\u207b)",
                "Astatide (At\u207b)",
                "Cyanide (CN\u207b)",
                "Hydroxide (OH\u207b)",
                "Nitride (N\u00b3\u207b)",
                "Phosphide (P\u00b3\u207b)",
                "Arsenide (As\u00b3\u207b)",
                "Hydride (H\u207b)",
                "Amide (NH\u2082\u207b)",
                "Azide (N\u2083\u207b)",
                "Peroxide (O\u2082\u00b2\u207b)",
                "Superoxide (O\u2082\u207b)",
                "Ozonide (O\u2083\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Hypobromite (BrO\u207b)",
                "Bromite (BrO\u2082\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Perbromate (BrO\u2084\u207b)"
            ],
            "mismatches": [],
            "true_referents": [
                "Amide (NH\u2082\u207b)",
                "Arsenide (As\u00b3\u207b)",
                "Astatide (At\u207b)",
                "Azide (N\u2083\u207b)",
                "Bromate (BrO\u2083\u207b)",
                "Bromide (Br\u207b)",
                "Bromite (BrO\u2082\u207b)",
                "Chlorate (ClO\u2083\u207b)",
                "Chloride (Cl\u207b)",
                "Chlorite (ClO\u2082\u207b)",
                "Cyanide (CN\u207b)",
                "Fluoride (F\u207b)",
                "Hydride (H\u207b)",
                "Hydroxide (OH\u207b)",
                "Hypobromite (BrO\u207b)",
                "Hypochlorite (ClO\u207b)",
                "Iodide (I\u207b)",
                "Nitride (N\u00b3\u207b)",
                "Ozonide (O\u2083\u207b)",
                "Perbromate (BrO\u2084\u207b)",
                "Perchlorate (ClO\u2084\u207b)",
                "Peroxide (O\u2082\u00b2\u207b)",
                "Phosphide (P\u00b3\u207b)",
                "Superoxide (O\u2082\u207b)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Fluoride (F-)",
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Cyanide (CN-)",
            "Hydroxide (OH-)",
            "Nitrite (NO2-)",
            "Nitrate (NO3-)",
            "Sulfite (SO3-2)",
            "Sulfate (SO4-2)",
            "Phosphite (PO3-3)",
            "Phosphate (PO4-3)",
            "Acetate (CH3COO-)",
            "Formate (HCOO-)",
            "Oxalate (C2O4-2)",
            "Carbonate (CO3-2)",
            "Bicarbonate (HCO3-)",
            "Borate (BO3-3)",
            "Silicate (SiO3-2)",
            "Ferrocyanide (Fe(CN)6-4)",
            "Ferricyanide (Fe(CN)6-3)",
            "Permanganate (MnO4-)",
            "Dichromate (Cr2O7-2)",
            "Perchlorate (ClO4-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fluoride (F-)",
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Cyanide (CN-)",
                "Hydroxide (OH-)",
                "Nitrite (NO2-)",
                "Nitrate (NO3-)",
                "Sulfite (SO3-2)",
                "Sulfate (SO4-2)",
                "Phosphite (PO3-3)",
                "Phosphate (PO4-3)",
                "Acetate (CH3COO-)",
                "Formate (HCOO-)",
                "Oxalate (C2O4-2)",
                "Carbonate (CO3-2)",
                "Bicarbonate (HCO3-)",
                "Borate (BO3-3)",
                "Silicate (SiO3-2)",
                "Ferrocyanide (Fe(CN)6-4)",
                "Ferricyanide (Fe(CN)6-3)",
                "Permanganate (MnO4-)",
                "Dichromate (Cr2O7-2)",
                "Perchlorate (ClO4-)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetate (CH3COO-)",
                "Bicarbonate (HCO3-)",
                "Borate (BO3-3)",
                "Bromide (Br-)",
                "Carbonate (CO3-2)",
                "Chloride (Cl-)",
                "Cyanide (CN-)",
                "Dichromate (Cr2O7-2)",
                "Ferricyanide (Fe(CN)6-3)",
                "Ferrocyanide (Fe(CN)6-4)",
                "Fluoride (F-)",
                "Formate (HCOO-)",
                "Hydroxide (OH-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Oxalate (C2O4-2)",
                "Perchlorate (ClO4-)",
                "Permanganate (MnO4-)",
                "Phosphate (PO4-3)",
                "Phosphite (PO3-3)",
                "Silicate (SiO3-2)",
                "Sulfate (SO4-2)",
                "Sulfite (SO3-2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Chloride (Cl-)",
            "Fluoride (F-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Hydride (H-)",
            "Oxide (O2-)",
            "Perchlorate (ClO4-)",
            "Phosphate (PO43-)",
            "Sulfate (SO42-)",
            "Nitrate (NO3-)",
            "Carbonate (CO32-)",
            "Bicarbonate (HCO3-)",
            "Phosphite (PO33-)",
            "Phosphonate (PO32-)",
            "Hydroxide (OH-)",
            "Fluorosulfonate (FSO3-)",
            "Chlorosulfonate (ClSO3-)",
            "Bromosulfonate (BrSO3-)",
            "Iodosulfonate (ISO3-)",
            "Chlorate (ClO3-)",
            "Bromate (BrO3-)",
            "Iodate (IO3-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chloride (Cl-)",
                "Fluoride (F-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Hydride (H-)",
                "Oxide (O2-)",
                "Perchlorate (ClO4-)",
                "Phosphate (PO43-)",
                "Sulfate (SO42-)",
                "Nitrate (NO3-)",
                "Carbonate (CO32-)",
                "Bicarbonate (HCO3-)",
                "Phosphite (PO33-)",
                "Phosphonate (PO32-)",
                "Hydroxide (OH-)",
                "Chlorosulfonate (ClSO3-)",
                "Bromosulfonate (BrSO3-)",
                "Iodosulfonate (ISO3-)",
                "Chlorate (ClO3-)",
                "Bromate (BrO3-)",
                "Iodate (IO3-)"
            ],
            "mismatches": [
                "Fluorosulfonate (FSO3-)"
            ],
            "true_referents": [
                "Bicarbonate (HCO3-)",
                "Bromate (BrO3-)",
                "Bromide (Br-)",
                "Bromosulfonate (BrSO3-)",
                "Carbonate (CO32-)",
                "Chlorate (ClO3-)",
                "Chloride (Cl-)",
                "Chlorosulfonate (ClSO3-)",
                "Fluoride (F-)",
                "Fluorosulfonate (FSO3-)",
                "Hydride (H-)",
                "Hydroxide (OH-)",
                "Iodate (IO3-)",
                "Iodide (I-)",
                "Iodosulfonate (ISO3-)",
                "Nitrate (NO3-)",
                "Oxide (O2-)",
                "Perchlorate (ClO4-)",
                "Phosphate (PO43-)",
                "Phosphite (PO33-)",
                "Phosphonate (PO32-)",
                "Sulfate (SO42-)"
            ],
            "TP": 21,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            "Azide (N3-)",
            "Cyanide (CN-)",
            "Hydride (H-)",
            "Nitride (N3-)",
            "Oxide (O2-)",
            "Peroxide (O22-)",
            "Chloride (Cl-)",
            "Bromide (Br-)",
            "Iodide (I-)",
            "Fluoride (F-)",
            "Hydrogen carbonate (HCO3-)",
            "Nitrate (NO3-)",
            "Nitrite (NO2-)",
            "Sulfide (S2-)",
            "Sulfite (SO32-)",
            "Bisulfite (HSO3-)",
            "Thiocyanate (SCN-)",
            "Cyanate (OCN-)",
            "Peroxynitrite (ONOO-)",
            "Peroxycarbonate (CO42-)",
            "Peroxynitrate (O2NO-)",
            "Peroxysulfate (SO52-)",
            "Peroxymonosulfate (SO52-)",
            "Chlorite (ClO2-)",
            "Bromite (BrO2-)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Azide (N3-)",
                "Cyanide (CN-)",
                "Hydride (H-)",
                "Nitride (N3-)",
                "Oxide (O2-)",
                "Peroxide (O22-)",
                "Chloride (Cl-)",
                "Bromide (Br-)",
                "Iodide (I-)",
                "Fluoride (F-)",
                "Hydrogen carbonate (HCO3-)",
                "Nitrate (NO3-)",
                "Nitrite (NO2-)",
                "Sulfide (S2-)",
                "Sulfite (SO32-)",
                "Bisulfite (HSO3-)",
                "Thiocyanate (SCN-)",
                "Cyanate (OCN-)",
                "Peroxynitrite (ONOO-)",
                "Peroxycarbonate (CO42-)",
                "Peroxynitrate (O2NO-)",
                "Peroxysulfate (SO52-)",
                "Peroxymonosulfate (SO52-)",
                "Chlorite (ClO2-)"
            ],
            "mismatches": [
                "Bromite (BrO2-)"
            ],
            "true_referents": [
                "Azide (N3-)",
                "Bisulfite (HSO3-)",
                "Bromide (Br-)",
                "Chloride (Cl-)",
                "Chlorite (ClO2-)",
                "Cyanate (OCN-)",
                "Cyanide (CN-)",
                "Fluoride (F-)",
                "Hydride (H-)",
                "Hydrogen carbonate (HCO3-)",
                "Iodide (I-)",
                "Nitrate (NO3-)",
                "Nitride (N3-)",
                "Nitrite (NO2-)",
                "Oxide (O2-)",
                "Peroxide (O22-)",
                "Peroxycarbonate (CO42-)",
                "Peroxymonosulfate (SO52-)",
                "Peroxynitrate (O2NO-)",
                "Peroxynitrite (ONOO-)",
                "Peroxysulfate (SO52-)",
                "Sulfide (S2-)",
                "Sulfite (SO32-)",
                "Thiocyanate (SCN-)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "monovalent inorganic anion",
        "domain": "chemistry",
        "response": [
            {
                "Canonical name": "chloride (Cl-)",
                "Abbreviated identifier": "Cl-"
            },
            {
                "Canonical name": "nitrate (NO3-)",
                "Abbreviated identifier": "NO3-"
            },
            {
                "Canonical name": "bromide (Br-)",
                "Abbreviated identifier": "Br-"
            },
            {
                "Canonical name": "iodide (I-)",
                "Abbreviated identifier": "I-"
            },
            {
                "Canonical name": "acetate (CH3COO-)",
                "Abbreviated identifier": "CH3COO-"
            },
            {
                "Canonical name": "propionate (CH3CH2COO-)",
                "Abbreviated identifier": "CH3CH2COO-"
            },
            {
                "Canonical name": "butyrate (CH3CH2CH2COO-)",
                "Abbreviated identifier": "CH3CH2CH2COO-"
            },
            {
                "Canonical name": "valerate (CH3(CH2)3COO-)",
                "Abbreviated identifier": "CH3(CH2)3COO-"
            },
            {
                "Canonical name": "heptanoate (CH3(CH2)5COO-)",
                "Abbreviated identifier": "CH3(CH2)5COO-"
            },
            {
                "Canonical name": "octanoate (CH3(CH2)6COO-)",
                "Abbreviated identifier": "CH3(CH2)6COO-"
            },
            {
                "Canonical name": "nonanoate (CH3(CH2)7COO-)",
                "Abbreviated identifier": "CH3(CH2)7COO-"
            },
            {
                "Canonical name": "decanoate (CH3(CH2)8COO-)",
                "Abbreviated identifier": "CH3(CH2)8COO-"
            },
            {
                "Canonical name": "undecanoate (CH3(CH2)9COO-)",
                "Abbreviated identifier": "CH3(CH2)9COO-"
            },
            {
                "Canonical name": "dodecanoate (CH3(CH2)10COO-)",
                "Abbreviated identifier": "CH3(CH2)10COO-"
            },
            {
                "Canonical name": "tridecanoate (CH3(CH2)11COO-)",
                "Abbreviated identifier": "CH3(CH2)11COO-"
            },
            {
                "Canonical name": "tetradecanoate (CH3(CH2)12COO-)",
                "Abbreviated identifier": "CH3(CH2)12COO-"
            },
            {
                "Canonical name": "pentadecanoate (CH3(CH2)13COO-)",
                "Abbreviated identifier": "CH3(CH2)13COO-"
            },
            {
                "Canonical name": "hexadecanoate (CH3(CH2)14COO-)",
                "Abbreviated identifier": "CH3(CH2)14COO-"
            },
            {
                "Canonical name": "heptadecanoate (CH3(CH2)15COO-)",
                "Abbreviated identifier": "CH3(CH2)15COO-"
            },
            {
                "Canonical name": "octadecanoate (CH3(CH2)16COO-)",
                "Abbreviated identifier": "CH3(CH2)16COO-"
            },
            {
                "Canonical name": "nonadecanoate (CH3(CH2)17COO-)",
                "Abbreviated identifier": "CH3(CH2)17COO-"
            },
            {
                "Canonical name": "icosanoate (CH3(CH2)18COO-)",
                "Abbreviated identifier": "CH3(CH2)18COO-"
            },
            {
                "Canonical name": "docosanoate (CH3(CH2)20COO-)",
                "Abbreviated identifier": "CH3(CH2)20COO-"
            },
            {
                "Canonical name": "tetracosanate (CH3(CH2)24COO-)",
                "Abbreviated identifier": "CH3(CH2)24COO-"
            },
            {
                "Canonical name": "pentacosanate (CH3(CH2)26COO-)",
                "Abbreviated identifier": "CH3(CH2)26COO-"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "chloride (Cl-)",
                "nitrate (NO3-)",
                "bromide (Br-)",
                "iodide (I-)",
                "acetate (CH3COO-)",
                "propionate (CH3CH2COO-)",
                "butyrate (CH3CH2CH2COO-)",
                "valerate (CH3(CH2)3COO-)",
                "heptanoate (CH3(CH2)5COO-)",
                "octanoate (CH3(CH2)6COO-)",
                "nonanoate (CH3(CH2)7COO-)",
                "decanoate (CH3(CH2)8COO-)",
                "undecanoate (CH3(CH2)9COO-)",
                "dodecanoate (CH3(CH2)10COO-)",
                "tridecanoate (CH3(CH2)11COO-)",
                "tetradecanoate (CH3(CH2)12COO-)",
                "pentadecanoate (CH3(CH2)13COO-)",
                "hexadecanoate (CH3(CH2)14COO-)",
                "heptadecanoate (CH3(CH2)15COO-)",
                "octadecanoate (CH3(CH2)16COO-)",
                "nonadecanoate (CH3(CH2)17COO-)",
                "icosanoate (CH3(CH2)18COO-)",
                "docosanoate (CH3(CH2)20COO-)",
                "tetracosanate (CH3(CH2)24COO-)"
            ],
            "mismatches": [
                "pentacosanate (CH3(CH2)26COO-)"
            ],
            "true_referents": [
                "{\"Canonical name\": \"acetate (CH3COO-)\", \"Abbreviated identifier\": \"CH3COO-\"}",
                "{\"Canonical name\": \"bromide (Br-)\", \"Abbreviated identifier\": \"Br-\"}",
                "{\"Canonical name\": \"butyrate (CH3CH2CH2COO-)\", \"Abbreviated identifier\": \"CH3CH2CH2COO-\"}",
                "{\"Canonical name\": \"chloride (Cl-)\", \"Abbreviated identifier\": \"Cl-\"}",
                "{\"Canonical name\": \"decanoate (CH3(CH2)8COO-)\", \"Abbreviated identifier\": \"CH3(CH2)8COO-\"}",
                "{\"Canonical name\": \"docosanoate (CH3(CH2)20COO-)\", \"Abbreviated identifier\": \"CH3(CH2)20COO-\"}",
                "{\"Canonical name\": \"dodecanoate (CH3(CH2)10COO-)\", \"Abbreviated identifier\": \"CH3(CH2)10COO-\"}",
                "{\"Canonical name\": \"heptadecanoate (CH3(CH2)15COO-)\", \"Abbreviated identifier\": \"CH3(CH2)15COO-\"}",
                "{\"Canonical name\": \"heptanoate (CH3(CH2)5COO-)\", \"Abbreviated identifier\": \"CH3(CH2)5COO-\"}",
                "{\"Canonical name\": \"hexadecanoate (CH3(CH2)14COO-)\", \"Abbreviated identifier\": \"CH3(CH2)14COO-\"}",
                "{\"Canonical name\": \"icosanoate (CH3(CH2)18COO-)\", \"Abbreviated identifier\": \"CH3(CH2)18COO-\"}",
                "{\"Canonical name\": \"iodide (I-)\", \"Abbreviated identifier\": \"I-\"}",
                "{\"Canonical name\": \"nitrate (NO3-)\", \"Abbreviated identifier\": \"NO3-\"}",
                "{\"Canonical name\": \"nonadecanoate (CH3(CH2)17COO-)\", \"Abbreviated identifier\": \"CH3(CH2)17COO-\"}",
                "{\"Canonical name\": \"nonanoate (CH3(CH2)7COO-)\", \"Abbreviated identifier\": \"CH3(CH2)7COO-\"}",
                "{\"Canonical name\": \"octadecanoate (CH3(CH2)16COO-)\", \"Abbreviated identifier\": \"CH3(CH2)16COO-\"}",
                "{\"Canonical name\": \"octanoate (CH3(CH2)6COO-)\", \"Abbreviated identifier\": \"CH3(CH2)6COO-\"}",
                "{\"Canonical name\": \"pentadecanoate (CH3(CH2)13COO-)\", \"Abbreviated identifier\": \"CH3(CH2)13COO-\"}",
                "{\"Canonical name\": \"propionate (CH3CH2COO-)\", \"Abbreviated identifier\": \"CH3CH2COO-\"}",
                "{\"Canonical name\": \"tetracosanate (CH3(CH2)24COO-)\", \"Abbreviated identifier\": \"CH3(CH2)24COO-\"}",
                "{\"Canonical name\": \"tetradecanoate (CH3(CH2)12COO-)\", \"Abbreviated identifier\": \"CH3(CH2)12COO-\"}",
                "{\"Canonical name\": \"tridecanoate (CH3(CH2)11COO-)\", \"Abbreviated identifier\": \"CH3(CH2)11COO-\"}",
                "{\"Canonical name\": \"undecanoate (CH3(CH2)9COO-)\", \"Abbreviated identifier\": \"CH3(CH2)9COO-\"}",
                "{\"Canonical name\": \"valerate (CH3(CH2)3COO-)\", \"Abbreviated identifier\": \"CH3(CH2)3COO-\"}"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    }
]