[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitrogen dioxide (NO2)",
            "Nitric oxide (NO)",
            "Nitrous oxide (N2O)",
            "Dinitrogen trioxide (N2O3)",
            "Dinitrogen pentoxide (N2O5)",
            "Nitryl fluoride (NO2F)",
            "Nitryl chloride (NO2Cl)",
            "Nitryl bromide (NO2Br)",
            "Nitryl iodide (NO2I)",
            "Nitrosyl fluoride (NOF)",
            "Nitrosyl chloride (NOCl)",
            "Nitrosyl bromide (NOBr)",
            "Nitrosyl iodide (NOI)",
            "Nitrosyl cation (NO+)",
            "Nitrosyl hypofluorite (NOOF)",
            "Nitrosyl hypoiodite (NOOI)",
            "Nitrosyl peroxide (N2O4)",
            "Nitrosyl perchlorate (NOClO3)",
            "Nitrosyl nitrate (NO3ONO2)",
            "Nitrosyl sulfite (NOHSO3)",
            "Nitrosyl sulfate (NOHSO4)",
            "Nitrosyl nitrite (NONO2)",
            "Nitrosyl nitrate (NONO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrogen dioxide (NO2)",
                "Nitric oxide (NO)",
                "Nitrous oxide (N2O)",
                "Dinitrogen trioxide (N2O3)",
                "Dinitrogen pentoxide (N2O5)",
                "Nitryl fluoride (NO2F)",
                "Nitryl chloride (NO2Cl)",
                "Nitryl bromide (NO2Br)",
                "Nitryl iodide (NO2I)",
                "Nitrosyl fluoride (NOF)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosyl bromide (NOBr)",
                "Nitrosyl iodide (NOI)",
                "Nitrosyl cation (NO+)",
                "Nitrosyl hypofluorite (NOOF)",
                "Nitrosyl hypoiodite (NOOI)",
                "Nitrosyl peroxide (N2O4)",
                "Nitrosyl perchlorate (NOClO3)",
                "Nitrosyl nitrate (NO3ONO2)",
                "Nitrosyl sulfite (NOHSO3)",
                "Nitrosyl sulfate (NOHSO4)",
                "Nitrosyl nitrite (NONO2)",
                "Nitrosyl nitrate (NONO3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Dinitrogen pentoxide (N2O5)",
                "Dinitrogen trioxide (N2O3)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Nitrosyl bromide (NOBr)",
                "Nitrosyl cation (NO+)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosyl fluoride (NOF)",
                "Nitrosyl hypofluorite (NOOF)",
                "Nitrosyl hypoiodite (NOOI)",
                "Nitrosyl iodide (NOI)",
                "Nitrosyl nitrate (NO3ONO2)",
                "Nitrosyl nitrate (NONO3)",
                "Nitrosyl nitrite (NONO2)",
                "Nitrosyl perchlorate (NOClO3)",
                "Nitrosyl peroxide (N2O4)",
                "Nitrosyl sulfate (NOHSO4)",
                "Nitrosyl sulfite (NOHSO3)",
                "Nitrous oxide (N2O)",
                "Nitryl bromide (NO2Br)",
                "Nitryl chloride (NO2Cl)",
                "Nitryl fluoride (NO2F)",
                "Nitryl iodide (NO2I)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Dinitrogen pentoxide (N2O5)",
            "Nitrogen dioxide (NO2)",
            "Nitrous oxide (N2O)",
            "Dinitrogen trioxide (N2O3)",
            "Nitrogen trioxide (NO3)",
            "N2O4 (Dinitrogen tetroxide)",
            "N2O6 (Dinitrogen hexoxide)",
            "N2O7 (Dinitrogen heptoxide)",
            "NO (Nitric oxide)",
            "NO2 (Nitrogen dioxide)",
            "N2O5 (Dinitrogen pentoxide)",
            "N2O3 (Dinitrogen trioxide)",
            "N2O (Nitrous oxide)",
            "N2O4 (Dinitrogen tetroxide)",
            "N2O6 (Dinitrogen hexoxide)",
            "N2O7 (Dinitrogen heptoxide)",
            "NO3 (Nitrogen trioxide)",
            "N2O2 (Dinitrogen dioxide)",
            "N4O2 (Tetranitrogen dioxide)",
            "N2O8 (Dinitrogen octoxide)",
            "N3O2 (Trinitrogen dioxide)",
            "N4O4 (Tetranitrogen tetroxide)",
            "N5O (Pentazotone)",
            "N10O2 (Decazotone)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dinitrogen pentoxide (N2O5)",
                "Nitrogen dioxide (NO2)",
                "Nitrous oxide (N2O)",
                "Dinitrogen trioxide (N2O3)",
                "Nitrogen trioxide (NO3)",
                "N2O4 (Dinitrogen tetroxide)",
                "N2O6 (Dinitrogen hexoxide)",
                "N2O7 (Dinitrogen heptoxide)",
                "NO (Nitric oxide)",
                "NO2 (Nitrogen dioxide)",
                "N2O2 (Dinitrogen dioxide)",
                "N4O2 (Tetranitrogen dioxide)",
                "N2O8 (Dinitrogen octoxide)",
                "N3O2 (Trinitrogen dioxide)",
                "N4O4 (Tetranitrogen tetroxide)",
                "N5O (Pentazotone)",
                "N10O2 (Decazotone)"
            ],
            "mismatches": [],
            "true_referents": [
                "Dinitrogen pentoxide (N2O5)",
                "Dinitrogen trioxide (N2O3)",
                "N10O2 (Decazotone)",
                "N2O (Nitrous oxide)",
                "N2O2 (Dinitrogen dioxide)",
                "N2O3 (Dinitrogen trioxide)",
                "N2O4 (Dinitrogen tetroxide)",
                "N2O5 (Dinitrogen pentoxide)",
                "N2O6 (Dinitrogen hexoxide)",
                "N2O7 (Dinitrogen heptoxide)",
                "N2O8 (Dinitrogen octoxide)",
                "N3O2 (Trinitrogen dioxide)",
                "N4O2 (Tetranitrogen dioxide)",
                "N4O4 (Tetranitrogen tetroxide)",
                "N5O (Pentazotone)",
                "NO (Nitric oxide)",
                "NO2 (Nitrogen dioxide)",
                "NO3 (Nitrogen trioxide)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen trioxide (NO3)",
                "Nitrous oxide (N2O)"
            ],
            "TP": 17,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Dinitrogen pentoxide (N2O5)",
            "Nitrogen dioxide (NO2)",
            "Nitrogen trioxide (NO3)",
            "Dinitrogen trioxide (N2O3)",
            "Nitrogen monoxide (NO)",
            "Dinitrogen monoxide (N2O)",
            "Nitrous oxide (N2O)",
            "Nitric oxide (NO)",
            "Dinitrogen tetraoxide (N2O4)",
            "Nitric acid (HNO3)",
            "Nitrous acid (HNO2)",
            "Nitric anhydride (N2O5)",
            "Nitrous anhydride (N2O3)",
            "Nitric oxide dimer (N2O2)",
            "Nitrosyl chloride (NOCl)",
            "Nitrosyl bromide (NOBr)",
            "Nitrosyl fluoride (NOF)",
            "Nitrosyl cyanide (NONO)",
            "Nitrosyl thiocyanate (NOSCN)",
            "Nitrosyl azide (NON3)",
            "Nitrosyl hydroxide (NOOH)",
            "Nitrosyl hydrosulfide (NOSH)",
            "Nitrosyl sulfite (NOSO3)",
            "Nitrosyl sulfate (NOSO4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dinitrogen pentoxide (N2O5)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen trioxide (NO3)",
                "Dinitrogen trioxide (N2O3)",
                "Nitrogen monoxide (NO)",
                "Dinitrogen monoxide (N2O)",
                "Nitrous oxide (N2O)",
                "Nitric oxide (NO)",
                "Dinitrogen tetraoxide (N2O4)",
                "Nitric acid (HNO3)",
                "Nitrous acid (HNO2)",
                "Nitric anhydride (N2O5)",
                "Nitrous anhydride (N2O3)",
                "Nitric oxide dimer (N2O2)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosyl bromide (NOBr)",
                "Nitrosyl fluoride (NOF)",
                "Nitrosyl cyanide (NONO)",
                "Nitrosyl thiocyanate (NOSCN)",
                "Nitrosyl azide (NON3)",
                "Nitrosyl hydroxide (NOOH)",
                "Nitrosyl hydrosulfide (NOSH)",
                "Nitrosyl sulfite (NOSO3)",
                "Nitrosyl sulfate (NOSO4)"
            ],
            "mismatches": [],
            "true_referents": [
                "Dinitrogen monoxide (N2O)",
                "Dinitrogen pentoxide (N2O5)",
                "Dinitrogen tetraoxide (N2O4)",
                "Dinitrogen trioxide (N2O3)",
                "Nitric acid (HNO3)",
                "Nitric anhydride (N2O5)",
                "Nitric oxide (NO)",
                "Nitric oxide dimer (N2O2)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen monoxide (NO)",
                "Nitrogen trioxide (NO3)",
                "Nitrosyl azide (NON3)",
                "Nitrosyl bromide (NOBr)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosyl cyanide (NONO)",
                "Nitrosyl fluoride (NOF)",
                "Nitrosyl hydrosulfide (NOSH)",
                "Nitrosyl hydroxide (NOOH)",
                "Nitrosyl sulfate (NOSO4)",
                "Nitrosyl sulfite (NOSO3)",
                "Nitrosyl thiocyanate (NOSCN)",
                "Nitrous acid (HNO2)",
                "Nitrous anhydride (N2O3)",
                "Nitrous oxide (N2O)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitrogen Monoxide (NO)",
            "Nitrogen Dioxide (NO2)",
            "Nitrous Oxide (N2O)",
            "Dinitrogen Trioxide (N2O3)",
            "Tetranitrogen Tetroxide (N2O4)",
            "Dinitrogen Pentoxide (N2O5)",
            "Ammonium Nitrate (NH4NO3)",
            "Sodium Nitrite (NaNO2)",
            "Potassium Nitrate (KNO3)",
            "Calcium Nitride (Ca3N2)",
            "Magnesium Nitride (Mg3N2)",
            "Zinc Nitride (Zn3N2)",
            "Aluminum Nitride (AlN)",
            "Boron Nitride (BN)",
            "Silicon Nitride (Si3N4)",
            "Titanium Nitride (TiN)",
            "Vanadium Nitride (VN)",
            "Chromium Nitride (CrN)",
            "Molybdenum Nitride (Mo2N)",
            "Tungsten Nitride (WN)",
            "Iron(II) Oxide Nitride (FeO(N))",
            "Iron(III) Oxide Nitride (Fe2O3(N))",
            "Copper(I) Oxide Nitride (Cu2O(N))",
            "Silver Oxide Nitride (Ag2O(N))"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrogen Monoxide (NO)",
                "Nitrogen Dioxide (NO2)",
                "Nitrous Oxide (N2O)",
                "Dinitrogen Trioxide (N2O3)",
                "Tetranitrogen Tetroxide (N2O4)",
                "Dinitrogen Pentoxide (N2O5)",
                "Ammonium Nitrate (NH4NO3)",
                "Sodium Nitrite (NaNO2)",
                "Potassium Nitrate (KNO3)",
                "Calcium Nitride (Ca3N2)",
                "Magnesium Nitride (Mg3N2)",
                "Zinc Nitride (Zn3N2)",
                "Aluminum Nitride (AlN)",
                "Boron Nitride (BN)",
                "Silicon Nitride (Si3N4)",
                "Titanium Nitride (TiN)",
                "Vanadium Nitride (VN)",
                "Chromium Nitride (CrN)",
                "Molybdenum Nitride (Mo2N)",
                "Tungsten Nitride (WN)",
                "Iron(II) Oxide Nitride (FeO(N))",
                "Iron(III) Oxide Nitride (Fe2O3(N))",
                "Copper(I) Oxide Nitride (Cu2O(N))",
                "Silver Oxide Nitride (Ag2O(N))"
            ],
            "mismatches": [],
            "true_referents": [
                "Aluminum Nitride (AlN)",
                "Ammonium Nitrate (NH4NO3)",
                "Boron Nitride (BN)",
                "Calcium Nitride (Ca3N2)",
                "Chromium Nitride (CrN)",
                "Copper(I) Oxide Nitride (Cu2O(N))",
                "Dinitrogen Pentoxide (N2O5)",
                "Dinitrogen Trioxide (N2O3)",
                "Iron(II) Oxide Nitride (FeO(N))",
                "Iron(III) Oxide Nitride (Fe2O3(N))",
                "Magnesium Nitride (Mg3N2)",
                "Molybdenum Nitride (Mo2N)",
                "Nitrogen Dioxide (NO2)",
                "Nitrogen Monoxide (NO)",
                "Nitrous Oxide (N2O)",
                "Potassium Nitrate (KNO3)",
                "Silicon Nitride (Si3N4)",
                "Silver Oxide Nitride (Ag2O(N))",
                "Sodium Nitrite (NaNO2)",
                "Tetranitrogen Tetroxide (N2O4)",
                "Titanium Nitride (TiN)",
                "Tungsten Nitride (WN)",
                "Vanadium Nitride (VN)",
                "Zinc Nitride (Zn3N2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitrous Oxide (N2O)",
            "Nitric Oxide (NO)",
            "Nitrogen Dioxide (NO2)",
            "Dinitrogen Tetroxide (N2O4)",
            "Dinitrogen Pentoxide (N2O5)",
            "Nitrogen Trioxide (N2O3)",
            "Tetranitrogen Hexaoxide (N4O6)",
            "Trinitrogen Tetraoxide (N3O4)",
            "Pentanitrogen Octaoxide (N5O8)",
            "Hexanitrogen Decaoxide (N6O10)",
            "Trinitrogen Hexaoxide (N3O6)",
            "Tetranitrogen Octaoxide (N4O8)",
            "Pentanitrogen Decaoxide (N5O10)",
            "Hexanitrogen Dodecaoxide (N6O12)",
            "Heptanitrogen Tetraoxide (N7O4)",
            "Octanitrogen Hexaoxide (N8O6)",
            "Nonanitrogen Octaoxide (N9O8)",
            "Decanitrogen Decaoxide (N10O10)",
            "Undecanitrogen Dodecaoxide (N11O12)",
            "Dodecanitrogen Tetradecaoxide (N12O14)",
            "Tridecanitrogen Hexadecaoxide (N13O16)",
            "Tetradecanitrogen Octadecaoxide (N14O18)",
            "Pentadecanitrogen Eicosaoxide (N15O20)",
            "Hexadecanitrogen Docosaoxide (N16O22)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrous Oxide (N2O)",
                "Nitric Oxide (NO)",
                "Nitrogen Dioxide (NO2)",
                "Dinitrogen Tetroxide (N2O4)",
                "Dinitrogen Pentoxide (N2O5)",
                "Nitrogen Trioxide (N2O3)",
                "Tetranitrogen Hexaoxide (N4O6)",
                "Trinitrogen Tetraoxide (N3O4)",
                "Pentanitrogen Octaoxide (N5O8)",
                "Hexanitrogen Decaoxide (N6O10)",
                "Trinitrogen Hexaoxide (N3O6)",
                "Tetranitrogen Octaoxide (N4O8)",
                "Pentanitrogen Decaoxide (N5O10)",
                "Hexanitrogen Dodecaoxide (N6O12)",
                "Heptanitrogen Tetraoxide (N7O4)",
                "Octanitrogen Hexaoxide (N8O6)",
                "Nonanitrogen Octaoxide (N9O8)",
                "Decanitrogen Decaoxide (N10O10)",
                "Undecanitrogen Dodecaoxide (N11O12)",
                "Dodecanitrogen Tetradecaoxide (N12O14)",
                "Tridecanitrogen Hexadecaoxide (N13O16)",
                "Tetradecanitrogen Octadecaoxide (N14O18)",
                "Pentadecanitrogen Eicosaoxide (N15O20)",
                "Hexadecanitrogen Docosaoxide (N16O22)"
            ],
            "mismatches": [],
            "true_referents": [
                "Decanitrogen Decaoxide (N10O10)",
                "Dinitrogen Pentoxide (N2O5)",
                "Dinitrogen Tetroxide (N2O4)",
                "Dodecanitrogen Tetradecaoxide (N12O14)",
                "Heptanitrogen Tetraoxide (N7O4)",
                "Hexadecanitrogen Docosaoxide (N16O22)",
                "Hexanitrogen Decaoxide (N6O10)",
                "Hexanitrogen Dodecaoxide (N6O12)",
                "Nitric Oxide (NO)",
                "Nitrogen Dioxide (NO2)",
                "Nitrogen Trioxide (N2O3)",
                "Nitrous Oxide (N2O)",
                "Nonanitrogen Octaoxide (N9O8)",
                "Octanitrogen Hexaoxide (N8O6)",
                "Pentadecanitrogen Eicosaoxide (N15O20)",
                "Pentanitrogen Decaoxide (N5O10)",
                "Pentanitrogen Octaoxide (N5O8)",
                "Tetradecanitrogen Octadecaoxide (N14O18)",
                "Tetranitrogen Hexaoxide (N4O6)",
                "Tetranitrogen Octaoxide (N4O8)",
                "Tridecanitrogen Hexadecaoxide (N13O16)",
                "Trinitrogen Hexaoxide (N3O6)",
                "Trinitrogen Tetraoxide (N3O4)",
                "Undecanitrogen Dodecaoxide (N11O12)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitrogen dioxide (NO2)",
            "Dinitrogen tetroxide (N2O4)",
            "Nitrous oxide (N2O)",
            "Nitrogen trioxide (N2O3)",
            "Nitrogen pentoxide (N2O5)",
            "Nitrogen monoxide (NO)",
            "Ammonium nitrate (NH4NO3)",
            "Sodium nitrite (NaNO2)",
            "Potassium nitrate (KNO3)",
            "Calcium nitrate (Ca(NO3)2)",
            "Barium nitrate (Ba(NO3)2)",
            "Magnesium nitrate (Mg(NO3)2)",
            "Aluminum nitride (AlN)",
            "Silicon nitride (Si3N4)",
            "Titanium nitride (TiN)",
            "Zinc nitride (Zn3N2)",
            "Iron(III) nitride (FeN)",
            "Copper(I) nitride (Cu3N)",
            "Lead(II) nitride (Pb3N2)",
            "Gallium nitride (GaN)",
            "Indium nitride (InN)",
            "Boron nitride (BN)",
            "Tin(II) nitride (Sn3N4)",
            "Manganese(II) nitride (Mn3N2)",
            "Nickel(II) nitride (Ni3N2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrogen dioxide (NO2)",
                "Dinitrogen tetroxide (N2O4)",
                "Nitrous oxide (N2O)",
                "Nitrogen trioxide (N2O3)",
                "Nitrogen pentoxide (N2O5)",
                "Nitrogen monoxide (NO)",
                "Ammonium nitrate (NH4NO3)",
                "Sodium nitrite (NaNO2)",
                "Potassium nitrate (KNO3)",
                "Calcium nitrate (Ca(NO3)2)",
                "Barium nitrate (Ba(NO3)2)",
                "Magnesium nitrate (Mg(NO3)2)",
                "Aluminum nitride (AlN)",
                "Silicon nitride (Si3N4)",
                "Titanium nitride (TiN)",
                "Zinc nitride (Zn3N2)",
                "Iron(III) nitride (FeN)",
                "Copper(I) nitride (Cu3N)",
                "Lead(II) nitride (Pb3N2)",
                "Gallium nitride (GaN)",
                "Indium nitride (InN)",
                "Boron nitride (BN)",
                "Tin(II) nitride (Sn3N4)",
                "Manganese(II) nitride (Mn3N2)"
            ],
            "mismatches": [
                "Nickel(II) nitride (Ni3N2)"
            ],
            "true_referents": [
                "Aluminum nitride (AlN)",
                "Ammonium nitrate (NH4NO3)",
                "Barium nitrate (Ba(NO3)2)",
                "Boron nitride (BN)",
                "Calcium nitrate (Ca(NO3)2)",
                "Copper(I) nitride (Cu3N)",
                "Dinitrogen tetroxide (N2O4)",
                "Gallium nitride (GaN)",
                "Indium nitride (InN)",
                "Iron(III) nitride (FeN)",
                "Lead(II) nitride (Pb3N2)",
                "Magnesium nitrate (Mg(NO3)2)",
                "Manganese(II) nitride (Mn3N2)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen monoxide (NO)",
                "Nitrogen pentoxide (N2O5)",
                "Nitrogen trioxide (N2O3)",
                "Nitrous oxide (N2O)",
                "Potassium nitrate (KNO3)",
                "Silicon nitride (Si3N4)",
                "Sodium nitrite (NaNO2)",
                "Tin(II) nitride (Sn3N4)",
                "Titanium nitride (TiN)",
                "Zinc nitride (Zn3N2)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Ammonium Nitrate (NH4NO3)",
            "Dinitrogen Pentoxide (N2O5)",
            "Dinitrogen Tetroxide (N2O4)",
            "Dinitrogen Trioxide (N2O3)",
            "Hyponitrous Acid (H2N2O2)",
            "Hyponitric Acid (HNO)",
            "Lead Nitrate (Pb(NO3)2)",
            "Potassium Nitrate (KNO3)",
            "Sodium Nitrate (NaNO3)",
            "Calcium Nitrate (Ca(NO3)2)",
            "Barium Nitrate (Ba(NO3)2)",
            "Strontium Nitrate (Sr(NO3)2)",
            "Magnesium Nitrate (Mg(NO3)2)",
            "Zinc Nitrate (Zn(NO3)2)",
            "Copper Nitrate (Cu(NO3)2)",
            "Silver Nitrate (AgNO3)",
            "Nickel Nitrate (Ni(NO3)2)",
            "Cadmium Nitrate (Cd(NO3)2)",
            "Mercury Nitrate (Hg(NO3)2)",
            "Aluminum Nitrate (Al(NO3)3)",
            "Chromium Nitrate (Cr(NO3)3)",
            "Iron Nitrate (Fe(NO3)3)",
            "Cobalt Nitrate (Co(NO3)2)",
            "Manganese Nitrate (Mn(NO3)2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ammonium Nitrate (NH4NO3)",
                "Dinitrogen Pentoxide (N2O5)",
                "Dinitrogen Tetroxide (N2O4)",
                "Dinitrogen Trioxide (N2O3)",
                "Hyponitrous Acid (H2N2O2)",
                "Hyponitric Acid (HNO)",
                "Lead Nitrate (Pb(NO3)2)",
                "Potassium Nitrate (KNO3)",
                "Sodium Nitrate (NaNO3)",
                "Calcium Nitrate (Ca(NO3)2)",
                "Barium Nitrate (Ba(NO3)2)",
                "Strontium Nitrate (Sr(NO3)2)",
                "Magnesium Nitrate (Mg(NO3)2)",
                "Zinc Nitrate (Zn(NO3)2)",
                "Copper Nitrate (Cu(NO3)2)",
                "Silver Nitrate (AgNO3)",
                "Nickel Nitrate (Ni(NO3)2)",
                "Cadmium Nitrate (Cd(NO3)2)",
                "Mercury Nitrate (Hg(NO3)2)",
                "Aluminum Nitrate (Al(NO3)3)",
                "Chromium Nitrate (Cr(NO3)3)",
                "Iron Nitrate (Fe(NO3)3)",
                "Cobalt Nitrate (Co(NO3)2)",
                "Manganese Nitrate (Mn(NO3)2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aluminum Nitrate (Al(NO3)3)",
                "Ammonium Nitrate (NH4NO3)",
                "Barium Nitrate (Ba(NO3)2)",
                "Cadmium Nitrate (Cd(NO3)2)",
                "Calcium Nitrate (Ca(NO3)2)",
                "Chromium Nitrate (Cr(NO3)3)",
                "Cobalt Nitrate (Co(NO3)2)",
                "Copper Nitrate (Cu(NO3)2)",
                "Dinitrogen Pentoxide (N2O5)",
                "Dinitrogen Tetroxide (N2O4)",
                "Dinitrogen Trioxide (N2O3)",
                "Hyponitric Acid (HNO)",
                "Hyponitrous Acid (H2N2O2)",
                "Iron Nitrate (Fe(NO3)3)",
                "Lead Nitrate (Pb(NO3)2)",
                "Magnesium Nitrate (Mg(NO3)2)",
                "Manganese Nitrate (Mn(NO3)2)",
                "Mercury Nitrate (Hg(NO3)2)",
                "Nickel Nitrate (Ni(NO3)2)",
                "Potassium Nitrate (KNO3)",
                "Silver Nitrate (AgNO3)",
                "Sodium Nitrate (NaNO3)",
                "Strontium Nitrate (Sr(NO3)2)",
                "Zinc Nitrate (Zn(NO3)2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": "",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitric oxide (NO)",
            "Nitrogen dioxide (NO\u2082)",
            "Dinitrogen tetroxide (N\u2082O\u2084)",
            "Dinitrogen trioxide (N\u2082O\u2083)",
            "Nitrous oxide (N\u2082O)",
            "Dinitrogen pentoxide (N\u2082O\u2085)",
            "Nitronium oxide (NO\u207aO\u207b)",
            "Nitrate anion (NO\u2083\u207b)",
            "Nitrite anion (NO\u2082\u207b)",
            "Peroxynitric acid (HNO\u2084)",
            "Nitrosyl fluoride oxide (NOF\u2093O)",
            "Acetyl nitrate (CH\u2083COONO\u2082)",
            "Peroxynitric anhydride (ONOOOH)",
            "Nitrosyl chloride oxide (NOClO)",
            "Nitrated titanium oxide (TiONO\u2082)",
            "Nitrated zinc oxide (Zn(NO\u2083)\u2082O)",
            "Nitrated magnesium oxide (Mg(NO\u2083)\u2082O)",
            "Nitrated aluminum oxide (Al(NO\u2083)\u2083O)",
            "Hydrogen nitrate oxide (HNO\u2082O)",
            "Ammonium nitrate oxide (NH\u2084NO\u2083O)",
            "Sodium nitrate oxide (NaNO\u2083O)",
            "Potassium nitrate oxide (KNO\u2083O)",
            "Calcium nitrate oxide (Ca(NO\u2083)\u2082O)",
            "Barium nitrate oxide (Ba(NO\u2083)\u2082O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO\u2082)",
                "Dinitrogen tetroxide (N\u2082O\u2084)",
                "Dinitrogen trioxide (N\u2082O\u2083)",
                "Nitrous oxide (N\u2082O)",
                "Dinitrogen pentoxide (N\u2082O\u2085)",
                "Nitronium oxide (NO\u207aO\u207b)",
                "Nitrate anion (NO\u2083\u207b)",
                "Nitrite anion (NO\u2082\u207b)",
                "Peroxynitric acid (HNO\u2084)",
                "Nitrosyl fluoride oxide (NOF\u2093O)",
                "Acetyl nitrate (CH\u2083COONO\u2082)",
                "Peroxynitric anhydride (ONOOOH)",
                "Nitrosyl chloride oxide (NOClO)",
                "Nitrated titanium oxide (TiONO\u2082)",
                "Nitrated zinc oxide (Zn(NO\u2083)\u2082O)",
                "Nitrated magnesium oxide (Mg(NO\u2083)\u2082O)",
                "Nitrated aluminum oxide (Al(NO\u2083)\u2083O)",
                "Hydrogen nitrate oxide (HNO\u2082O)",
                "Ammonium nitrate oxide (NH\u2084NO\u2083O)",
                "Sodium nitrate oxide (NaNO\u2083O)",
                "Potassium nitrate oxide (KNO\u2083O)",
                "Calcium nitrate oxide (Ca(NO\u2083)\u2082O)",
                "Barium nitrate oxide (Ba(NO\u2083)\u2082O)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl nitrate (CH\u2083COONO\u2082)",
                "Ammonium nitrate oxide (NH\u2084NO\u2083O)",
                "Barium nitrate oxide (Ba(NO\u2083)\u2082O)",
                "Calcium nitrate oxide (Ca(NO\u2083)\u2082O)",
                "Dinitrogen pentoxide (N\u2082O\u2085)",
                "Dinitrogen tetroxide (N\u2082O\u2084)",
                "Dinitrogen trioxide (N\u2082O\u2083)",
                "Hydrogen nitrate oxide (HNO\u2082O)",
                "Nitrate anion (NO\u2083\u207b)",
                "Nitrated aluminum oxide (Al(NO\u2083)\u2083O)",
                "Nitrated magnesium oxide (Mg(NO\u2083)\u2082O)",
                "Nitrated titanium oxide (TiONO\u2082)",
                "Nitrated zinc oxide (Zn(NO\u2083)\u2082O)",
                "Nitric oxide (NO)",
                "Nitrite anion (NO\u2082\u207b)",
                "Nitrogen dioxide (NO\u2082)",
                "Nitronium oxide (NO\u207aO\u207b)",
                "Nitrosyl chloride oxide (NOClO)",
                "Nitrosyl fluoride oxide (NOF\u2093O)",
                "Nitrous oxide (N\u2082O)",
                "Peroxynitric acid (HNO\u2084)",
                "Peroxynitric anhydride (ONOOOH)",
                "Potassium nitrate oxide (KNO\u2083O)",
                "Sodium nitrate oxide (NaNO\u2083O)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitrous oxide (N2O)",
            "Nitrogen dioxide (NO2)",
            "Dinitrogen trioxide (N2O3)",
            "Dinitrogen tetroxide (N2O4)",
            "Dinitrogen pentoxide (N2O5)",
            "Nitric oxide (NO)",
            "Nitrogen trioxide (NO3)",
            "Nitrosyl hydroxide (HNO2)",
            "Nitric acid (HNO3)",
            "Peroxynitrous acid (HOONO)",
            "Peroxynitric acid (HOONO2)",
            "Nitronium nitrate (NO2NO3)",
            "Nitrosyl perchlorate (NOClO4)",
            "Nitrosyl fluoride (NOF)",
            "Nitrosyl chloride (NOCl)",
            "Nitrosyl bromide (NOBr)",
            "Nitrosyl iodide (NOI)",
            "Nitryl fluoride (NO2F)",
            "Nitryl chloride (NO2Cl)",
            "Nitryl bromide (NO2Br)",
            "Nitryl iodide (NO2I)",
            "Nitrosyl azide (NON3)",
            "Nitrosyl cyanide (NOCN)",
            "Nitrosyl thiocyanate (NOSCN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrous oxide (N2O)",
                "Nitrogen dioxide (NO2)",
                "Dinitrogen trioxide (N2O3)",
                "Dinitrogen tetroxide (N2O4)",
                "Dinitrogen pentoxide (N2O5)",
                "Nitric oxide (NO)",
                "Nitrogen trioxide (NO3)",
                "Nitrosyl hydroxide (HNO2)",
                "Nitric acid (HNO3)",
                "Peroxynitrous acid (HOONO)",
                "Peroxynitric acid (HOONO2)",
                "Nitronium nitrate (NO2NO3)",
                "Nitrosyl perchlorate (NOClO4)",
                "Nitrosyl fluoride (NOF)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosyl bromide (NOBr)",
                "Nitrosyl iodide (NOI)",
                "Nitryl fluoride (NO2F)",
                "Nitryl chloride (NO2Cl)",
                "Nitryl bromide (NO2Br)",
                "Nitryl iodide (NO2I)",
                "Nitrosyl azide (NON3)",
                "Nitrosyl cyanide (NOCN)",
                "Nitrosyl thiocyanate (NOSCN)"
            ],
            "mismatches": [],
            "true_referents": [
                "Dinitrogen pentoxide (N2O5)",
                "Dinitrogen tetroxide (N2O4)",
                "Dinitrogen trioxide (N2O3)",
                "Nitric acid (HNO3)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen trioxide (NO3)",
                "Nitronium nitrate (NO2NO3)",
                "Nitrosyl azide (NON3)",
                "Nitrosyl bromide (NOBr)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosyl cyanide (NOCN)",
                "Nitrosyl fluoride (NOF)",
                "Nitrosyl hydroxide (HNO2)",
                "Nitrosyl iodide (NOI)",
                "Nitrosyl perchlorate (NOClO4)",
                "Nitrosyl thiocyanate (NOSCN)",
                "Nitrous oxide (N2O)",
                "Nitryl bromide (NO2Br)",
                "Nitryl chloride (NO2Cl)",
                "Nitryl fluoride (NO2F)",
                "Nitryl iodide (NO2I)",
                "Peroxynitric acid (HOONO2)",
                "Peroxynitrous acid (HOONO)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Nitric oxide (NO)",
            "Nitrous oxide (N2O)",
            "Dinitrogen trioxide (N2O3)",
            "Dinitrogen tetroxide (N2O4)",
            "Dinitrogen pentoxide (N2O5)",
            "Nitrogen dioxide (NO2)",
            "Nitrogen monoxide (NO)",
            "Nitroxyl (HNO)",
            "Peroxynitrite (ONOO\u2212)",
            "Peroxynitrous acid (ONOOH)",
            "Nitrite (NO2\u2212)",
            "Nitrate (NO3\u2212)",
            "Orthonitric acid (H3NO4)",
            "Peroxonitric acid (HOONO2)",
            "Nitryl chloride (NO2Cl)",
            "Nitrosyl chloride (NOCl)",
            "Nitrosonium (NO+)",
            "Nitronium (NO2+)",
            "Nitrosyl (NO\u2212)",
            "Hyponitrous acid (H2N2O2)",
            "Nitroamide (NO2NH2)",
            "Nitroamine (NHNO2)",
            "Nitrosamine (R2NNO)",
            "Azide (N3\u2212)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitric oxide (NO)",
                "Nitrous oxide (N2O)",
                "Dinitrogen trioxide (N2O3)",
                "Dinitrogen tetroxide (N2O4)",
                "Dinitrogen pentoxide (N2O5)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen monoxide (NO)",
                "Nitroxyl (HNO)",
                "Peroxynitrite (ONOO\u2212)",
                "Peroxynitrous acid (ONOOH)",
                "Nitrite (NO2\u2212)",
                "Nitrate (NO3\u2212)",
                "Orthonitric acid (H3NO4)",
                "Peroxonitric acid (HOONO2)",
                "Nitryl chloride (NO2Cl)",
                "Nitrosyl chloride (NOCl)",
                "Nitrosonium (NO+)",
                "Nitronium (NO2+)",
                "Nitrosyl (NO\u2212)",
                "Hyponitrous acid (H2N2O2)",
                "Nitroamide (NO2NH2)",
                "Nitroamine (NHNO2)",
                "Nitrosamine (R2NNO)",
                "Azide (N3\u2212)"
            ],
            "mismatches": [],
            "true_referents": [
                "Azide (N3\u2212)",
                "Dinitrogen pentoxide (N2O5)",
                "Dinitrogen tetroxide (N2O4)",
                "Dinitrogen trioxide (N2O3)",
                "Hyponitrous acid (H2N2O2)",
                "Nitrate (NO3\u2212)",
                "Nitric oxide (NO)",
                "Nitrite (NO2\u2212)",
                "Nitroamide (NO2NH2)",
                "Nitroamine (NHNO2)",
                "Nitrogen dioxide (NO2)",
                "Nitrogen monoxide (NO)",
                "Nitronium (NO2+)",
                "Nitrosamine (R2NNO)",
                "Nitrosonium (NO+)",
                "Nitrosyl (NO\u2212)",
                "Nitrosyl chloride (NOCl)",
                "Nitrous oxide (N2O)",
                "Nitroxyl (HNO)",
                "Nitryl chloride (NO2Cl)",
                "Orthonitric acid (H3NO4)",
                "Peroxonitric acid (HOONO2)",
                "Peroxynitrite (ONOO\u2212)",
                "Peroxynitrous acid (ONOOH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "nitrous oxide (N2O)",
            "nitric oxide (NO)",
            "nitrogen dioxide (NO2)",
            "dinitrogen trioxide (N2O3)",
            "dinitrogen tetroxide (N2O4)",
            "dinitrogen pentoxide (N2O5)",
            "nitrogen monoxide (NO)",
            "nitrogen sesquioxide (N2O3)",
            "nitrogen trioxide (NO3)",
            "nitrogen tetroxide (N2O4)",
            "nitrogen pentoxide (N2O5)",
            "nitrosyl chloride (NOCl)",
            "nitrosyl bromide (NOBr)",
            "nitrosyl iodide (NOI)",
            "nitrosyl fluoride (NOF)",
            "nitrosyl cyanide (NONCN)",
            "nitrosyl azide (NON3)",
            "nitrosyl thiocyanate (NONCS)",
            "nitrosyl perchlorate (NO(ClO4))",
            "nitrosyl nitrate (NO(NO3))",
            "nitrosyl sulfate (NO(SO4))",
            "nitrosyl phosphate (NO(PO4))",
            "nitrosyl carbonate (NO(CO3))"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "nitrous oxide (N2O)",
                "nitric oxide (NO)",
                "nitrogen dioxide (NO2)",
                "dinitrogen trioxide (N2O3)",
                "dinitrogen tetroxide (N2O4)",
                "dinitrogen pentoxide (N2O5)",
                "nitrogen monoxide (NO)",
                "nitrogen sesquioxide (N2O3)",
                "nitrogen trioxide (NO3)",
                "nitrogen tetroxide (N2O4)",
                "nitrogen pentoxide (N2O5)",
                "nitrosyl chloride (NOCl)",
                "nitrosyl bromide (NOBr)",
                "nitrosyl iodide (NOI)",
                "nitrosyl fluoride (NOF)",
                "nitrosyl cyanide (NONCN)",
                "nitrosyl azide (NON3)",
                "nitrosyl thiocyanate (NONCS)",
                "nitrosyl perchlorate (NO(ClO4))",
                "nitrosyl nitrate (NO(NO3))",
                "nitrosyl sulfate (NO(SO4))",
                "nitrosyl phosphate (NO(PO4))",
                "nitrosyl carbonate (NO(CO3))"
            ],
            "mismatches": [],
            "true_referents": [
                "dinitrogen pentoxide (N2O5)",
                "dinitrogen tetroxide (N2O4)",
                "dinitrogen trioxide (N2O3)",
                "nitric oxide (NO)",
                "nitrogen dioxide (NO2)",
                "nitrogen monoxide (NO)",
                "nitrogen pentoxide (N2O5)",
                "nitrogen sesquioxide (N2O3)",
                "nitrogen tetroxide (N2O4)",
                "nitrogen trioxide (NO3)",
                "nitrosyl azide (NON3)",
                "nitrosyl bromide (NOBr)",
                "nitrosyl carbonate (NO(CO3))",
                "nitrosyl chloride (NOCl)",
                "nitrosyl cyanide (NONCN)",
                "nitrosyl fluoride (NOF)",
                "nitrosyl iodide (NOI)",
                "nitrosyl nitrate (NO(NO3))",
                "nitrosyl perchlorate (NO(ClO4))",
                "nitrosyl phosphate (NO(PO4))",
                "nitrosyl sulfate (NO(SO4))",
                "nitrosyl thiocyanate (NONCS)",
                "nitrous oxide (N2O)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Ammonium nitrate (NH4NO3)",
            "Ammonium sulfate ((NH4)2SO4)",
            "Calcium nitrate (Ca(NO3)2)",
            "Sodium nitrate (NaNO3)",
            "Potassium nitrate (KNO3)",
            "Nitric acid (HNO3)",
            "Nitrogen dioxide (NO2)",
            "Nitrous oxide (N2O)",
            "Nitric oxide (NO)",
            "Hydrazine (N2H4)",
            "Hydroxylamine (NH2OH)",
            "Urea (CO(NH2)2)",
            "Guanidine (CH6N3)",
            "Cyanide (CN-)",
            "Cyanamide (CH2N2)",
            "Ammonium chloride (NH4Cl)",
            "Ammonium phosphate ((NH4)3PO4)",
            "Ammonium carbonate ((NH4)2CO3)",
            "Ammonium sulfite ((NH4)2SO3)",
            "Ammonium nitrite (NH4NO2)",
            "Ammonium perchlorate (NH4ClO4)",
            "Ammonium formate (HCOONH4)",
            "Ammonium acetate (CH3COONH4)",
            "Ammonium oxalate ((NH4)2C2O4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ammonium nitrate (NH4NO3)",
                "Ammonium sulfate ((NH4)2SO4)",
                "Calcium nitrate (Ca(NO3)2)",
                "Sodium nitrate (NaNO3)",
                "Potassium nitrate (KNO3)",
                "Nitric acid (HNO3)",
                "Nitrogen dioxide (NO2)",
                "Nitrous oxide (N2O)",
                "Nitric oxide (NO)",
                "Hydrazine (N2H4)",
                "Hydroxylamine (NH2OH)",
                "Urea (CO(NH2)2)",
                "Guanidine (CH6N3)",
                "Cyanide (CN-)",
                "Cyanamide (CH2N2)",
                "Ammonium chloride (NH4Cl)",
                "Ammonium phosphate ((NH4)3PO4)",
                "Ammonium carbonate ((NH4)2CO3)",
                "Ammonium sulfite ((NH4)2SO3)",
                "Ammonium nitrite (NH4NO2)",
                "Ammonium perchlorate (NH4ClO4)",
                "Ammonium formate (HCOONH4)",
                "Ammonium acetate (CH3COONH4)",
                "Ammonium oxalate ((NH4)2C2O4)"
            ],
            "mismatches": [],
            "true_referents": [
                "Ammonium acetate (CH3COONH4)",
                "Ammonium carbonate ((NH4)2CO3)",
                "Ammonium chloride (NH4Cl)",
                "Ammonium formate (HCOONH4)",
                "Ammonium nitrate (NH4NO3)",
                "Ammonium nitrite (NH4NO2)",
                "Ammonium oxalate ((NH4)2C2O4)",
                "Ammonium perchlorate (NH4ClO4)",
                "Ammonium phosphate ((NH4)3PO4)",
                "Ammonium sulfate ((NH4)2SO4)",
                "Ammonium sulfite ((NH4)2SO3)",
                "Calcium nitrate (Ca(NO3)2)",
                "Cyanamide (CH2N2)",
                "Cyanide (CN-)",
                "Guanidine (CH6N3)",
                "Hydrazine (N2H4)",
                "Hydroxylamine (NH2OH)",
                "Nitric acid (HNO3)",
                "Nitric oxide (NO)",
                "Nitrogen dioxide (NO2)",
                "Nitrous oxide (N2O)",
                "Potassium nitrate (KNO3)",
                "Sodium nitrate (NaNO3)",
                "Urea (CO(NH2)2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Titanium dioxide (TiO2)",
            "Zirconium nitride (ZrN)",
            "Titanium nitride (TiN)",
            "Zirconium oxide (ZrO2)",
            "Silicon nitride (Si3N4)",
            "Aluminum nitride (AlN)",
            "Tantalum nitride (Ta3N5)",
            "Hafnium nitride (HfN)",
            "Barium nitride (Ba3N2)",
            "Strontium nitride (Sr3N2)",
            "Calcium nitride (Ca3N2)",
            "Magnesium nitride (Mg3N2)",
            "Lithium nitride (Li3N)",
            "Sodium nitride (Na3N)",
            "Potassium nitride (K3N)",
            "Rubidium nitride (Rb3N)",
            "Caesium nitride (Cs3N)",
            "Rhenium oxide (Re2O7)",
            "Osmium oxide (OsO4)",
            "Iridium oxide (IrO2)",
            "Platinum oxide (PtO2)",
            "Rhodium oxide (Rh2O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Titanium dioxide (TiO2)",
                "Zirconium nitride (ZrN)",
                "Titanium nitride (TiN)",
                "Zirconium oxide (ZrO2)",
                "Silicon nitride (Si3N4)",
                "Aluminum nitride (AlN)",
                "Tantalum nitride (Ta3N5)",
                "Hafnium nitride (HfN)",
                "Barium nitride (Ba3N2)",
                "Strontium nitride (Sr3N2)",
                "Calcium nitride (Ca3N2)",
                "Magnesium nitride (Mg3N2)",
                "Lithium nitride (Li3N)",
                "Sodium nitride (Na3N)",
                "Potassium nitride (K3N)",
                "Rubidium nitride (Rb3N)",
                "Caesium nitride (Cs3N)",
                "Rhenium oxide (Re2O7)",
                "Osmium oxide (OsO4)",
                "Iridium oxide (IrO2)",
                "Platinum oxide (PtO2)",
                "Rhodium oxide (Rh2O3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aluminum nitride (AlN)",
                "Barium nitride (Ba3N2)",
                "Caesium nitride (Cs3N)",
                "Calcium nitride (Ca3N2)",
                "Hafnium nitride (HfN)",
                "Iridium oxide (IrO2)",
                "Lithium nitride (Li3N)",
                "Magnesium nitride (Mg3N2)",
                "Osmium oxide (OsO4)",
                "Platinum oxide (PtO2)",
                "Potassium nitride (K3N)",
                "Rhenium oxide (Re2O7)",
                "Rhodium oxide (Rh2O3)",
                "Rubidium nitride (Rb3N)",
                "Silicon nitride (Si3N4)",
                "Sodium nitride (Na3N)",
                "Strontium nitride (Sr3N2)",
                "Tantalum nitride (Ta3N5)",
                "Titanium dioxide (TiO2)",
                "Titanium nitride (TiN)",
                "Zirconium nitride (ZrN)",
                "Zirconium oxide (ZrO2)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            "Silicon nitride (Si3N4)",
            "Aluminum nitride (AlN)",
            "Boron nitride (BN)",
            "Titanium nitride (TiN)",
            "Zirconium nitride (ZrN)",
            "Hafnium nitride (HfN)",
            "Germanium nitride (Ge3N4)",
            "Cerium nitride (CeN)",
            "Lanthanum nitride (LaN)",
            "Actinium nitride (AcN)",
            "Thorium nitride (Th3N4)",
            "Uranium nitride (UN)",
            "Neodymium nitride (NdN)",
            "Praseodymium nitride (PrN)",
            "Samarium nitride (SmN)",
            "Europium nitride (EuN)",
            "Gadolinium nitride (GdN)",
            "Terbium nitride (TbN)",
            "Dysprosium nitride (DyN)",
            "Holmium nitride (HoN)",
            "Erbium nitride (ErN)",
            "Thulium nitride (TmN)",
            "Ytterbium nitride (YbN)",
            "Lutetium nitride (LuN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Silicon nitride (Si3N4)",
                "Aluminum nitride (AlN)",
                "Boron nitride (BN)",
                "Titanium nitride (TiN)",
                "Zirconium nitride (ZrN)",
                "Hafnium nitride (HfN)",
                "Germanium nitride (Ge3N4)",
                "Cerium nitride (CeN)",
                "Lanthanum nitride (LaN)",
                "Actinium nitride (AcN)",
                "Thorium nitride (Th3N4)",
                "Uranium nitride (UN)",
                "Neodymium nitride (NdN)",
                "Praseodymium nitride (PrN)",
                "Samarium nitride (SmN)",
                "Europium nitride (EuN)",
                "Gadolinium nitride (GdN)",
                "Terbium nitride (TbN)",
                "Dysprosium nitride (DyN)",
                "Holmium nitride (HoN)",
                "Erbium nitride (ErN)",
                "Thulium nitride (TmN)",
                "Ytterbium nitride (YbN)",
                "Lutetium nitride (LuN)"
            ],
            "mismatches": [],
            "true_referents": [
                "Actinium nitride (AcN)",
                "Aluminum nitride (AlN)",
                "Boron nitride (BN)",
                "Cerium nitride (CeN)",
                "Dysprosium nitride (DyN)",
                "Erbium nitride (ErN)",
                "Europium nitride (EuN)",
                "Gadolinium nitride (GdN)",
                "Germanium nitride (Ge3N4)",
                "Hafnium nitride (HfN)",
                "Holmium nitride (HoN)",
                "Lanthanum nitride (LaN)",
                "Lutetium nitride (LuN)",
                "Neodymium nitride (NdN)",
                "Praseodymium nitride (PrN)",
                "Samarium nitride (SmN)",
                "Silicon nitride (Si3N4)",
                "Terbium nitride (TbN)",
                "Thorium nitride (Th3N4)",
                "Thulium nitride (TmN)",
                "Titanium nitride (TiN)",
                "Uranium nitride (UN)",
                "Ytterbium nitride (YbN)",
                "Zirconium nitride (ZrN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "nitrogen oxide",
        "domain": "chemistry",
        "response": [
            {
                "Example": "Nitrogen dioxide",
                "Canonical name": "N2O2"
            },
            {
                "Example": "Nitrogen trioxide",
                "Canonical name": "N2O3"
            },
            {
                "Example": "Nitrogen tetroxide",
                "Canonical name": "N2O4"
            },
            {
                "Example": "Nitrogen pentoxide",
                "Canonical name": "N2O5"
            },
            {
                "Example": "Nitrogen hexoxide",
                "Canonical name": "N2O6"
            },
            {
                "Example": "Nitrogen heptoxide",
                "Canonical name": "N2O7"
            },
            {
                "Example": "Nitrogen octoxide",
                "Canonical name": "N2O8"
            },
            {
                "Example": "Nitrogen nonoxide",
                "Canonical name": "N2O9"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nitrogen dioxide",
                "Nitrogen trioxide",
                "Nitrogen tetroxide",
                "Nitrogen pentoxide",
                "Nitrogen hexoxide",
                "Nitrogen heptoxide",
                "Nitrogen octoxide",
                "Nitrogen nonoxide"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Example\": \"Nitrogen dioxide\", \"Canonical name\": \"N2O2\"}",
                "{\"Example\": \"Nitrogen heptoxide\", \"Canonical name\": \"N2O7\"}",
                "{\"Example\": \"Nitrogen hexoxide\", \"Canonical name\": \"N2O6\"}",
                "{\"Example\": \"Nitrogen nonoxide\", \"Canonical name\": \"N2O9\"}",
                "{\"Example\": \"Nitrogen octoxide\", \"Canonical name\": \"N2O8\"}",
                "{\"Example\": \"Nitrogen pentoxide\", \"Canonical name\": \"N2O5\"}",
                "{\"Example\": \"Nitrogen tetroxide\", \"Canonical name\": \"N2O4\"}",
                "{\"Example\": \"Nitrogen trioxide\", \"Canonical name\": \"N2O3\"}"
            ],
            "TP": 8,
            "FP": 0,
            "FN": 0
        }
    }
]