[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Propionic anhydride",
            "Butyric anhydride",
            "Valeric anhydride",
            "Hexanoic anhydride",
            "Heptanoic anhydride",
            "Octanoic anhydride",
            "Nonanoic anhydride",
            "Decanoic anhydride",
            "Undecanoic anhydride",
            "Dodecanoic anhydride",
            "Tridecanoic anhydride",
            "Myristic anhydride",
            "Pentadecanoic anhydride",
            "Palmitic anhydride",
            "Stearic anhydride",
            "Isobutyric anhydride",
            "Isopentanoic anhydride",
            "2-Methylbutyric anhydride",
            "3-Methylbutyric anhydride",
            "Phenylacetic anhydride",
            "Benzoic anhydride",
            "Toluic anhydride",
            "Trimellitic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Propionic anhydride",
                "Butyric anhydride",
                "Valeric anhydride",
                "Hexanoic anhydride",
                "Heptanoic anhydride",
                "Octanoic anhydride",
                "Nonanoic anhydride",
                "Decanoic anhydride",
                "Undecanoic anhydride",
                "Dodecanoic anhydride",
                "Tridecanoic anhydride",
                "Myristic anhydride",
                "Pentadecanoic anhydride",
                "Palmitic anhydride",
                "Stearic anhydride",
                "Isobutyric anhydride",
                "Isopentanoic anhydride",
                "2-Methylbutyric anhydride",
                "3-Methylbutyric anhydride",
                "Phenylacetic anhydride",
                "Benzoic anhydride",
                "Toluic anhydride",
                "Trimellitic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Methylbutyric anhydride",
                "3-Methylbutyric anhydride",
                "Acetic anhydride (Ac2O)",
                "Benzoic anhydride",
                "Butyric anhydride",
                "Decanoic anhydride",
                "Dodecanoic anhydride",
                "Heptanoic anhydride",
                "Hexanoic anhydride",
                "Isobutyric anhydride",
                "Isopentanoic anhydride",
                "Myristic anhydride",
                "Nonanoic anhydride",
                "Octanoic anhydride",
                "Palmitic anhydride",
                "Pentadecanoic anhydride",
                "Phenylacetic anhydride",
                "Propionic anhydride",
                "Stearic anhydride",
                "Toluic anhydride",
                "Tridecanoic anhydride",
                "Trimellitic anhydride",
                "Undecanoic anhydride",
                "Valeric anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Propionic anhydride (C3H6O3)",
            "Butyric anhydride (C8H14O3)",
            "Valeric anhydride (C10H18O3)",
            "Glutaric anhydride (C10H16O3)",
            "Adipic anhydride (C12H20O3)",
            "Phthalic anhydride (C8H4O3)",
            "Maleic anhydride (C4H2O3)",
            "Fumaric anhydride (C4H2O3)",
            "Succinic anhydride (C4H4O3)",
            "Glutaric anhydride (C10H16O3)",
            "Pimelic anhydride (C14H20O3)",
            "Suberic anhydride (C16H28O3)",
            "Azelaic anhydride (C18H30O3)",
            "Sebacic anhydride (C16H28O3)",
            "Benzoic anhydride (C14H10O3)",
            "Isobutyric anhydride (C8H14O3)",
            "Isovaleric anhydride (C10H18O3)",
            "Cyclopentanecarboxylic anhydride (C11H18O3)",
            "Cyclohexanecarboxylic anhydride (C13H20O3)",
            "Cycloheptanecarboxylic anhydride (C15H24O3)",
            "Cyclooctanecarboxylic anhydride (C17H28O3)",
            "Terephthalic anhydride (C8H4O3)",
            "Hexahydrophthalic anhydride (C8H10O3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Propionic anhydride (C3H6O3)",
                "Butyric anhydride (C8H14O3)",
                "Valeric anhydride (C10H18O3)",
                "Glutaric anhydride (C10H16O3)",
                "Adipic anhydride (C12H20O3)",
                "Phthalic anhydride (C8H4O3)",
                "Maleic anhydride (C4H2O3)",
                "Fumaric anhydride (C4H2O3)",
                "Succinic anhydride (C4H4O3)",
                "Pimelic anhydride (C14H20O3)",
                "Suberic anhydride (C16H28O3)",
                "Azelaic anhydride (C18H30O3)",
                "Sebacic anhydride (C16H28O3)",
                "Benzoic anhydride (C14H10O3)",
                "Isobutyric anhydride (C8H14O3)",
                "Isovaleric anhydride (C10H18O3)",
                "Cyclopentanecarboxylic anhydride (C11H18O3)",
                "Cyclohexanecarboxylic anhydride (C13H20O3)",
                "Cycloheptanecarboxylic anhydride (C15H24O3)",
                "Cyclooctanecarboxylic anhydride (C17H28O3)",
                "Terephthalic anhydride (C8H4O3)",
                "Hexahydrophthalic anhydride (C8H10O3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (Ac2O)",
                "Adipic anhydride (C12H20O3)",
                "Azelaic anhydride (C18H30O3)",
                "Benzoic anhydride (C14H10O3)",
                "Butyric anhydride (C8H14O3)",
                "Cycloheptanecarboxylic anhydride (C15H24O3)",
                "Cyclohexanecarboxylic anhydride (C13H20O3)",
                "Cyclooctanecarboxylic anhydride (C17H28O3)",
                "Cyclopentanecarboxylic anhydride (C11H18O3)",
                "Fumaric anhydride (C4H2O3)",
                "Glutaric anhydride (C10H16O3)",
                "Hexahydrophthalic anhydride (C8H10O3)",
                "Isobutyric anhydride (C8H14O3)",
                "Isovaleric anhydride (C10H18O3)",
                "Maleic anhydride (C4H2O3)",
                "Phthalic anhydride (C8H4O3)",
                "Pimelic anhydride (C14H20O3)",
                "Propionic anhydride (C3H6O3)",
                "Sebacic anhydride (C16H28O3)",
                "Suberic anhydride (C16H28O3)",
                "Succinic anhydride (C4H4O3)",
                "Terephthalic anhydride (C8H4O3)",
                "Valeric anhydride (C10H18O3)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Propionic anhydride",
            "Butyric anhydride",
            "Isobutyric anhydride",
            "Valeric anhydride",
            "Isovaleric anhydride",
            "Pivalic anhydride",
            "Hexanoic anhydride",
            "Heptanoic anhydride",
            "Octanoic anhydride",
            "Nonanoic anhydride",
            "Decanoic anhydride",
            "Benzoic anhydride",
            "Phthalic anhydride",
            "Maleic anhydride",
            "Succinic anhydride",
            "Glutaric anhydride",
            "Adipic anhydride",
            "Pimelic anhydride",
            "Suberic anhydride",
            "Azelaic anhydride",
            "Sebacic anhydride",
            "Terephthalic anhydride",
            "Trimellitic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Propionic anhydride",
                "Butyric anhydride",
                "Isobutyric anhydride",
                "Valeric anhydride",
                "Isovaleric anhydride",
                "Pivalic anhydride",
                "Hexanoic anhydride",
                "Heptanoic anhydride",
                "Octanoic anhydride",
                "Nonanoic anhydride",
                "Decanoic anhydride",
                "Benzoic anhydride",
                "Phthalic anhydride",
                "Maleic anhydride",
                "Succinic anhydride",
                "Glutaric anhydride",
                "Adipic anhydride",
                "Pimelic anhydride",
                "Suberic anhydride",
                "Azelaic anhydride",
                "Sebacic anhydride",
                "Terephthalic anhydride",
                "Trimellitic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (Ac2O)",
                "Adipic anhydride",
                "Azelaic anhydride",
                "Benzoic anhydride",
                "Butyric anhydride",
                "Decanoic anhydride",
                "Glutaric anhydride",
                "Heptanoic anhydride",
                "Hexanoic anhydride",
                "Isobutyric anhydride",
                "Isovaleric anhydride",
                "Maleic anhydride",
                "Nonanoic anhydride",
                "Octanoic anhydride",
                "Phthalic anhydride",
                "Pimelic anhydride",
                "Pivalic anhydride",
                "Propionic anhydride",
                "Sebacic anhydride",
                "Suberic anhydride",
                "Succinic anhydride",
                "Terephthalic anhydride",
                "Trimellitic anhydride",
                "Valeric anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic Anhydride (Ac\u2082O)",
            "Propionic Anhydride",
            "Butyric Anhydride",
            "Isobutyric Anhydride",
            "Valeric Anhydride",
            "Formic Anhydride (Mixed)",
            "Succinic Anhydride",
            "Glutaric Anhydride",
            "Adipic Anhydride",
            "Phthalic Anhydride (PA)",
            "Maleic Anhydride (MA)",
            "Fumaric Anhydride",
            "Citric Anhydride (Mixed)",
            "Trimellitic Anhydride (TMA)",
            "Pyromellitic Dianhydride (PMDA)",
            "Benzoyl Formic Anhydride",
            "Chloroacetyl Chloride Dimer (as anhydride)",
            "Trifluoroacetic Anhydride (TFAA)",
            "p-Toluenesulfonic Anhydride",
            "Methanesulfonic Anhydride",
            "Camphorsulfonic Anhydride",
            "Acetylsuccinic Anhydride",
            "Dodecenylsuccinic Anhydride (DDSA)",
            "Polysebacic Anhydride (PSA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic Anhydride (Ac\u2082O)",
                "Propionic Anhydride",
                "Butyric Anhydride",
                "Isobutyric Anhydride",
                "Valeric Anhydride",
                "Formic Anhydride (Mixed)",
                "Succinic Anhydride",
                "Glutaric Anhydride",
                "Adipic Anhydride",
                "Phthalic Anhydride (PA)",
                "Maleic Anhydride (MA)",
                "Fumaric Anhydride",
                "Citric Anhydride (Mixed)",
                "Trimellitic Anhydride (TMA)",
                "Pyromellitic Dianhydride (PMDA)",
                "Benzoyl Formic Anhydride",
                "Chloroacetyl Chloride Dimer (as anhydride)",
                "Trifluoroacetic Anhydride (TFAA)",
                "p-Toluenesulfonic Anhydride",
                "Methanesulfonic Anhydride",
                "Camphorsulfonic Anhydride",
                "Acetylsuccinic Anhydride",
                "Dodecenylsuccinic Anhydride (DDSA)",
                "Polysebacic Anhydride (PSA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic Anhydride (Ac\u2082O)",
                "Acetylsuccinic Anhydride",
                "Adipic Anhydride",
                "Benzoyl Formic Anhydride",
                "Butyric Anhydride",
                "Camphorsulfonic Anhydride",
                "Chloroacetyl Chloride Dimer (as anhydride)",
                "Citric Anhydride (Mixed)",
                "Dodecenylsuccinic Anhydride (DDSA)",
                "Formic Anhydride (Mixed)",
                "Fumaric Anhydride",
                "Glutaric Anhydride",
                "Isobutyric Anhydride",
                "Maleic Anhydride (MA)",
                "Methanesulfonic Anhydride",
                "Phthalic Anhydride (PA)",
                "Polysebacic Anhydride (PSA)",
                "Propionic Anhydride",
                "Pyromellitic Dianhydride (PMDA)",
                "Succinic Anhydride",
                "Trifluoroacetic Anhydride (TFAA)",
                "Trimellitic Anhydride (TMA)",
                "Valeric Anhydride",
                "p-Toluenesulfonic Anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Propionic anhydride",
            "Butyric anhydride",
            "Isobutyric anhydride",
            "Valeric anhydride",
            "Hexanoic anhydride",
            "Benzoic anhydride",
            "Maleic anhydride",
            "Succinic anhydride",
            "Phthalic anhydride",
            "Glutaric anhydride",
            "Adipic anhydride",
            "Trimellitic anhydride",
            "Lauric anhydride",
            "Stearic anhydride",
            "Palmitic anhydride",
            "Myristic anhydride",
            "Sebacic anhydride",
            "Terephthalic anhydride",
            "Trifluoroacetic anhydride (TFAA)",
            "Methanesulfonic anhydride",
            "Ethyl chloroformate",
            "Isatoic anhydride",
            "Naphthalic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Propionic anhydride",
                "Butyric anhydride",
                "Isobutyric anhydride",
                "Valeric anhydride",
                "Hexanoic anhydride",
                "Benzoic anhydride",
                "Maleic anhydride",
                "Succinic anhydride",
                "Phthalic anhydride",
                "Glutaric anhydride",
                "Adipic anhydride",
                "Trimellitic anhydride",
                "Lauric anhydride",
                "Stearic anhydride",
                "Palmitic anhydride",
                "Myristic anhydride",
                "Sebacic anhydride",
                "Terephthalic anhydride",
                "Trifluoroacetic anhydride (TFAA)",
                "Methanesulfonic anhydride",
                "Ethyl chloroformate",
                "Isatoic anhydride",
                "Naphthalic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (Ac2O)",
                "Adipic anhydride",
                "Benzoic anhydride",
                "Butyric anhydride",
                "Ethyl chloroformate",
                "Glutaric anhydride",
                "Hexanoic anhydride",
                "Isatoic anhydride",
                "Isobutyric anhydride",
                "Lauric anhydride",
                "Maleic anhydride",
                "Methanesulfonic anhydride",
                "Myristic anhydride",
                "Naphthalic anhydride",
                "Palmitic anhydride",
                "Phthalic anhydride",
                "Propionic anhydride",
                "Sebacic anhydride",
                "Stearic anhydride",
                "Succinic anhydride",
                "Terephthalic anhydride",
                "Trifluoroacetic anhydride (TFAA)",
                "Trimellitic anhydride",
                "Valeric anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Phthalic anhydride (C8H4O3)",
            "Succinic anhydride (C4H4O3)",
            "Maleic anhydride (C4H2O3)",
            "Glutaric anhydride (C5H6O3)",
            "Benzene-1,2-dicarboxylic anhydride (C8H4O3)",
            "Trimellitic anhydride (C9H6O5)",
            "Cyclic anhydride of citric acid (C6H8O7)",
            "Adipic anhydride (C6H8O3)",
            "Salicylic anhydride (C7H6O3)",
            "Itaconic anhydride (C5H6O3)",
            "Diglycolic anhydride (C4H6O3)",
            "Methyl succinic anhydride (C5H6O3)",
            "Terephthalic anhydride (C8H4O3)",
            "Dodecanedioic anhydride (C12H20O3)",
            "Hexahydrophthalic anhydride (C8H10O3)",
            "Isophthalic anhydride (C8H4O3)",
            "3,4-Epoxytetrahydrofuran-2,5-dione (C4H4O3)",
            "Naphthalene-1,2-dicarboxylic anhydride (C10H6O3)",
            "2,3-Dihydro-1H-pyrrole-2,5-dione (C4H5NO2)",
            "2-Phenyl-2-methyl-1,3-dioxolane-4,5-dione (C10H10O4)",
            "3,4-Dimethyl-3-cyclobutene-1,2-dione (C6H8O2)",
            "1,2:3,4-Di-O-isopropylidene-D-mannitol anhydride (C15H26O7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Phthalic anhydride (C8H4O3)",
                "Succinic anhydride (C4H4O3)",
                "Maleic anhydride (C4H2O3)",
                "Glutaric anhydride (C5H6O3)",
                "Benzene-1,2-dicarboxylic anhydride (C8H4O3)",
                "Trimellitic anhydride (C9H6O5)",
                "Cyclic anhydride of citric acid (C6H8O7)",
                "Adipic anhydride (C6H8O3)",
                "Salicylic anhydride (C7H6O3)",
                "Itaconic anhydride (C5H6O3)",
                "Diglycolic anhydride (C4H6O3)",
                "Methyl succinic anhydride (C5H6O3)",
                "Terephthalic anhydride (C8H4O3)",
                "Dodecanedioic anhydride (C12H20O3)",
                "Hexahydrophthalic anhydride (C8H10O3)",
                "Isophthalic anhydride (C8H4O3)",
                "3,4-Epoxytetrahydrofuran-2,5-dione (C4H4O3)",
                "Naphthalene-1,2-dicarboxylic anhydride (C10H6O3)",
                "2,3-Dihydro-1H-pyrrole-2,5-dione (C4H5NO2)",
                "2-Phenyl-2-methyl-1,3-dioxolane-4,5-dione (C10H10O4)",
                "3,4-Dimethyl-3-cyclobutene-1,2-dione (C6H8O2)",
                "1,2:3,4-Di-O-isopropylidene-D-mannitol anhydride (C15H26O7)"
            ],
            "mismatches": [],
            "true_referents": [
                "1,2:3,4-Di-O-isopropylidene-D-mannitol anhydride (C15H26O7)",
                "2,3-Dihydro-1H-pyrrole-2,5-dione (C4H5NO2)",
                "2-Phenyl-2-methyl-1,3-dioxolane-4,5-dione (C10H10O4)",
                "3,4-Dimethyl-3-cyclobutene-1,2-dione (C6H8O2)",
                "3,4-Epoxytetrahydrofuran-2,5-dione (C4H4O3)",
                "Acetic anhydride (Ac2O)",
                "Adipic anhydride (C6H8O3)",
                "Benzene-1,2-dicarboxylic anhydride (C8H4O3)",
                "Cyclic anhydride of citric acid (C6H8O7)",
                "Diglycolic anhydride (C4H6O3)",
                "Dodecanedioic anhydride (C12H20O3)",
                "Glutaric anhydride (C5H6O3)",
                "Hexahydrophthalic anhydride (C8H10O3)",
                "Isophthalic anhydride (C8H4O3)",
                "Itaconic anhydride (C5H6O3)",
                "Maleic anhydride (C4H2O3)",
                "Methyl succinic anhydride (C5H6O3)",
                "Naphthalene-1,2-dicarboxylic anhydride (C10H6O3)",
                "Phthalic anhydride (C8H4O3)",
                "Salicylic anhydride (C7H6O3)",
                "Succinic anhydride (C4H4O3)",
                "Terephthalic anhydride (C8H4O3)",
                "Trimellitic anhydride (C9H6O5)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (AA)",
            "Maleic anhydride (MA)",
            "Phthalic anhydride (PA)",
            "Succinic anhydride (SA)",
            "Glutaric anhydride (GA)",
            "Hexahydrophthalic anhydride (HHPA)",
            "Methyltetrahydrophthalic anhydride (MTHPA)",
            "Trimellitic anhydride (TMA)",
            "Pyromellitic dianhydride (PMDA)",
            "Naphthalic anhydride (NA)",
            "Dodecenylsuccinic anhydride (DDSA)",
            "Hexahydrotrimellitic anhydride (HHTA)",
            "Tetrachlorophthalic anhydride (TCPA)",
            "Chlorendic anhydride (CA)",
            "Tetrahydrophthalic anhydride (THPA)",
            "Endomethylene tetrahydrophthalic anhydride (EMTHPA)",
            "Dodecylsuccinic anhydride (DDA)",
            "Octadecenylsuccinic anhydride (ODSA)",
            "Benzoic anhydride (BA)",
            "Propionic anhydride (PA)",
            "Butyric anhydride (BA)",
            "Valeric anhydride (VA)",
            "Caproic anhydride (CA)",
            "Enanthic anhydride (EA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (AA)",
                "Maleic anhydride (MA)",
                "Phthalic anhydride (PA)",
                "Succinic anhydride (SA)",
                "Glutaric anhydride (GA)",
                "Hexahydrophthalic anhydride (HHPA)",
                "Methyltetrahydrophthalic anhydride (MTHPA)",
                "Trimellitic anhydride (TMA)",
                "Pyromellitic dianhydride (PMDA)",
                "Naphthalic anhydride (NA)",
                "Dodecenylsuccinic anhydride (DDSA)",
                "Hexahydrotrimellitic anhydride (HHTA)",
                "Tetrachlorophthalic anhydride (TCPA)",
                "Chlorendic anhydride (CA)",
                "Tetrahydrophthalic anhydride (THPA)",
                "Endomethylene tetrahydrophthalic anhydride (EMTHPA)",
                "Dodecylsuccinic anhydride (DDA)",
                "Octadecenylsuccinic anhydride (ODSA)",
                "Benzoic anhydride (BA)",
                "Propionic anhydride (PA)",
                "Butyric anhydride (BA)",
                "Valeric anhydride (VA)",
                "Caproic anhydride (CA)",
                "Enanthic anhydride (EA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (AA)",
                "Benzoic anhydride (BA)",
                "Butyric anhydride (BA)",
                "Caproic anhydride (CA)",
                "Chlorendic anhydride (CA)",
                "Dodecenylsuccinic anhydride (DDSA)",
                "Dodecylsuccinic anhydride (DDA)",
                "Enanthic anhydride (EA)",
                "Endomethylene tetrahydrophthalic anhydride (EMTHPA)",
                "Glutaric anhydride (GA)",
                "Hexahydrophthalic anhydride (HHPA)",
                "Hexahydrotrimellitic anhydride (HHTA)",
                "Maleic anhydride (MA)",
                "Methyltetrahydrophthalic anhydride (MTHPA)",
                "Naphthalic anhydride (NA)",
                "Octadecenylsuccinic anhydride (ODSA)",
                "Phthalic anhydride (PA)",
                "Propionic anhydride (PA)",
                "Pyromellitic dianhydride (PMDA)",
                "Succinic anhydride (SA)",
                "Tetrachlorophthalic anhydride (TCPA)",
                "Tetrahydrophthalic anhydride (THPA)",
                "Trimellitic anhydride (TMA)",
                "Valeric anhydride (VA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride",
            "Propionic anhydride",
            "Butyric anhydride",
            "Isobutyric anhydride",
            "Valeric anhydride",
            "Isocaproic anhydride",
            "Caproic anhydride",
            "Heptanoic anhydride",
            "Caprylic anhydride",
            "Nonanoic anhydride",
            "Decanoic anhydride",
            "Lauric anhydride",
            "Myristic anhydride",
            "Palmitic anhydride",
            "Stearic anhydride",
            "Oleic anhydride",
            "Linoleic anhydride",
            "Linolenic anhydride",
            "Arachidonic anhydride",
            "Dodecanoic anhydride",
            "Tetradecanoic anhydride",
            "Hexadecanoic anhydride",
            "Octadecanoic anhydride",
            "Eicosanoic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride",
                "Propionic anhydride",
                "Butyric anhydride",
                "Isobutyric anhydride",
                "Valeric anhydride",
                "Isocaproic anhydride",
                "Caproic anhydride",
                "Heptanoic anhydride",
                "Caprylic anhydride",
                "Nonanoic anhydride",
                "Decanoic anhydride",
                "Lauric anhydride",
                "Myristic anhydride",
                "Palmitic anhydride",
                "Stearic anhydride",
                "Oleic anhydride",
                "Linoleic anhydride",
                "Linolenic anhydride",
                "Arachidonic anhydride",
                "Dodecanoic anhydride",
                "Tetradecanoic anhydride",
                "Hexadecanoic anhydride",
                "Octadecanoic anhydride",
                "Eicosanoic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride",
                "Arachidonic anhydride",
                "Butyric anhydride",
                "Caproic anhydride",
                "Caprylic anhydride",
                "Decanoic anhydride",
                "Dodecanoic anhydride",
                "Eicosanoic anhydride",
                "Heptanoic anhydride",
                "Hexadecanoic anhydride",
                "Isobutyric anhydride",
                "Isocaproic anhydride",
                "Lauric anhydride",
                "Linoleic anhydride",
                "Linolenic anhydride",
                "Myristic anhydride",
                "Nonanoic anhydride",
                "Octadecanoic anhydride",
                "Oleic anhydride",
                "Palmitic anhydride",
                "Propionic anhydride",
                "Stearic anhydride",
                "Tetradecanoic anhydride",
                "Valeric anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac\u2082O)",
            "Maleic anhydride",
            "Phthalic anhydride",
            "Succinic anhydride",
            "Adipic anhydride",
            "Itaconic anhydride",
            "Trimellitic anhydride",
            "Isophthalic anhydride",
            "Pyromellitic anhydride",
            "Glutaric anhydride",
            "Malonic anhydride",
            "Fumaric anhydride",
            "Napthalic anhydride",
            "Tetrahydrophthalic anhydride",
            "3,3'-Diphenylpropionic anhydride",
            "Citric anhydride",
            "Meldrum's acid",
            "Benzoic anhydride",
            "Hexanedioic anhydride",
            "Cyclopentanetricarboxylic anhydride",
            "Glycolic anhydride",
            "Oxydiphthalic anhydride",
            "Phthalic anhydride dimethyl ester",
            "Dodecanedioic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac\u2082O)",
                "Maleic anhydride",
                "Phthalic anhydride",
                "Succinic anhydride",
                "Adipic anhydride",
                "Itaconic anhydride",
                "Trimellitic anhydride",
                "Isophthalic anhydride",
                "Pyromellitic anhydride",
                "Glutaric anhydride",
                "Malonic anhydride",
                "Fumaric anhydride",
                "Napthalic anhydride",
                "Tetrahydrophthalic anhydride",
                "3,3'-Diphenylpropionic anhydride",
                "Citric anhydride",
                "Meldrum's acid",
                "Benzoic anhydride",
                "Hexanedioic anhydride",
                "Cyclopentanetricarboxylic anhydride",
                "Glycolic anhydride",
                "Oxydiphthalic anhydride",
                "Phthalic anhydride dimethyl ester",
                "Dodecanedioic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "3,3'-Diphenylpropionic anhydride",
                "Acetic anhydride (Ac\u2082O)",
                "Adipic anhydride",
                "Benzoic anhydride",
                "Citric anhydride",
                "Cyclopentanetricarboxylic anhydride",
                "Dodecanedioic anhydride",
                "Fumaric anhydride",
                "Glutaric anhydride",
                "Glycolic anhydride",
                "Hexanedioic anhydride",
                "Isophthalic anhydride",
                "Itaconic anhydride",
                "Maleic anhydride",
                "Malonic anhydride",
                "Meldrum's acid",
                "Napthalic anhydride",
                "Oxydiphthalic anhydride",
                "Phthalic anhydride",
                "Phthalic anhydride dimethyl ester",
                "Pyromellitic anhydride",
                "Succinic anhydride",
                "Tetrahydrophthalic anhydride",
                "Trimellitic anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Maleic anhydride",
            "Succinic anhydride",
            "Phthalic anhydride",
            "Propionic anhydride",
            "Butyric anhydride",
            "Glutaric anhydride",
            "Benzoic anhydride",
            "Trifluoroacetic anhydride (TFAA)",
            "Citraconic anhydride",
            "Itaconic anhydride",
            "Trimellitic anhydride",
            "Pyromellitic dianhydride",
            "Naphthalic anhydride",
            "Hexahydrophthalic anhydride",
            "Methylhexahydrophthalic anhydride",
            "Tetrachlorophthalic anhydride",
            "Dodecenylsuccinic anhydride",
            "Methyltetrahydrophthalic anhydride",
            "Nadic methyl anhydride",
            "Chlorendic anhydride",
            "Dichloromaleic anhydride",
            "Methylnadic anhydride",
            "Tetrahydrophthalic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Maleic anhydride",
                "Succinic anhydride",
                "Phthalic anhydride",
                "Propionic anhydride",
                "Butyric anhydride",
                "Glutaric anhydride",
                "Benzoic anhydride",
                "Trifluoroacetic anhydride (TFAA)",
                "Citraconic anhydride",
                "Itaconic anhydride",
                "Trimellitic anhydride",
                "Pyromellitic dianhydride",
                "Naphthalic anhydride",
                "Hexahydrophthalic anhydride",
                "Methylhexahydrophthalic anhydride",
                "Tetrachlorophthalic anhydride",
                "Dodecenylsuccinic anhydride",
                "Methyltetrahydrophthalic anhydride",
                "Nadic methyl anhydride",
                "Chlorendic anhydride",
                "Dichloromaleic anhydride",
                "Methylnadic anhydride",
                "Tetrahydrophthalic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (Ac2O)",
                "Benzoic anhydride",
                "Butyric anhydride",
                "Chlorendic anhydride",
                "Citraconic anhydride",
                "Dichloromaleic anhydride",
                "Dodecenylsuccinic anhydride",
                "Glutaric anhydride",
                "Hexahydrophthalic anhydride",
                "Itaconic anhydride",
                "Maleic anhydride",
                "Methylhexahydrophthalic anhydride",
                "Methylnadic anhydride",
                "Methyltetrahydrophthalic anhydride",
                "Nadic methyl anhydride",
                "Naphthalic anhydride",
                "Phthalic anhydride",
                "Propionic anhydride",
                "Pyromellitic dianhydride",
                "Succinic anhydride",
                "Tetrachlorophthalic anhydride",
                "Tetrahydrophthalic anhydride",
                "Trifluoroacetic anhydride (TFAA)",
                "Trimellitic anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (Ac2O)",
            "Trifluoroacetic anhydride (TFAA)",
            "Maleic anhydride",
            "Succinic anhydride",
            "Phthalic anhydride",
            "Glutaric anhydride",
            "Propionic anhydride",
            "Benzoic anhydride",
            "Citraconic anhydride",
            "Itaconic anhydride",
            "Butyric anhydride",
            "Valeric anhydride",
            "Hexanoic anhydride",
            "Heptanoic anhydride",
            "Octanoic anhydride",
            "Nonanoic anhydride",
            "Decanoic anhydride",
            "Dodecanoic anhydride",
            "Tetradecanoic anhydride",
            "Hexadecanoic anhydride",
            "Octadecanoic anhydride",
            "Eicosanoic anhydride",
            "Docosanoic anhydride",
            "Tetracosanoic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (Ac2O)",
                "Trifluoroacetic anhydride (TFAA)",
                "Maleic anhydride",
                "Succinic anhydride",
                "Phthalic anhydride",
                "Glutaric anhydride",
                "Propionic anhydride",
                "Benzoic anhydride",
                "Citraconic anhydride",
                "Itaconic anhydride",
                "Butyric anhydride",
                "Valeric anhydride",
                "Hexanoic anhydride",
                "Heptanoic anhydride",
                "Octanoic anhydride",
                "Nonanoic anhydride",
                "Decanoic anhydride",
                "Dodecanoic anhydride",
                "Tetradecanoic anhydride",
                "Hexadecanoic anhydride",
                "Octadecanoic anhydride",
                "Eicosanoic anhydride",
                "Docosanoic anhydride",
                "Tetracosanoic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (Ac2O)",
                "Benzoic anhydride",
                "Butyric anhydride",
                "Citraconic anhydride",
                "Decanoic anhydride",
                "Docosanoic anhydride",
                "Dodecanoic anhydride",
                "Eicosanoic anhydride",
                "Glutaric anhydride",
                "Heptanoic anhydride",
                "Hexadecanoic anhydride",
                "Hexanoic anhydride",
                "Itaconic anhydride",
                "Maleic anhydride",
                "Nonanoic anhydride",
                "Octadecanoic anhydride",
                "Octanoic anhydride",
                "Phthalic anhydride",
                "Propionic anhydride",
                "Succinic anhydride",
                "Tetracosanoic anhydride",
                "Tetradecanoic anhydride",
                "Trifluoroacetic anhydride (TFAA)",
                "Valeric anhydride"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (CH3CO)2O",
            "Propionic anhydride (CH3CH2CO)2O",
            "Butyric anhydride (CH3CH2CH2CO)2O",
            "Valeric anhydride (CH3(CH2)3CO)2O",
            "Hexanoic anhydride (CH3(CH2)4CO)2O",
            "Heptanoic anhydride (CH3(CH2)5CO)2O",
            "Octanoic anhydride (CH3(CH2)6CO)2O",
            "Nonanoic anhydride (CH3(CH2)7CO)2O",
            "Decanoic anhydride (CH3(CH2)8CO)2O",
            "Undecanoic anhydride (CH3(CH2)9CO)2O",
            "Dodecanoic anhydride (CH3(CH2)10CO)2O",
            "Tridecanoic anhydride (CH3(CH2)11CO)2O",
            "Tetradecanoic anhydride (CH3(CH2)12CO)2O",
            "Pentadecanoic anhydride (CH3(CH2)13CO)2O",
            "Hexadecanoic anhydride (CH3(CH2)14CO)2O",
            "Heptadecanoic anhydride (CH3(CH2)15CO)2O",
            "Octadecanoic anhydride (CH3(CH2)16CO)2O",
            "Nonadecanoic anhydride (CH3(CH2)17CO)2O",
            "Eicosanoic anhydride (CH3(CH2)18CO)2O",
            "Benzoic anhydride (C6H5CO)2O",
            "Phthalic anhydride (C6H4(CO)2O)",
            "Maleic anhydride (C2H2(CO)2O)",
            "Succinic anhydride (C2H4(CO)2O)",
            "Glutaric anhydride (C3H6(CO)2O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (CH3CO)2O",
                "Propionic anhydride (CH3CH2CO)2O",
                "Butyric anhydride (CH3CH2CH2CO)2O",
                "Valeric anhydride (CH3(CH2)3CO)2O",
                "Hexanoic anhydride (CH3(CH2)4CO)2O",
                "Heptanoic anhydride (CH3(CH2)5CO)2O",
                "Octanoic anhydride (CH3(CH2)6CO)2O",
                "Nonanoic anhydride (CH3(CH2)7CO)2O",
                "Decanoic anhydride (CH3(CH2)8CO)2O",
                "Undecanoic anhydride (CH3(CH2)9CO)2O",
                "Dodecanoic anhydride (CH3(CH2)10CO)2O",
                "Tridecanoic anhydride (CH3(CH2)11CO)2O",
                "Tetradecanoic anhydride (CH3(CH2)12CO)2O",
                "Pentadecanoic anhydride (CH3(CH2)13CO)2O",
                "Hexadecanoic anhydride (CH3(CH2)14CO)2O",
                "Heptadecanoic anhydride (CH3(CH2)15CO)2O",
                "Octadecanoic anhydride (CH3(CH2)16CO)2O",
                "Nonadecanoic anhydride (CH3(CH2)17CO)2O",
                "Eicosanoic anhydride (CH3(CH2)18CO)2O",
                "Benzoic anhydride (C6H5CO)2O",
                "Phthalic anhydride (C6H4(CO)2O)",
                "Maleic anhydride (C2H2(CO)2O)",
                "Succinic anhydride (C2H4(CO)2O)",
                "Glutaric anhydride (C3H6(CO)2O)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (CH3CO)2O",
                "Benzoic anhydride (C6H5CO)2O",
                "Butyric anhydride (CH3CH2CH2CO)2O",
                "Decanoic anhydride (CH3(CH2)8CO)2O",
                "Dodecanoic anhydride (CH3(CH2)10CO)2O",
                "Eicosanoic anhydride (CH3(CH2)18CO)2O",
                "Glutaric anhydride (C3H6(CO)2O)",
                "Heptadecanoic anhydride (CH3(CH2)15CO)2O",
                "Heptanoic anhydride (CH3(CH2)5CO)2O",
                "Hexadecanoic anhydride (CH3(CH2)14CO)2O",
                "Hexanoic anhydride (CH3(CH2)4CO)2O",
                "Maleic anhydride (C2H2(CO)2O)",
                "Nonadecanoic anhydride (CH3(CH2)17CO)2O",
                "Nonanoic anhydride (CH3(CH2)7CO)2O",
                "Octadecanoic anhydride (CH3(CH2)16CO)2O",
                "Octanoic anhydride (CH3(CH2)6CO)2O",
                "Pentadecanoic anhydride (CH3(CH2)13CO)2O",
                "Phthalic anhydride (C6H4(CO)2O)",
                "Propionic anhydride (CH3CH2CO)2O",
                "Succinic anhydride (C2H4(CO)2O)",
                "Tetradecanoic anhydride (CH3(CH2)12CO)2O",
                "Tridecanoic anhydride (CH3(CH2)11CO)2O",
                "Undecanoic anhydride (CH3(CH2)9CO)2O",
                "Valeric anhydride (CH3(CH2)3CO)2O"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (AcO)",
            "Propanoic anhydride (PrO)",
            "Butanoic anhydride (BuO)",
            "Pentanoic anhydride (PeO)",
            "Hexanoic anhydride (HxO)",
            "Heptanoic anhydride (HpO)",
            "Octanoic anhydride (OcO)",
            "Nonanoic anhydride (NO)",
            "Decanoic anhydride (DO)",
            "Undecanoic anhydride (UO)",
            "Dodecanoic anhydride (DdO)",
            "Tridecanoic anhydride (TO)",
            "Tetradecanoic anhydride (TeO)",
            "Pentadecanoic anhydride (PdO)",
            "Hexadecanoic anhydride (HD)",
            "Heptadecanoic anhydride (HpD)",
            "Octadecanoic anhydride (OD)",
            "Nonadecanoic anhydride (ND)",
            "Eicosanoic anhydride (EO)",
            "Maleic anhydride (MA)",
            "Succinic anhydride (SA)",
            "Phthalic anhydride (PA)",
            "Trimellitic anhydride (TA)",
            "Pyromellitic dianhydride (PMDA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (AcO)",
                "Propanoic anhydride (PrO)",
                "Butanoic anhydride (BuO)",
                "Pentanoic anhydride (PeO)",
                "Hexanoic anhydride (HxO)",
                "Heptanoic anhydride (HpO)",
                "Octanoic anhydride (OcO)",
                "Nonanoic anhydride (NO)",
                "Decanoic anhydride (DO)",
                "Undecanoic anhydride (UO)",
                "Dodecanoic anhydride (DdO)",
                "Tridecanoic anhydride (TO)",
                "Tetradecanoic anhydride (TeO)",
                "Pentadecanoic anhydride (PdO)",
                "Hexadecanoic anhydride (HD)",
                "Heptadecanoic anhydride (HpD)",
                "Octadecanoic anhydride (OD)",
                "Nonadecanoic anhydride (ND)",
                "Eicosanoic anhydride (EO)",
                "Maleic anhydride (MA)",
                "Succinic anhydride (SA)",
                "Phthalic anhydride (PA)",
                "Trimellitic anhydride (TA)",
                "Pyromellitic dianhydride (PMDA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetic anhydride (AcO)",
                "Butanoic anhydride (BuO)",
                "Decanoic anhydride (DO)",
                "Dodecanoic anhydride (DdO)",
                "Eicosanoic anhydride (EO)",
                "Heptadecanoic anhydride (HpD)",
                "Heptanoic anhydride (HpO)",
                "Hexadecanoic anhydride (HD)",
                "Hexanoic anhydride (HxO)",
                "Maleic anhydride (MA)",
                "Nonadecanoic anhydride (ND)",
                "Nonanoic anhydride (NO)",
                "Octadecanoic anhydride (OD)",
                "Octanoic anhydride (OcO)",
                "Pentadecanoic anhydride (PdO)",
                "Pentanoic anhydride (PeO)",
                "Phthalic anhydride (PA)",
                "Propanoic anhydride (PrO)",
                "Pyromellitic dianhydride (PMDA)",
                "Succinic anhydride (SA)",
                "Tetradecanoic anhydride (TeO)",
                "Tridecanoic anhydride (TO)",
                "Trimellitic anhydride (TA)",
                "Undecanoic anhydride (UO)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Phthalic anhydride (PA)",
            "Maleic anhydride",
            "Fumaric anhydride",
            "Terephthalic anhydride",
            "Isophthalic anhydride",
            "Adipic anhydride",
            "Sebacic anhydride",
            "Dodecanedioic anhydride",
            "Undecanedioic anhydride",
            "Decanedioic anhydride",
            "Nonanedioic anhydride",
            "Octanedioic anhydride",
            "Heptanedioic anhydride",
            "Hexanedioic anhydride",
            "Pimelic anhydride",
            "Suberic anhydride",
            "Azelaic anhydride",
            "Sebacic anhydride",
            "Dodecanedioic anhydride",
            "Cyclohexane-1,4-dicarboxylic anhydride",
            "Cyclohexane-1,3-dicarboxylic anhydride",
            "Cyclohexane-1,2-dicarboxylic anhydride",
            "Cyclopentane-1,2-dicarboxylic anhydride",
            "Cyclobutane-1,2-dicarboxylic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Phthalic anhydride (PA)",
                "Maleic anhydride",
                "Fumaric anhydride",
                "Terephthalic anhydride",
                "Isophthalic anhydride",
                "Adipic anhydride",
                "Sebacic anhydride",
                "Dodecanedioic anhydride",
                "Undecanedioic anhydride",
                "Decanedioic anhydride",
                "Nonanedioic anhydride",
                "Octanedioic anhydride",
                "Heptanedioic anhydride",
                "Hexanedioic anhydride",
                "Pimelic anhydride",
                "Suberic anhydride",
                "Azelaic anhydride",
                "Cyclohexane-1,4-dicarboxylic anhydride",
                "Cyclohexane-1,3-dicarboxylic anhydride",
                "Cyclohexane-1,2-dicarboxylic anhydride",
                "Cyclopentane-1,2-dicarboxylic anhydride",
                "Cyclobutane-1,2-dicarboxylic anhydride"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipic anhydride",
                "Azelaic anhydride",
                "Cyclobutane-1,2-dicarboxylic anhydride",
                "Cyclohexane-1,2-dicarboxylic anhydride",
                "Cyclohexane-1,3-dicarboxylic anhydride",
                "Cyclohexane-1,4-dicarboxylic anhydride",
                "Cyclopentane-1,2-dicarboxylic anhydride",
                "Decanedioic anhydride",
                "Dodecanedioic anhydride",
                "Fumaric anhydride",
                "Heptanedioic anhydride",
                "Hexanedioic anhydride",
                "Isophthalic anhydride",
                "Maleic anhydride",
                "Nonanedioic anhydride",
                "Octanedioic anhydride",
                "Phthalic anhydride (PA)",
                "Pimelic anhydride",
                "Sebacic anhydride",
                "Suberic anhydride",
                "Terephthalic anhydride",
                "Undecanedioic anhydride"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            "Acetic anhydride (AA)",
            "Propionic anhydride",
            "Butyric anhydride",
            "Valeric anhydride",
            "Caproic anhydride",
            "Enanthic anhydride",
            "Caprylic anhydride",
            "Pelargonic anhydride",
            "Capric anhydride",
            "Undecylic anhydride",
            "Lauric anhydride",
            "Tridecyl anhydride",
            "Myristic anhydride",
            "Pentadecylic anhydride",
            "Palmitic anhydride",
            "Margoric anhydride",
            "Stearic anhydride",
            "Oleic anhydride",
            "Linoleic anhydride",
            "Linolenic anhydride",
            "Arachidic anhydride",
            "Gadoleic anhydride",
            "Behenic anhydride",
            "Lignoceric anhydride",
            "Cerotic anhydride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride (AA)",
                "Propionic anhydride",
                "Butyric anhydride",
                "Valeric anhydride",
                "Caproic anhydride",
                "Enanthic anhydride",
                "Caprylic anhydride",
                "Pelargonic anhydride",
                "Capric anhydride",
                "Undecylic anhydride",
                "Lauric anhydride",
                "Tridecyl anhydride",
                "Myristic anhydride",
                "Pentadecylic anhydride",
                "Palmitic anhydride",
                "Margoric anhydride",
                "Stearic anhydride",
                "Oleic anhydride",
                "Linoleic anhydride",
                "Linolenic anhydride",
                "Arachidic anhydride",
                "Gadoleic anhydride",
                "Behenic anhydride",
                "Lignoceric anhydride"
            ],
            "mismatches": [
                "Cerotic anhydride"
            ],
            "true_referents": [
                "Acetic anhydride (AA)",
                "Arachidic anhydride",
                "Behenic anhydride",
                "Butyric anhydride",
                "Capric anhydride",
                "Caproic anhydride",
                "Caprylic anhydride",
                "Enanthic anhydride",
                "Gadoleic anhydride",
                "Lauric anhydride",
                "Lignoceric anhydride",
                "Linoleic anhydride",
                "Linolenic anhydride",
                "Margoric anhydride",
                "Myristic anhydride",
                "Oleic anhydride",
                "Palmitic anhydride",
                "Pelargonic anhydride",
                "Pentadecylic anhydride",
                "Propionic anhydride",
                "Stearic anhydride",
                "Tridecyl anhydride",
                "Undecylic anhydride",
                "Valeric anhydride"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "carboxylic anhydride",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Acetic anhydride",
                "Canonical name": "Acetic anhydride"
            },
            {
                "Referent": "Benzoyl chloride",
                "Canonical name": "Benzoyl chloride"
            },
            {
                "Referent": "Dimethylglyoxime",
                "Canonical name": "Dimethylglyoxime"
            },
            {
                "Referent": "Diisopropyl ether",
                "Canonical name": "Diisopropyl ether"
            },
            {
                "Referent": "Diphenylacetylene",
                "Canonical name": "Diphenylacetylene"
            },
            {
                "Referent": "Ethyl acetate",
                "Canonical name": "Ethyl acetate"
            },
            {
                "Referent": "Ethyl benzene",
                "Canonical name": "Ethyl benzene"
            },
            {
                "Referent": "Ethyl formate",
                "Canonical name": "Ethyl formate"
            },
            {
                "Referent": "Ethyl propionate",
                "Canonical name": "Ethyl propionate"
            },
            {
                "Referent": "Ethyl valerate",
                "Canonical name": "Ethyl valerate"
            },
            {
                "Referent": "Methyl acetate",
                "Canonical name": "Methyl acetate"
            },
            {
                "Referent": "Methyl propionate",
                "Canonical name": "Methyl propionate"
            },
            {
                "Referent": "Methyl valerate",
                "Canonical name": "Methyl valerate"
            },
            {
                "Referent": "Propionic anhydride",
                "Canonical name": "Propionic anhydride"
            },
            {
                "Referent": "Vinyl acetate",
                "Canonical name": "Vinyl acetate"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetic anhydride",
                "Benzoyl chloride",
                "Dimethylglyoxime",
                "Diisopropyl ether",
                "Diphenylacetylene",
                "Ethyl acetate",
                "Ethyl benzene",
                "Ethyl formate",
                "Ethyl propionate",
                "Ethyl valerate",
                "Methyl acetate",
                "Methyl propionate",
                "Methyl valerate",
                "Propionic anhydride",
                "Vinyl acetate"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Acetic anhydride\", \"Canonical name\": \"Acetic anhydride\"}",
                "{\"Referent\": \"Benzoyl chloride\", \"Canonical name\": \"Benzoyl chloride\"}",
                "{\"Referent\": \"Diisopropyl ether\", \"Canonical name\": \"Diisopropyl ether\"}",
                "{\"Referent\": \"Dimethylglyoxime\", \"Canonical name\": \"Dimethylglyoxime\"}",
                "{\"Referent\": \"Diphenylacetylene\", \"Canonical name\": \"Diphenylacetylene\"}",
                "{\"Referent\": \"Ethyl acetate\", \"Canonical name\": \"Ethyl acetate\"}",
                "{\"Referent\": \"Ethyl benzene\", \"Canonical name\": \"Ethyl benzene\"}",
                "{\"Referent\": \"Ethyl formate\", \"Canonical name\": \"Ethyl formate\"}",
                "{\"Referent\": \"Ethyl propionate\", \"Canonical name\": \"Ethyl propionate\"}",
                "{\"Referent\": \"Ethyl valerate\", \"Canonical name\": \"Ethyl valerate\"}",
                "{\"Referent\": \"Methyl acetate\", \"Canonical name\": \"Methyl acetate\"}",
                "{\"Referent\": \"Methyl propionate\", \"Canonical name\": \"Methyl propionate\"}",
                "{\"Referent\": \"Methyl valerate\", \"Canonical name\": \"Methyl valerate\"}",
                "{\"Referent\": \"Propionic anhydride\", \"Canonical name\": \"Propionic anhydride\"}",
                "{\"Referent\": \"Vinyl acetate\", \"Canonical name\": \"Vinyl acetate\"}"
            ],
            "TP": 15,
            "FP": 0,
            "FN": 0
        }
    }
]