[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "methane (CH4)",
            "ethane (C2H6)",
            "propane (C3H8)",
            "butane (C4H10)",
            "pentane (C5H12)",
            "hexane (C6H14)",
            "heptane (C7H16)",
            "octane (C8H18)",
            "nonane (C9H20)",
            "decane (C10H22)",
            "undecane (C11H24)",
            "dodecane (C12H26)",
            "pentadecane (C15H32)",
            "hexadecane (C16H34)",
            "heptadecane (C17H36)",
            "octadecane (C18H38)",
            "nonadecane (C19H40)",
            "eicosane (C20H42)",
            "docosane (C22H46)",
            "tetracosane (C24H50)",
            "hexacosane (C26H54)",
            "octacosane (C28H58)",
            "triacontane (C30H62)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methane (CH4)",
                "ethane (C2H6)",
                "butane (C4H10)",
                "pentane (C5H12)",
                "hexane (C6H14)",
                "heptane (C7H16)",
                "octane (C8H18)",
                "nonane (C9H20)",
                "decane (C10H22)",
                "undecane (C11H24)",
                "dodecane (C12H26)",
                "pentadecane (C15H32)",
                "hexadecane (C16H34)",
                "heptadecane (C17H36)",
                "octadecane (C18H38)",
                "nonadecane (C19H40)",
                "docosane (C22H46)",
                "tetracosane (C24H50)",
                "hexacosane (C26H54)",
                "octacosane (C28H58)",
                "triacontane (C30H62)"
            ],
            "mismatches": [
                "propane (C3H8)",
                "eicosane (C20H42)"
            ],
            "true_referents": [
                "(E)-2-dodecene",
                "(E,Z)-2,4-Dodecadiene",
                "1,2-octacosanediol",
                "1,4-Undecadiene",
                "1-Hexacosene",
                "1-docosene",
                "1-hexene",
                "1-pentadecene",
                "10-Eicosene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,6,8-trimethyldecane",
                "2,6-dimethylheptadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "Eicosene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Tetracosene",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "butane",
                "butene",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexacosane",
                "hexadecane",
                "hexane",
                "hexatriacontane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octacosane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "propene",
                "tetracosane",
                "triacontane",
                "tritriacontane",
                "undecane"
            ],
            "TP": 21,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Cyclopropane (C3H6)",
            "Cyclobutane (C4H8)",
            "Cyclopentane (C5H10)",
            "Cyclohexane (C6H12)",
            "Cycloheptane (C7H14)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane",
                "Ethane",
                "Butane",
                "Pentane",
                "Hexane",
                "Heptane",
                "Octane",
                "Nonane",
                "Decane",
                "Undecane",
                "Dodecane",
                "Tridecane",
                "Tetradecane",
                "Pentadecane",
                "Hexadecane",
                "Heptadecane",
                "Octadecane",
                "Nonadecane",
                "Cyclopropane",
                "Cyclobutane",
                "Cyclopentane",
                "Cyclohexane"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Cycloheptane (C7H14)"
            ],
            "true_referents": [
                "(E)-2-dodecene",
                "(E,Z)-2,4-Dodecadiene",
                "1,2,4-trimethyl-Cyclopentane",
                "1,4-Undecadiene",
                "1-hexene",
                "1-pentadecene",
                "10-Eicosene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,6,8-trimethyldecane",
                "2,6-dimethylheptadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "Eicosene",
                "Ethylcyclopentane",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "butane",
                "butene",
                "cyclobutane",
                "cyclobutene",
                "cyclohexane",
                "cyclohexene",
                "cyclopentane",
                "cyclopropane",
                "cyclopropene",
                "decane",
                "dodecane",
                "ethane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "propene",
                "tetradecane",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH\u2084)",
            "Ethane (C\u2082H\u2086)",
            "Propane (C\u2083H\u2088)",
            "Butane (C\u2084H\u2081\u2080)",
            "Pentane (C\u2085H\u2081\u2082)",
            "Hexane (C\u2086H\u2081\u2084)",
            "Heptane (C\u2087H\u2081\u2086)",
            "Octane (C\u2088H\u2081\u2088)",
            "Nonane (C\u2089H\u2082\u2080)",
            "Decane (C\u2081\u2080H\u2082\u2082)",
            "Ethene (C\u2082H\u2084)",
            "Propene (C\u2083H\u2086)",
            "Butene (C\u2084H\u2088)",
            "Pentene (C\u2085H\u2081\u2080)",
            "Hexene (C\u2086H\u2081\u2082)",
            "Heptene (C\u2087H\u2081\u2084)",
            "Octene (C\u2088H\u2081\u2086)",
            "Nonene (C\u2089H\u2081\u2088)",
            "Decene (C\u2081\u2080H\u2082\u2080)",
            "Ethyne (C\u2082H\u2082)",
            "Propyne (C\u2083H\u2084)",
            "Butyne (C\u2084H\u2086)",
            "Pentyne (C\u2085H\u2088)",
            "Hexyne (C\u2086H\u2081\u2080)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methane",
                "ethane",
                "propane",
                "butane",
                "pentane",
                "hexane",
                "heptane",
                "octane",
                "nonane",
                "decane",
                "ethene",
                "propene",
                "butene",
                "propyne"
            ],
            "mismatches": [
                "pentene",
                "hexene",
                "heptene",
                "octene",
                "nonene",
                "decene",
                "ethyne",
                "butyne",
                "pentyne",
                "hexyne"
            ],
            "true_referents": [
                "(E)-2-octene",
                "(E)-3,4-dimethyl-2-Pentene",
                "(E)-3-penten-1-yne",
                "1-Heptene",
                "1-Pentene",
                "1-decene",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "1-hexyne",
                "1-nonene",
                "1-octene",
                "2,4-Dimethyl-2-pentene",
                "2,4-dimethyl-1-heptene",
                "2,4-dimethylhexane",
                "2-Heptene",
                "2-Hexene",
                "2-methyl-1-Decene",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-hexene",
                "3-penten-1-yne",
                "4,6,8-trimethyl-1-nonene",
                "5,6-dimethyl-Decane",
                "6-ethyl-2-methyl-Octane",
                "6-methyl- 4E-decene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "acene",
                "acetylene",
                "alkane",
                "alkyne",
                "benzene-d6",
                "but-1-ene",
                "buta-1,3-diyne",
                "butadiene",
                "butane",
                "butene",
                "decane",
                "ethane",
                "ethene",
                "ethylbenzene",
                "heptadecane",
                "heptane",
                "hexa-1,5-diyne",
                "hexane",
                "hexaphene",
                "isopentane",
                "methane",
                "nonacene",
                "nonane",
                "octane",
                "octene",
                "pentane",
                "propane",
                "propene",
                "propyne"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Ethylene (C2H4)",
            "Propylene (C3H6)",
            "Butylene (C4H8)",
            "Acetylene (C2H2)",
            "Benzene (C6H6)",
            "Cyclohexane (C6H12)",
            "Toluene (C7H8)",
            "Xylene (C8H10)",
            "Naphthalene (C10H8)",
            "Anthracene (C14H10)",
            "Phenanthrene (C14H10)",
            "Tetralin (C10H12)",
            "Decalin (C10H18)",
            "Camphor (C10H16O) - *Note: While it contains Oxygen, the core structure is carbon and hydrogen*"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Acetylene (C2H2)",
                "Benzene (C6H6)",
                "Cyclohexane (C6H12)",
                "Toluene (C7H8)",
                "Xylene (C8H10)",
                "Naphthalene (C10H8)",
                "Anthracene (C14H10)",
                "Phenanthrene (C14H10)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Ethylene (C2H4)",
                "Propylene (C3H6)",
                "Butylene (C4H8)",
                "Tetralin (C10H12)",
                "Decalin (C10H18)",
                "Camphor (C10H16O) - *Note: While it contains Oxygen, the core structure is carbon and hydrogen*"
            ],
            "true_referents": [
                "(1-Ethylpropyl)benzene",
                "(8S,10S)-8,10-Dimethyl-1(9)-octalin",
                "(E)-7-Tetradecene",
                "1,9-Decadiene",
                "1-decene",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "2,3-dimethylpentane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "4-ethyl-1-hexene",
                "5,6-dimethyl-Decane",
                "Naphtho[2,3-e]pyrene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "acene",
                "acetylene",
                "acyclic acetylene",
                "alkane",
                "anthracene",
                "benzene",
                "benzene-d6",
                "butadiene",
                "butane",
                "butene",
                "butylbenzene",
                "cyclohexane",
                "cyclohexene",
                "decane",
                "ethane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isopentane",
                "methane",
                "monocyclic hydrocarbon",
                "naphthalene",
                "nonane",
                "o-xylene",
                "octane",
                "p-xylene",
                "pentane",
                "phenanthrene",
                "propene",
                "pyranthrene",
                "tetramethylbenzene",
                "toluene",
                "toluene-d8",
                "xylene"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Ethylene (C2H4)",
            "Acetylene (C2H2)",
            "Benzene (C6H6)",
            "Toluene (C7H8)",
            "Xylene (C8H10)",
            "Cyclohexane (C6H12)",
            "Cyclopentane (C5H10)",
            "Ethylene (C2H4)",
            "Propylene (C3H6)",
            "Butadiene (C4H6)",
            "Isobutane (C4H10)",
            "Isopentane (C5H12)",
            "Neopentane (C5H12)",
            "Styrene (C8H8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Acetylene (C2H2)",
                "Benzene (C6H6)",
                "Toluene (C7H8)",
                "Xylene (C8H10)",
                "Cyclohexane (C6H12)",
                "Cyclopentane (C5H10)",
                "Butadiene (C4H6)",
                "Isobutane (C4H10)",
                "Isopentane (C5H12)",
                "Neopentane (C5H12)",
                "Styrene (C8H8)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Ethylene (C2H4)",
                "Propylene (C3H6)"
            ],
            "true_referents": [
                "1,2,4-trimethyl-Cyclopentane",
                "1,4-diphenylbutadiene",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "4-ethyl-1-hexene",
                "5,6-dimethyl-Decane",
                "Ethylcyclopentane",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "acene",
                "acetylene",
                "acyclic acetylene",
                "alkane",
                "benzene",
                "benzene-d6",
                "butadiene",
                "butane",
                "butene",
                "cyclohexane",
                "cyclohexene",
                "cyclopentane",
                "decane",
                "ethane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isooctane",
                "isopentane",
                "methane",
                "neopentane",
                "nonane",
                "o-xylene",
                "octane",
                "p-xylene",
                "pentane",
                "propene",
                "styrene",
                "toluene",
                "toluene-d8",
                "xylene"
            ],
            "TP": 20,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "(9Z)-tricosene",
                "(E)-2-dodecene",
                "(E,Z)-2,4-Dodecadiene",
                "1,4-Undecadiene",
                "1-docosene",
                "1-hexene",
                "1-pentadecene",
                "10-Eicosene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,6,8-trimethyldecane",
                "2,6-dimethylheptadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "7Z-Heneicosene",
                "8E-Heneicosene",
                "9-Methylnonadecane",
                "Eicosene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Tetracosene",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "butane",
                "butene",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "propene",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tricosene",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Cyclohexane (C6H12)",
            "Cyclopentane (C5H10)",
            "Cyclopropane (C3H6)",
            "Cyclobutane (C4H8)",
            "Cycloheptane (C7H14)",
            "Cyclooctane (C8H16)",
            "Cyclononane (C9H18)",
            "Cyclodecane (C10H20)",
            "Benzene (C6H6)",
            "Toluene (C7H8)",
            "Xylene (C8H10)",
            "Naphthalene (C10H8)",
            "Anthracene (C14H10)",
            "Phenanthrene (C14H10)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Cyclohexane (C6H12)",
                "Cyclopropane (C3H6)",
                "Cyclobutane (C4H8)",
                "Cyclooctane (C8H16)",
                "Benzene (C6H6)",
                "Toluene (C7H8)",
                "Xylene (C8H10)",
                "Naphthalene (C10H8)",
                "Anthracene (C14H10)",
                "Phenanthrene (C14H10)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Cyclopentane (C5H10)",
                "Cycloheptane (C7H14)",
                "Cyclononane (C9H18)",
                "Cyclodecane (C10H20)"
            ],
            "true_referents": [
                "1,2,4-trimethyl-Cyclopentane",
                "1-Cyclohexyldecane",
                "1-Cyclohexylhexadecane",
                "1-hexene",
                "2,3-dimethylpentane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "4,6-dimethyldodecane",
                "5,6-dimethyl-Decane",
                "Cycloheptene",
                "Cyclooctane",
                "Ethylcyclopentane",
                "Naphtho[2,3-e]pyrene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "acene",
                "alkane",
                "anthracene",
                "benzene",
                "benzene-d6",
                "butane",
                "butene",
                "cyclobutane",
                "cyclobutene",
                "cyclodecyne",
                "cyclohepta-1,3,5-triene",
                "cyclohexane",
                "cyclohexene",
                "cyclononyne",
                "cyclooctatriene",
                "cyclooctene",
                "cyclopentane",
                "cyclopropane",
                "cyclopropene",
                "decane",
                "ethane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isopentane",
                "methane",
                "naphthalene",
                "nonane",
                "o-xylene",
                "octane",
                "p-xylene",
                "pentane",
                "phenanthrene",
                "propene",
                "toluene",
                "toluene-d8",
                "xylene"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Benzene (C6H6)",
            "Toluene (C7H8)",
            "Xylene (C8H10)",
            "Cyclohexane (C6H12)",
            "Ethene (C2H4)",
            "Propene (C3H6)",
            "Butene (C4H8)",
            "Pentene (C5H10)",
            "Hexene (C6H12)",
            "Heptene (C7H14)",
            "Octene (C8H16)",
            "Nonene (C9H18)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane",
                "Ethane",
                "Pentane",
                "Hexane",
                "Heptane",
                "Octane",
                "Nonane",
                "Decane",
                "Undecane",
                "Dodecane",
                "Benzene",
                "Toluene",
                "Xylene",
                "Cyclohexane",
                "Ethene",
                "Propene",
                "Butene"
            ],
            "mismatches": [
                "Propane",
                "Pentene",
                "Hexene",
                "Heptene",
                "Octene",
                "Nonene"
            ],
            "true_referents": [
                "(E)-2-dodecene",
                "(E)-2-octene",
                "(E)-3,4-dimethyl-2-Pentene",
                "(E,Z)-2,4-Dodecadiene",
                "1,4-Undecadiene",
                "1-Heptene",
                "1-Pentene",
                "1-hexene",
                "1-nonene",
                "1-octene",
                "2,3-dimethylpentane",
                "2,4-Dimethyl-2-pentene",
                "2,4-dimethyl-1-heptene",
                "2-Heptene",
                "2-Hexene",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-hexene",
                "5,6-dimethyl-Decane",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "benzene",
                "benzene-d6",
                "but-1-ene",
                "butadiene",
                "butane",
                "butene",
                "cyclohexane",
                "cyclohexene",
                "decane",
                "dodecane",
                "ethane",
                "ethene",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isopentane",
                "methane",
                "nonacene",
                "nonane",
                "o-xylene",
                "octane",
                "octene",
                "p-xylene",
                "pentane",
                "propene",
                "toluene",
                "toluene-d8",
                "undecane",
                "xylene"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH\u2084)",
            "Ethane (C\u2082H\u2086)",
            "Propane (C\u2083H\u2088)",
            "Butane (C\u2084H\u2081\u2080)",
            "Pentane (C\u2085H\u2081\u2082)",
            "Hexane (C\u2086H\u2081\u2084)",
            "Heptane (C\u2087H\u2081\u2086)",
            "Octane (C\u2088H\u2081\u2088)",
            "Nonane (C\u2089H\u2082\u2080)",
            "Decane (C\u2081\u2080H\u2082\u2082)",
            "Undecane (C\u2081\u2081H\u2082\u2084)",
            "Dodecane (C\u2081\u2082H\u2082\u2086)",
            "Cyclohexane (C\u2086H\u2081\u2082)",
            "Benzene (C\u2086H\u2086)",
            "Toluene (C\u2087H\u2088)",
            "Xylene (C\u2088H\u2081\u2080)",
            "Octatetraene (C\u2088H\u2081\u2082)",
            "Ethyne (C\u2082H\u2082)",
            "Ethylene (C\u2082H\u2084)",
            "Isobutane (C\u2084H\u2081\u2080)",
            "Isopentane (C\u2085H\u2081\u2082)",
            "Methylcyclohexane (C\u2087H\u2081\u2084)",
            "Phenylene (C\u2086H\u2084)",
            "Styrene (C\u2088H\u2088)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methane",
                "ethane",
                "propane",
                "butane",
                "pentane",
                "hexane",
                "heptane",
                "octane",
                "nonane",
                "decane",
                "undecane",
                "dodecane",
                "benzene",
                "toluene",
                "xylene",
                "isobutane",
                "isopentane",
                "methylcyclohexane",
                "styrene"
            ],
            "mismatches": [
                "cyclohexane",
                "octatetraene",
                "ethyne",
                "ethylene",
                "phenylene"
            ],
            "true_referents": [
                "(1-Ethylpropyl)benzene",
                "(1-methylethylidene)-Cyclohexane",
                "(3E,5E)-2,6-Dimethyl-1,3,5,7-octatetraene",
                "(E)-2-dodecene",
                "1,3,6-Octatriene",
                "1,4-Undecadiene",
                "1,6-dimethyl-Cyclohexene",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "1-methyl-Cyclohexene",
                "2,4-dimethylhexane",
                "2,6-Dimethyldecane",
                "2,6-dimethyl-1,3,5,7-octatetraene",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "4-ethyl-1-hexene",
                "5,6-dimethyl-Decane",
                "6-ethyl-2-methyl-Octane",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "acetylene",
                "alkane",
                "alkyne",
                "benzene",
                "benzene-d6",
                "biphenylene",
                "butane",
                "butene",
                "cyclohexene",
                "decane",
                "dodecane",
                "ethane",
                "ethene",
                "ethylbenzene",
                "heptadecane",
                "heptane",
                "hexane",
                "hexaphenylene",
                "isobutane",
                "isooctane",
                "isopentane",
                "methane",
                "methylcyclohexane",
                "nonane",
                "o-xylene",
                "octane",
                "p-xylene",
                "pentane",
                "propane",
                "propene",
                "styrene",
                "toluene",
                "toluene-d8",
                "undecane",
                "vinylarene",
                "xylene"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH\u2084)",
            "Ethane (C\u2082H\u2086)",
            "Propane (C\u2083H\u2088)",
            "Butane (C\u2084H\u2081\u2080)",
            "Pentane (C\u2085H\u2081\u2082)",
            "Hexane (C\u2086H\u2081\u2084)",
            "Heptane (C\u2087H\u2081\u2086)",
            "Octane (C\u2088H\u2081\u2088)",
            "Benzene (C\u2086H\u2086)",
            "Toluene (C\u2087H\u2088)",
            "Cyclohexane (C\u2086H\u2081\u2082)",
            "Ethylene (C\u2082H\u2084)",
            "Acetylene (C\u2082H\u2082)",
            "Propylene (C\u2083H\u2086)",
            "Naphthalene (C\u2081\u2080H\u2088)",
            "Anthracene (C\u2081\u2084H\u2081\u2080)",
            "Isobutane (C\u2084H\u2081\u2080)",
            "Cyclopentane (C\u2085H\u2081\u2080)",
            "Styrene (C\u2088H\u2088)",
            "Isoprene (C\u2085H\u2088)",
            "Limonene (C\u2081\u2080H\u2081\u2086)",
            "Fullerene (C\u2086\u2080)",
            "Graphene",
            "Diamond"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH\u2084)",
                "Ethane (C\u2082H\u2086)",
                "Propane (C\u2083H\u2088)",
                "Butane (C\u2084H\u2081\u2080)",
                "Pentane (C\u2085H\u2081\u2082)",
                "Hexane (C\u2086H\u2081\u2084)",
                "Heptane (C\u2087H\u2081\u2086)",
                "Octane (C\u2088H\u2081\u2088)",
                "Benzene (C\u2086H\u2086)",
                "Toluene (C\u2087H\u2088)",
                "Acetylene (C\u2082H\u2082)",
                "Naphthalene (C\u2081\u2080H\u2088)",
                "Anthracene (C\u2081\u2084H\u2081\u2080)",
                "Isobutane (C\u2084H\u2081\u2080)",
                "Cyclopentane (C\u2085H\u2081\u2080)",
                "Styrene (C\u2088H\u2088)",
                "Isoprene (C\u2085H\u2088)"
            ],
            "mismatches": [
                "Cyclohexane (C\u2086H\u2081\u2082)",
                "Ethylene (C\u2082H\u2084)",
                "Propylene (C\u2083H\u2086)",
                "Limonene (C\u2081\u2080H\u2081\u2086)",
                "Fullerene (C\u2086\u2080)",
                "Graphene",
                "Diamond"
            ],
            "true_referents": [
                "(1-Ethylpropyl)benzene",
                "(1Z,2Z,6E,10E)-pinacene",
                "(4S)-limonene",
                "1,2,4-trimethyl-Cyclopentane",
                "1,6-dimethyl-Cyclohexene",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "1-nonene",
                "2,4-dimethylhexane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "4-ethyl-1-hexene",
                "6-ethyl-2-methyl-Octane",
                "Ethylcyclopentane",
                "Naphtho[2,3-e]pyrene",
                "acene",
                "acetylene",
                "acetylenes",
                "acyclic acetylene",
                "alkane",
                "anthracene",
                "benzene",
                "benzene-d6",
                "beta-hexaprene",
                "butane",
                "butene",
                "cyclohexene",
                "cyclopentane",
                "diamantane",
                "ethane",
                "ethylbenzene",
                "heptadecane",
                "heptane",
                "hexane",
                "isobutane",
                "isooctane",
                "isopentane",
                "isoprene",
                "methane",
                "naphthalene",
                "octane",
                "pentacene",
                "pentane",
                "polyene",
                "polyhedrane",
                "propane",
                "propene",
                "styrene",
                "tetrahedrane",
                "toluene",
                "toluene-d8",
                "vinylarene"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Acetylene (C2H2)",
            "Ethylene (C2H4)",
            "Propylene (C3H6)",
            "1-Butene (C4H8)",
            "Isobutene (C4H8)",
            "1-Pentene (C5H10)",
            "1-Hexene (C6H12)",
            "Benzene (C6H6)",
            "Toluene (C7H8)",
            "Ethylbenzene (C8H10)",
            "o-Xylene (C8H10)",
            "m-Xylene (C8H10)",
            "p-Xylene (C8H10)",
            "Naphthalene (C10H8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Acetylene (C2H2)",
                "1-Pentene (C5H10)",
                "1-Hexene (C6H12)",
                "Benzene (C6H6)",
                "Toluene (C7H8)",
                "Ethylbenzene (C8H10)",
                "o-Xylene (C8H10)",
                "m-Xylene (C8H10)",
                "p-Xylene (C8H10)",
                "Naphthalene (C10H8)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "1-Butene (C4H8)",
                "Isobutene (C4H8)",
                "Ethylene (C2H4)",
                "Propylene (C3H6)"
            ],
            "true_referents": [
                "(1-Ethylpropyl)benzene",
                "(E)-4,4-Dimethyl-2-pentene",
                "1-Pentene",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "2,3-dimethylpentane",
                "2,4-Dimethyl-2-pentene",
                "2-Hexene",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-hexene",
                "4-ethyl-1-hexene",
                "5,6-dimethyl-Decane",
                "Naphtho[2,3-e]pyrene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "acene",
                "acetylene",
                "acyclic acetylene",
                "alkane",
                "benzene",
                "benzene-d6",
                "but-1-ene",
                "butadiene",
                "butane",
                "butene",
                "decane",
                "ethane",
                "ethylbenzene",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isobutylbenzene",
                "isopentane",
                "m-xylene",
                "methane",
                "methylbenzene",
                "naphthalene",
                "nonane",
                "o-xylene",
                "octane",
                "p-xylene",
                "pentane",
                "propene",
                "toluene",
                "toluene-d8",
                "xylene"
            ],
            "TP": 18,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Ethylene (C2H4)",
            "Propylene (C3H6)",
            "Butylene (C4H8)",
            "Isobutylene (C4H8)",
            "Acetylene (C2H2)",
            "Benzene (C6H6)",
            "Toluene (C7H8)",
            "Xylene (C8H10)",
            "Styrene (C8H8)",
            "Naphthalene (C10H8)",
            "Anthracene (C14H10)",
            "Phenanthrene (C14H10)",
            "Cyclohexane (C6H12)",
            "Methylcyclohexane (C7H14)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Acetylene (C2H2)",
                "Benzene (C6H6)",
                "Toluene (C7H8)",
                "Xylene (C8H10)",
                "Styrene (C8H8)",
                "Naphthalene (C10H8)",
                "Anthracene (C14H10)",
                "Phenanthrene (C14H10)",
                "Cyclohexane (C6H12)",
                "Methylcyclohexane (C7H14)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Ethylene (C2H4)",
                "Propylene (C3H6)",
                "Butylene (C4H8)",
                "Isobutylene (C4H8)"
            ],
            "true_referents": [
                "(1-methylethylidene)-Cyclohexane",
                "1-ethyl-2,4-dimethyl-Benzene",
                "1-hexene",
                "1-methyl-Cyclohexene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2-Isopropyl-1,4-hexadiene",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "4-ethyl-1-hexene",
                "5,6-dimethyl-Decane",
                "Naphtho[2,3-e]pyrene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "acene",
                "acetylene",
                "acyclic acetylene",
                "alkane",
                "anthracene",
                "benzene",
                "benzene-d6",
                "butadiene",
                "butane",
                "butene",
                "butylbenzene",
                "cyclohexane",
                "cyclohexene",
                "decane",
                "ethane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isobutylbenzene",
                "isopentane",
                "methane",
                "methylcyclohexane",
                "naphthalene",
                "nonane",
                "o-xylene",
                "octane",
                "p-xylene",
                "pentane",
                "phenanthrene",
                "propene",
                "styrene",
                "toluene",
                "toluene-d8",
                "xylene"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methane",
                "ethane",
                "butane",
                "pentane",
                "hexane",
                "heptane",
                "octane",
                "nonane",
                "decane",
                "undecane",
                "dodecane",
                "tridecane",
                "tetradecane",
                "pentadecane",
                "hexadecane",
                "heptadecane",
                "octadecane",
                "nonadecane",
                "henicosane",
                "docosane",
                "tricosane",
                "tetracosane"
            ],
            "mismatches": [
                "propane",
                "eicosane"
            ],
            "true_referents": [
                "(9Z)-tricosene",
                "(E)-2-dodecene",
                "(E,Z)-2,4-Dodecadiene",
                "1,4-Undecadiene",
                "1-docosene",
                "1-hexene",
                "1-pentadecene",
                "10-Eicosene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,6,8-trimethyldecane",
                "2,6-dimethylheptadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "7Z-Heneicosene",
                "8E-Heneicosene",
                "9-Methylnonadecane",
                "Eicosene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Tetracosene",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "butane",
                "butene",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "propene",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tricosene",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "(9Z)-tricosene",
                "(E)-2-dodecene",
                "(E,Z)-2,4-Dodecadiene",
                "1,4-Undecadiene",
                "1-docosene",
                "1-hexene",
                "1-pentadecene",
                "10-Eicosene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,6,8-trimethyldecane",
                "2,6-dimethylheptadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "7Z-Heneicosene",
                "8E-Heneicosene",
                "9-Methylnonadecane",
                "Eicosene",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Tetracosene",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "butane",
                "butene",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "propene",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tricosene",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Ethene (C2H4)",
            "Propene (C3H6)",
            "But-1-ene (C4H8)",
            "But-2-ene (C4H8)",
            "Pent-1-ene (C5H10)",
            "Pent-2-ene (C5H10)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Icosane (C20H42)",
                "Ethene (C2H4)",
                "Propene (C3H6)",
                "But-1-ene (C4H8)",
                "But-2-ene (C4H8)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Pent-1-ene (C5H10)",
                "Pent-2-ene (C5H10)"
            ],
            "true_referents": [
                "(3E)-3-Icosene",
                "(E)-2-dodecene",
                "(E)-3-dodecene",
                "(E,Z)-2,4-Dodecadiene",
                "1,4-Undecadiene",
                "1-hexene",
                "1-pentadecene",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,6,8-trimethyldecane",
                "2,6-dimethylheptadecane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "acene",
                "alkane",
                "but-1-ene",
                "but-2-ene",
                "butane",
                "butene",
                "decane",
                "dodecane",
                "ethane",
                "ethene",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "propene",
                "tetradecane",
                "trans-but-2-ene",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "hydrocarbon",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "diamond",
                "Canonical name": "(C)diamond"
            },
            {
                "Referent": "graphite",
                "Canonical name": "(C)graphite"
            },
            {
                "Referent": "fullerenes",
                "Canonical name": "(C)fullerenes"
            },
            {
                "Referent": "carbon nanotubes",
                "Canonical name": "(C)carbon nanotubes"
            },
            {
                "Referent": "carbohydrate",
                "Canonical name": "(C)carbohydrate"
            },
            {
                "Referent": "glycogen",
                "Canonical name": "(C)glycogen"
            },
            {
                "Referent": "cellulose",
                "Canonical name": "(C)cellulose"
            },
            {
                "Referent": "chitin",
                "Canonical name": "(C)chitin"
            },
            {
                "Referent": "chitosan",
                "Canonical name": "(C)chitosan"
            },
            {
                "Referent": "acetylene",
                "Canonical name": "(C)acetylene"
            },
            {
                "Referent": "ethyne",
                "Canonical name": "(C)ethyne"
            },
            {
                "Referent": "benzene",
                "Canonical name": "(C)benzene"
            },
            {
                "Referent": "cyclohexane",
                "Canonical name": "(C)cyclohexane"
            },
            {
                "Referent": "hexane",
                "Canonical name": "(C)hexane"
            },
            {
                "Referent": "cyclohexene",
                "Canonical name": "(C)cyclohexene"
            },
            {
                "Referent": "cycloheptane",
                "Canonical name": "(C)cycloheptane"
            },
            {
                "Referent": "cyclooctane",
                "Canonical name": "(C)cyclooctane"
            },
            {
                "Referent": "cyclononane",
                "Canonical name": "(C)cyclononane"
            },
            {
                "Referent": "cyclodecane",
                "Canonical name": "(C)cyclodecane"
            },
            {
                "Referent": "cyclododecane",
                "Canonical name": "(C)cyclododecane"
            },
            {
                "Referent": "cyclopentane",
                "Canonical name": "(C)cyclopentane"
            },
            {
                "Referent": "cyclohexadiene",
                "Canonical name": "(C)cyclohexadiene"
            },
            {
                "Referent": "cycloheptadiene",
                "Canonical name": "(C)cycloheptadiene"
            },
            {
                "Referent": "cyclooctadiene",
                "Canonical name": "(C)cyclooctadiene"
            },
            {
                "Referent": "cyclodecadiene",
                "Canonical name": "(C)cyclodecadiene"
            },
            {
                "Referent": "cyclopentadiene",
                "Canonical name": "(C)cyclopentadiene"
            },
            {
                "Referent": "cyclohexatriene",
                "Canonical name": "(C)cyclohexatriene"
            },
            {
                "Referent": "cycloheptatriene",
                "Canonical name": "(C)cycloheptatriene"
            },
            {
                "Referent": "cyclooctatriene",
                "Canonical name": "(C)cyclooctatriene"
            },
            {
                "Referent": "cyclodecatriene",
                "Canonical name": "(C)cyclodecatriene"
            },
            {
                "Referent": "cyclopentatriene",
                "Canonical name": "(C)cyclopentatriene"
            },
            {
                "Referent": "cyclohexadiynyl",
                "Canonical name": "(C)cyclohexadiynyl"
            },
            {
                "Referent": "cycloheptadiynyl",
                "Canonical name": "(C)cycloheptadiynyl"
            },
            {
                "Referent": "cyclooctadiynyl",
                "Canonical name": "(C)cyclooctadiynyl"
            },
            {
                "Referent": "cyclodecadiynyl",
                "Canonical name": "(C)cyclodecadiynyl"
            },
            {
                "Referent": "cyclopentadiynyl",
                "Canonical name": "(C)cyclopentadiynyl"
            },
            {
                "Referent": "cyclohexadiene",
                "Canonical name": "(C)cyclohexadiene"
            },
            {
                "Referent": "cycloheptadiene",
                "Canonical name": "(C)cycloheptadiene"
            },
            {
                "Referent": "cyclooctadiene",
                "Canonical name": "(C)cyclooctadiene"
            },
            {
                "Referent": "cyclodecadiene",
                "Canonical name": "(C)cyclodecadiene"
            },
            {
                "Referent": "cyclopentadiene",
                "Canonical name": "(C)cyclopentadiene"
            },
            {
                "Referent": "cyclohexatriene",
                "Canonical name": "(C)cyclohexatriene"
            },
            {
                "Referent": "cycloheptatriene",
                "Canonical name": "(C)cycloheptatriene"
            },
            {
                "Referent": "cyclooctatriene",
                "Canonical name": "(C)cyclooctatriene"
            },
            {
                "Referent": "cyclodecatriene",
                "Canonical name": "(C)cyclodecatriene"
            },
            {
                "Referent": "cyclopentatriene",
                "Canonical name": "(C)cyclopentatriene"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "acetylene",
                "benzene",
                "hexane",
                "cyclopentane"
            ],
            "mismatches": [
                "diamond",
                "graphite",
                "fullerenes",
                "carbon nanotubes",
                "carbohydrate",
                "glycogen",
                "cellulose",
                "chitin",
                "chitosan",
                "ethyne",
                "cyclohexane",
                "cyclohexene",
                "cycloheptane",
                "cyclooctane",
                "cyclononane",
                "cyclodecane",
                "cyclododecane",
                "cyclohexadiene",
                "cycloheptadiene",
                "cyclooctadiene",
                "cyclodecadiene",
                "cyclopentadiene",
                "cyclohexatriene",
                "cycloheptatriene",
                "cyclooctatriene",
                "cyclodecatriene",
                "cyclopentatriene",
                "cyclohexadiynyl",
                "cycloheptadiynyl",
                "cyclooctadiynyl",
                "cyclodecadiynyl",
                "cyclopentadiynyl"
            ],
            "true_referents": [
                "(+)-Isoconiochaetone C",
                "(+)-cubenene",
                "(-)-alpha-amorphene",
                "(-)-cyperene",
                "(1-methylethylidene)-Cyclohexane",
                "(1Z,2Z,6E,10E)-pinacene",
                "(7E)-tricosene",
                "1,4-Cyclohexadiene, 1-methyl-",
                "1-Methyl-3-(2-methyl-1-propenyl)cyclopentane",
                "1-docosene",
                "1-hexadecene",
                "1-hexene",
                "4,6-dimethyldodecane",
                "Cycloheptene",
                "Cyclopentane, 1,1,3-trimethyl-",
                "acetylene",
                "acetylenes",
                "alkane",
                "benzene",
                "cyclohepta-1,3,5-triene",
                "cycloocta-1,3,5-triene",
                "cycloocta-1,3,6-triene",
                "cyclopentane",
                "hexadecane",
                "hexane",
                "monocyclic hydrocarbon",
                "triacetylene",
                "tricyclic hydrocarbon"
            ],
            "TP": 4,
            "FP": 32,
            "FN": 0
        }
    }
]