[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "methane (CH4)",
            "ethane (C2H6)",
            "propane (C3H8)",
            "butane (C4H10)",
            "pentane (C5H12)",
            "hexane (C6H14)",
            "heptane (C7H16)",
            "octane (C8H18)",
            "nonane (C9H20)",
            "decane (C10H22)",
            "undecane (C11H24)",
            "dodecane (C12H26)",
            "tridecane (C13H28)",
            "tetradecane (C14H30)",
            "pentadecane (C15H32)",
            "hexadecane (C16H34)",
            "heptadecane (C17H36)",
            "octadecane (C18H38)",
            "nonadecane (C19H40)",
            "eicosane (C20H42)",
            "heneicosane (C21H44)",
            "docosane (C22H46)",
            "tricosane (C23H48)",
            "tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methane (CH4)",
                "ethane (C2H6)",
                "butane (C4H10)",
                "pentane (C5H12)",
                "hexane (C6H14)",
                "heptane (C7H16)",
                "octane (C8H18)",
                "nonane (C9H20)",
                "decane (C10H22)",
                "undecane (C11H24)",
                "dodecane (C12H26)",
                "tridecane (C13H28)",
                "tetradecane (C14H30)",
                "pentadecane (C15H32)",
                "hexadecane (C16H34)",
                "heptadecane (C17H36)",
                "octadecane (C18H38)",
                "nonadecane (C19H40)",
                "docosane (C22H46)",
                "tricosane (C23H48)",
                "tetracosane (C24H50)"
            ],
            "mismatches": [
                "propane (C3H8)",
                "eicosane (C20H42)",
                "heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)",
            "Pentacosane (C25H52)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)",
                "Pentacosane (C25H52)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Icosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,2,4,4,6,8,8-heptamethylnonane",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "methane",
            "ethane",
            "propane",
            "butane",
            "pentane",
            "hexane",
            "heptane",
            "octane",
            "nonane",
            "decane",
            "undecane",
            "dodecane",
            "tridecane",
            "tetradecane",
            "pentadecane",
            "hexadecane",
            "heptadecane",
            "octadecane",
            "nonadecane",
            "icosane",
            "heneicosane",
            "docosane",
            "tricosane",
            "tetracosane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methane",
                "ethane",
                "propane",
                "butane",
                "pentane",
                "hexane",
                "heptane",
                "octane",
                "nonane",
                "decane",
                "undecane",
                "dodecane",
                "tridecane",
                "tetradecane",
                "pentadecane",
                "hexadecane",
                "heptadecane",
                "octadecane",
                "nonadecane",
                "icosane",
                "docosane",
                "tricosane",
                "tetracosane"
            ],
            "mismatches": [
                "heneicosane"
            ],
            "true_referents": [
                "2-methyl-Pentadecane",
                "3-ethylpentane",
                "3-methyl-pentadecane",
                "5,6-dimethyl-Decane",
                "Decane, 5-methyl-",
                "N-(docosanoyl)eicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexacosane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "propane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH\u2084)",
            "Ethane (C\u2082H\u2086)",
            "Propane (C\u2083H\u2088)",
            "Butane (C\u2084H\u2081\u2080)",
            "Pentane (C\u2085H\u2081\u2082)",
            "Hexane (C\u2086H\u2081\u2084)",
            "Heptane (C\u2087H\u2081\u2086)",
            "Octane (C\u2088H\u2081\u2088)",
            "Nonane (C\u2089H\u2082\u2080)",
            "Decane (C\u2081\u2080H\u2082\u2082)",
            "Undecane (C\u2081\u2081H\u2082\u2084)",
            "Dodecane (C\u2081\u2082H\u2082\u2086)",
            "Tridecane (C\u2081\u2083H\u2082\u2088)",
            "Tetradecane (C\u2081\u2084H\u2083\u2080)",
            "Pentadecane (C\u2081\u2085H\u2083\u2082)",
            "Hexadecane (C\u2081\u2086H\u2083\u2084)",
            "Heptadecane (C\u2081\u2087H\u2083\u2086)",
            "Octadecane (C\u2081\u2088H\u2083\u2088)",
            "Nonadecane (C\u2081\u2089H\u2084\u2080)",
            "Eicosane (C\u2082\u2080H\u2084\u2082)",
            "Heneicosane (C\u2082\u2081H\u2084\u2084)",
            "Docosane (C\u2082\u2082H\u2084\u2086)",
            "Tricosane (C\u2082\u2083H\u2084\u2088)",
            "Tetracosane (C\u2082\u2084H\u2085\u2080)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH\u2084)",
                "Ethane (C\u2082H\u2086)",
                "Propane (C\u2083H\u2088)",
                "Butane (C\u2084H\u2081\u2080)",
                "Pentane (C\u2085H\u2081\u2082)",
                "Hexane (C\u2086H\u2081\u2084)",
                "Heptane (C\u2087H\u2081\u2086)",
                "Octane (C\u2088H\u2081\u2088)",
                "Nonane (C\u2089H\u2082\u2080)",
                "Decane (C\u2081\u2080H\u2082\u2082)",
                "Undecane (C\u2081\u2081H\u2082\u2084)",
                "Dodecane (C\u2081\u2082H\u2082\u2086)",
                "Tridecane (C\u2081\u2083H\u2082\u2088)",
                "Tetradecane (C\u2081\u2084H\u2083\u2080)",
                "Pentadecane (C\u2081\u2085H\u2083\u2082)",
                "Hexadecane (C\u2081\u2086H\u2083\u2084)",
                "Heptadecane (C\u2081\u2087H\u2083\u2086)",
                "Octadecane (C\u2081\u2088H\u2083\u2088)",
                "Nonadecane (C\u2081\u2089H\u2084\u2080)",
                "Docosane (C\u2082\u2082H\u2084\u2086)",
                "Tricosane (C\u2082\u2083H\u2084\u2088)",
                "Tetracosane (C\u2082\u2084H\u2085\u2080)"
            ],
            "mismatches": [
                "Eicosane (C\u2082\u2080H\u2084\u2082)",
                "Heneicosane (C\u2082\u2081H\u2084\u2084)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,4,6,10-tetramethylpentadecane",
                "2,4-dimethylhexane",
                "2,5,9-Trimethyldecane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2,9-dimethyldecane",
                "2-Methylhenicosane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "6-ethyl-2-methyl-Octane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "N-(eicosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "propane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Icosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,2,4,4,6,8,8-heptamethylnonane",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Henicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Henicosane (C21H44)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Icosane (C20H42)"
            ],
            "true_referents": [
                "2,2,4,4,6,8,8-heptamethylnonane",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Henicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Henicosane (C21H44)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Icosane (C20H42)"
            ],
            "true_referents": [
                "2,2,4,4,6,8,8-heptamethylnonane",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Eicosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Eicosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "2-methylicosane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethyl-5-(2-ethylbutyl)-octadecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Icosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,2,4,4,6,8,8-heptamethylnonane",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 20,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            "Methane (CH4)",
            "Ethane (C2H6)",
            "Propane (C3H8)",
            "Butane (C4H10)",
            "Pentane (C5H12)",
            "Hexane (C6H14)",
            "Heptane (C7H16)",
            "Octane (C8H18)",
            "Nonane (C9H20)",
            "Decane (C10H22)",
            "Undecane (C11H24)",
            "Dodecane (C12H26)",
            "Tridecane (C13H28)",
            "Tetradecane (C14H30)",
            "Pentadecane (C15H32)",
            "Hexadecane (C16H34)",
            "Heptadecane (C17H36)",
            "Octadecane (C18H38)",
            "Nonadecane (C19H40)",
            "Icosane (C20H42)",
            "Heneicosane (C21H44)",
            "Docosane (C22H46)",
            "Tricosane (C23H48)",
            "Tetracosane (C24H50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methane (CH4)",
                "Ethane (C2H6)",
                "Butane (C4H10)",
                "Pentane (C5H12)",
                "Hexane (C6H14)",
                "Heptane (C7H16)",
                "Octane (C8H18)",
                "Nonane (C9H20)",
                "Decane (C10H22)",
                "Undecane (C11H24)",
                "Dodecane (C12H26)",
                "Tridecane (C13H28)",
                "Tetradecane (C14H30)",
                "Pentadecane (C15H32)",
                "Hexadecane (C16H34)",
                "Heptadecane (C17H36)",
                "Octadecane (C18H38)",
                "Nonadecane (C19H40)",
                "Docosane (C22H46)",
                "Tricosane (C23H48)",
                "Tetracosane (C24H50)"
            ],
            "mismatches": [
                "Propane (C3H8)",
                "Icosane (C20H42)",
                "Heneicosane (C21H44)"
            ],
            "true_referents": [
                "2,2,4,4,6,8,8-heptamethylnonane",
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,4-dimethylhexane",
                "2,6,8-trimethyldecane",
                "2,6-Dimethyldecane",
                "2,6-dimethylheptadecane",
                "2-Methylhenicosane",
                "2-methyl-Pentadecane",
                "3,6-dimethyl-Decane",
                "3,6-dimethyl-Octane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "3-methyl-pentadecane",
                "4,6-dimethyldodecane",
                "4-methyl-Tetradecane",
                "5,6-dimethyl-Decane",
                "9-Methylnonadecane",
                "N-(docosanoyl)-4-hydroxyeicosasphinganine",
                "Nonane, 2,5-dimethyl-",
                "Nonane, 4-methyl-",
                "Undecane, 2,9-dimethyl-",
                "Undecane, 2-methyl-",
                "butane",
                "decane",
                "docosane",
                "dodecane",
                "ethane",
                "henicosane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "icosane",
                "isobutane",
                "isopentane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "tetracosane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "alkane",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "ethane",
                "Canonical name": "ethane"
            },
            {
                "Referent": "propane",
                "Canonical name": "propane"
            },
            {
                "Referent": "butane",
                "Canonical name": "butane"
            },
            {
                "Referent": "pentane",
                "Canonical name": "pentane"
            },
            {
                "Referent": "hexane",
                "Canonical name": "hexane"
            },
            {
                "Referent": "heptane",
                "Canonical name": "heptane"
            },
            {
                "Referent": "octane",
                "Canonical name": "octane"
            },
            {
                "Referent": "nonane",
                "Canonical name": "nonane"
            },
            {
                "Referent": "decane",
                "Canonical name": "decane"
            },
            {
                "Referent": "undecane",
                "Canonical name": "undecane"
            },
            {
                "Referent": "dodecane",
                "Canonical name": "dodecane"
            },
            {
                "Referent": "tridecane",
                "Canonical name": "tridecane"
            },
            {
                "Referent": "tetradecane",
                "Canonical name": "tetradecane"
            },
            {
                "Referent": "pentadecane",
                "Canonical name": "pentadecane"
            },
            {
                "Referent": "hexadecane",
                "Canonical name": "hexadecane"
            },
            {
                "Referent": "heptadecane",
                "Canonical name": "heptadecane"
            },
            {
                "Referent": "octadecane",
                "Canonical name": "octadecane"
            },
            {
                "Referent": "nonadecane",
                "Canonical name": "nonadecane"
            },
            {
                "Referent": "eicosane",
                "Canonical name": "eicosane"
            },
            {
                "Referent": "heneicosane",
                "Canonical name": "heneicosane"
            },
            {
                "Referent": "docosane",
                "Canonical name": "docosane"
            },
            {
                "Referent": "tricosane",
                "Canonical name": "tricosane"
            },
            {
                "Referent": "tetracosane",
                "Canonical name": "tetracosane"
            },
            {
                "Referent": "pentacosan",
                "Canonical name": "pentacosan"
            },
            {
                "Referent": "hexacosan",
                "Canonical name": "hexacosan"
            },
            {
                "Referent": "heptacosan",
                "Canonical name": "heptacosan"
            },
            {
                "Referent": "octacosan",
                "Canonical name": "octacosan"
            },
            {
                "Referent": "nonacosan",
                "Canonical name": "nonacosan"
            },
            {
                "Referent": "triacontane",
                "Canonical name": "triacontane"
            },
            {
                "Referent": "tetracontane",
                "Canonical name": "tetracontane"
            },
            {
                "Referent": "pentacontane",
                "Canonical name": "pentacontane"
            },
            {
                "Referent": "hexacontane",
                "Canonical name": "hexacontane"
            },
            {
                "Referent": "heptacontane",
                "Canonical name": "heptacontane"
            },
            {
                "Referent": "octacontane",
                "Canonical name": "octacontane"
            },
            {
                "Referent": "nonacontane",
                "Canonical name": "nonacontane"
            },
            {
                "Referent": "hentriacontane",
                "Canonical name": "hentriacontane"
            },
            {
                "Referent": "dotriacontane",
                "Canonical name": "dotriacontane"
            },
            {
                "Referent": "tritriacontane",
                "Canonical name": "tritriacontane"
            },
            {
                "Referent": "tetratriacontane",
                "Canonical name": "tetratriacontane"
            },
            {
                "Referent": "pentatriacontane",
                "Canonical name": "pentatriacontane"
            },
            {
                "Referent": "hexatriacontane",
                "Canonical name": "hexatriacontane"
            },
            {
                "Referent": "heptatriacontane",
                "Canonical name": "heptatriacontane"
            },
            {
                "Referent": "octatriacontane",
                "Canonical name": "octatriacontane"
            },
            {
                "Referent": "nonatriacontane",
                "Canonical name": "nonatriacontane"
            },
            {
                "Referent": "triacontane",
                "Canonical name": "triacontane"
            },
            {
                "Referent": "tetracontane",
                "Canonical name": "tetracontane"
            },
            {
                "Referent": "pentacontane",
                "Canonical name": "pentacontane"
            },
            {
                "Referent": "hexacontane",
                "Canonical name": "hexacontane"
            },
            {
                "Referent": "heptacontane",
                "Canonical name": "heptacontane"
            },
            {
                "Referent": "octacontane",
                "Canonical name": "octacontane"
            },
            {
                "Referent": "nonacontane",
                "Canonical name": "nonacontane"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethane",
                "propane",
                "butane",
                "pentane",
                "hexane",
                "heptane",
                "octane",
                "nonane",
                "undecane",
                "dodecane",
                "tridecane",
                "pentadecane",
                "hexadecane",
                "heptadecane",
                "octadecane",
                "nonadecane",
                "docosane",
                "tricosane",
                "pentacosane",
                "heptacosane"
            ],
            "mismatches": [
                "decane",
                "tetradecane",
                "eicosane",
                "heneicosane",
                "tetracosane",
                "hexacosan",
                "octacosan",
                "nonacosan",
                "triacontane",
                "tetracontane",
                "pentacontane",
                "hexacontane",
                "heptacontane",
                "octacontane",
                "nonacontane",
                "hentriacontane",
                "dotriacontane",
                "tritriacontane",
                "tetratriacontane",
                "pentatriacontane",
                "hexatriacontane",
                "heptatriacontane",
                "octatriacontane",
                "nonatriacontane"
            ],
            "true_referents": [
                "2,3,5,8-tetramethyldecane",
                "2,3-dimethylpentane",
                "2,5,9-Trimethyldecane",
                "2,6-Dimethyldecane",
                "3,5-dimethyl-Heptane",
                "3,6-dimethyl-Octane",
                "3-ethyl-3-methyldecane",
                "3-ethylpentane",
                "3-methyl-Tridecane",
                "4,6-dimethyldodecane",
                "Decane, 5-methyl-",
                "Dodecane, 4-methyl-",
                "Hexane, 2,2,5-trimethyl-",
                "Nonane, 4-methyl-",
                "Nonane, 5-methyl-5-propyl-",
                "Undecane, 2-methyl-",
                "butane",
                "docosane",
                "dodecane",
                "ethane",
                "heptacosane",
                "heptadecane",
                "heptane",
                "hexadecane",
                "hexane",
                "methane",
                "nonadecane",
                "nonane",
                "octadecane",
                "octane",
                "pentacosane",
                "pentadecane",
                "pentane",
                "propane",
                "tetradecane",
                "tricosane",
                "tridecane",
                "undecane"
            ],
            "TP": 20,
            "FP": 24,
            "FN": 0
        }
    }
]