[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "propanol (C3H7OH)",
            "butanol (C4H9OH)",
            "pentanol (C5H11OH)",
            "hexanol (C6H13OH)",
            "heptanol (C7H15OH)",
            "octanol (C8H17OH)",
            "nonanol (C9H19OH)",
            "decanol (C10H21OH)",
            "undecanol (C11H23OH)",
            "dodecanol (C12H25OH)",
            "tridecanol (C13H27OH)",
            "tetradecanol (C14H31OH)",
            "pentadecanol (C15H33OH)",
            "hexadecanol (C16H35OH)",
            "heptadecanol (C17H37OH)",
            "octadecanol (C18H39OH)",
            "nonadecanol (C19H41OH)",
            "eicosanol (C20H43OH)",
            "heneicosanol (C21H45OH)",
            "docosanol (C22H47OH)",
            "tricosanol (C23H49OH)",
            "tetracosanol (C24H51OH)",
            "pentacosanol (C25H53OH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "undecanol",
                "dodecanol",
                "tridecanol",
                "tetradecanol",
                "pentadecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "docosanol",
                "tricosanol",
                "tetracosanol",
                "pentacosanol"
            ],
            "mismatches": [
                "propanol (C3H7OH)",
                "butanol (C4H9OH)",
                "eicosanol (C20H43OH)",
                "heneicosanol (C21H45OH)"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,21-Heneicosanediol",
                "1,7-decanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "3S,7S-dimethyl-2S-tetradecanol",
                "4-Hydroxy-6-docosanone",
                "4-Hydroxy-6-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "4-Hydroxy-6-tetracosanone",
                "5-Hydroxy-7-docosanone",
                "6-Hydroxy-4-heneicosanone",
                "6-oxo-nonan-1-ol",
                "8E-octadecenyl heptadecanoate",
                "butyl butanoate",
                "butyl octanoate",
                "decanol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonan-4-ol",
                "nonanol",
                "octadecanol",
                "octanol",
                "pentacosanol",
                "pentadecan-5-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propyl decanoate",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 19,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "1-Propanol (C3H8O)",
            "1-Butanol (C4H10O)",
            "1-Pentanol (C5H12O)",
            "1-Hexanol (C6H14O)",
            "1-Heptanol (C7H16O)",
            "1-Octanol (C8H18O)",
            "1-Nonanol (C9H20O)",
            "1-Decanol (C10H22O)",
            "1-Undecanol (C11H24O)",
            "1-Dodecanol (C12H26O)",
            "1-Tridecanol (C13H28O)",
            "1-Tetradecanol (C14H30O)",
            "1-Pentadecanol (C15H32O)",
            "1-Hexadecanol (C16H34O)",
            "1-Heptadecanol (C17H36O)",
            "1-Octadecanol (C18H38O)",
            "1-Nonadecanol (C19H40O)",
            "1-Eicosanol (C20H42O)",
            "1-Heneicosanol (C21H44O)",
            "1-Docosanol (C22H46O)",
            "1-Tricosanol (C23H48O)",
            "1-Tetracosanol (C24H50O)",
            "1-Pentacosanol (C25H52O)",
            "1-Hexacosanol (C26H54O)",
            "1-Heptacosanol (C27H56O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1-Heptanol (C7H16O)",
                "1-Octanol (C8H18O)",
                "1-Nonanol (C9H20O)",
                "1-Decanol (C10H22O)",
                "1-Undecanol (C11H24O)",
                "1-Dodecanol (C12H26O)",
                "1-Tridecanol (C13H28O)",
                "1-Tetradecanol (C14H30O)",
                "1-Pentadecanol (C15H32O)",
                "1-Hexadecanol (C16H34O)",
                "1-Heptadecanol (C17H36O)",
                "1-Octadecanol (C18H38O)",
                "1-Docosanol (C22H46O)",
                "1-Tricosanol (C23H48O)",
                "1-Tetracosanol (C24H50O)",
                "1-Pentacosanol (C25H52O)",
                "1-Hexacosanol (C26H54O)"
            ],
            "mismatches": [
                "1-Propanol (C3H8O)",
                "1-Butanol (C4H10O)",
                "1-Pentanol (C5H12O)",
                "1-Eicosanol (C20H42O)",
                "1-Heneicosanol (C21H44O)",
                "1-Heptacosanol (C27H56O)"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,7-decanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-O-hexacosyl oleate",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "3S,7S-dimethyl-2-hexadecanol",
                "3S,7S-dimethyl-2S-tetradecanol",
                "4-Hydroxy-6-docosanone",
                "4-Hydroxy-6-heneicosanone",
                "4-Hydroxy-6-tetracosanone",
                "5,10-Pentadecadien-1-ol",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "6-Hydroxy-8-tricosanone",
                "6-oxo-nonan-1-ol",
                "8-Hydroxy-6-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "9-Hydroxytridecyl docosanoate",
                "butyl butanoate",
                "decanol",
                "docosanol",
                "dodecan-1-ol",
                "dodecan-6-ol",
                "dodecanol",
                "heptadecanol",
                "heptanol",
                "hexacosan-6-ol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonanol",
                "octadecanol",
                "octanol",
                "pentacosan-5-ol",
                "pentacosanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-4-ol",
                "undecanol"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propyl alcohol (Propanol)",
            "Butyl alcohol (Butanol)",
            "Pentyl alcohol (Pentanol)",
            "Hexyl alcohol (Hexanol)",
            "Heptyl alcohol (Heptanol)",
            "Octyl alcohol (Octanol)",
            "Nonyl alcohol (Nonanol)",
            "Decyl alcohol (Decanol)",
            "Undecyl alcohol (Undecanol)",
            "Dodecyl alcohol (Dodecanol)",
            "Tridecyl alcohol (Tridecanol)",
            "Tetradecyl alcohol (Tetradecanol)",
            "Pentadecyl alcohol (Pentadecanol)",
            "Hexadecyl alcohol (Hexadecanol)",
            "Heptadecyl alcohol (Heptadecanol)",
            "Octadecyl alcohol (Octadecanol)",
            "Nonadecyl alcohol (Nonadecanol)",
            "Eicosyl alcohol (Eicosanol)",
            "Heneicosyl alcohol (Heneicosanol)",
            "Docosyl alcohol (Docosanol)",
            "Tricosyl alcohol (Tricosanol)",
            "Tetracosyl alcohol (Tetracosanol)",
            "Pentacosyl alcohol (Pentacosanol)",
            "Hexacosyl alcohol (Hexacosanol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "undecanol",
                "dodecanol",
                "tridecanol",
                "tetradecanol",
                "pentadecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "docosanol",
                "tricosanol",
                "tetracosanol",
                "pentacosanol",
                "hexacosanol"
            ],
            "mismatches": [
                "propanol",
                "butanol",
                "eicosanol",
                "heneicosanol"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,21-Heneicosanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "6-Hydroxy-4-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "butyl acetate",
                "butyl butanoate",
                "decan-1-ol",
                "decanol",
                "decyl oleate",
                "docosan-3-ol",
                "docosanol",
                "dodecanol",
                "dodecenol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonan-3-ol",
                "nonanol",
                "nonyl acetate",
                "nonyl palmitate",
                "octadecanol",
                "octanol",
                "pentacosan-1-ol",
                "pentacosanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "pentanol",
                "pentyl propanoate",
                "propyl acetate",
                "propyl decanoate",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecanol",
                "unsaturated fatty alcohol"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "1-Nonanol (1-Nonanol)",
            "1-Decanol (1-Decanol)",
            "1-Undecanol (1-Undecanol)",
            "1-Dodecanol (1-Dodecanol)",
            "1-Tridecanol (1-Tridecanol)",
            "1-Tetradecanol (1-Tetradecanol)",
            "1-Pentadecanol (1-Pentadecanol)",
            "1-Hexadecanol (1-Hexadecanol)",
            "1-Heptadecanol (1-Heptadecanol)",
            "1-Octadecanol (1-Octadecanol)",
            "1-Nonadecanol (1-Nonadecanol)",
            "1-Eicosanol (1-Eicosanol)",
            "1-Heneicosanol (1-Heneicosanol)",
            "1-Docosanol (1-Docosanol)",
            "1-Tricosanol (1-Tricosanol)",
            "1-Tetracosanol (1-Tetracosanol)",
            "1-Pentacosanol (1-Pentacosanol)",
            "1-Hexacosanol (1-Hexacosanol)",
            "1-Heptacosanol (1-Heptacosanol)",
            "1-Octacosanol (1-Octacosanol)",
            "1-Nonacosanol (1-Nonacosanol)",
            "1-Triacontanol (1-Triacontanol)",
            "1-Dotriacontanol (1-Dotriacontanol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1-Docosanol (1-Docosanol)",
                "1-Tricosanol (1-Tricosanol)",
                "1-Tetracosanol (1-Tetracosanol)",
                "1-Pentacosanol (1-Pentacosanol)",
                "1-Hexacosanol (1-Hexacosanol)",
                "1-Nonacosanol (1-Nonacosanol)"
            ],
            "mismatches": [
                "1-Nonanol (1-Nonanol)",
                "1-Decanol (1-Decanol)",
                "1-Undecanol (1-Undecanol)",
                "1-Dodecanol (1-Dodecanol)",
                "1-Tridecanol (1-Tridecanol)",
                "1-Tetradecanol (1-Tetradecanol)",
                "1-Pentadecanol (1-Pentadecanol)",
                "1-Hexadecanol (1-Hexadecanol)",
                "1-Heptadecanol (1-Heptadecanol)",
                "1-Octadecanol (1-Octadecanol)",
                "1-Nonadecanol (1-Nonadecanol)",
                "1-Eicosanol (1-Eicosanol)",
                "1-Heneicosanol (1-Heneicosanol)",
                "1-Heptacosanol (1-Heptacosanol)",
                "1-Octacosanol (1-Octacosanol)",
                "1-Triacontanol (1-Triacontanol)",
                "1-Dotriacontanol (1-Dotriacontanol)"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "(S)-nonacosan-10-ol",
                "1,21-Heneicosanediol",
                "1,3-decanediol",
                "1,7-decanediol",
                "1-Stearoylglycerol",
                "1-octadecyl-heptadecanoate",
                "15-Nonacosanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "32-methyltetratriacontan-1-ol",
                "4-Hydroxy-6-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "6-oxo-nonan-1-ol",
                "8-Hydroxy-6-docosanone",
                "8E-octadecenyl heptadecanoate",
                "decanol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecenol",
                "dotriacontan-1-ol",
                "heptadecanol",
                "hexacosan-1-ol",
                "hexacosanol",
                "hexadecanol",
                "nonadecanol",
                "nonan-3-ol",
                "nonanol",
                "octacosan-1-ol",
                "octadecanol",
                "pentacosan-1-ol",
                "pentacosanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "triacontan-1-ol",
                "tricosan-1-ol",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 6,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propanol (C3H8O)",
            "Butanol (C4H10O)",
            "Pentanol (C5H12O)",
            "Hexanol (C6H14O)",
            "Heptanol (C7H16O)",
            "Octanol (C8H18O)",
            "Nonanol (C9H20O)",
            "Decanol (C10H22O)",
            "Undecanol (C11H24O)",
            "Dodecanol (C12H26O)",
            "Tridecanol (C13H28O)",
            "Tetradecanol (C14H30O)",
            "Pentadecanol (C15H32O)",
            "Hexadecanol (C16H34O)",
            "Heptadecanol (C17H36O)",
            "Octadecanol (C18H38O)",
            "Nonadecanol (C19H40O)",
            "Eicosanol (C20H42O)",
            "Heneicosanol (C21H44O)",
            "Docosanol (C22H46O)",
            "Tricosanol (C23H48O)",
            "Tetracosanol (C24H50O)",
            "Pentacosanol (C25H52O)",
            "Hexacosanol (C26H54O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Propanol (C3H8O)",
                "Pentanol (C5H12O)",
                "Hexanol (C6H14O)",
                "Heptanol (C7H16O)",
                "Octanol (C8H18O)",
                "Nonanol (C9H20O)",
                "Decanol (C10H22O)",
                "Undecanol (C11H24O)",
                "Dodecanol (C12H26O)",
                "Tridecanol (C13H28O)",
                "Tetradecanol (C14H30O)",
                "Pentadecanol (C15H32O)",
                "Hexadecanol (C16H34O)",
                "Heptadecanol (C17H36O)",
                "Octadecanol (C18H38O)",
                "Nonadecanol (C19H40O)",
                "Docosanol (C22H46O)",
                "Tricosanol (C23H48O)",
                "Tetracosanol (C24H50O)",
                "Pentacosanol (C25H52O)",
                "Hexacosanol (C26H54O)"
            ],
            "mismatches": [
                "Butanol (C4H10O)",
                "Eicosanol (C20H42O)",
                "Heneicosanol (C21H44O)"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,21-Heneicosanediol",
                "1,7-decanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-O-hexacosyl oleate",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "butyl butanoate",
                "butyl octanoate",
                "decanol",
                "docosan-6-ol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonan-3-ol",
                "nonanol",
                "octadecanol",
                "octanol",
                "pentacosan-5-ol",
                "pentacosanol",
                "pentadecan-5-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propyl decanoate",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-4-ol",
                "undecanol"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propan-1-ol (C3H8O)",
            "Butan-1-ol (C4H10O)",
            "Pentanol (C5H12O)",
            "Hexanol (C6H14O)",
            "Heptanol (C7H16O)",
            "Octanol (C8H18O)",
            "Nonanol (C9H20O)",
            "Decanol (C10H22O)",
            "Undecanol (C11H24O)",
            "Dodecanol (C12H26O)",
            "Tridecanol (C13H28O)",
            "Tetradecanol (C14H30O)",
            "Pentadecanol (C15H32O)",
            "Hexadecanol (C16H34O)",
            "Heptadecanol (C17H36O)",
            "Octadecanol (C18H38O)",
            "Nonadecanol (C19H40O)",
            "Eicosanol (C20H42O)",
            "Heneicosanol (C21H44O)",
            "Docosanol (C22H46O)",
            "Tricosanol (C23H48O)",
            "Tetracosanol (C24H50O)",
            "Pentacosanol (C25H52O)",
            "Hexacosanol (C26H54O)",
            "Heptacosanol (C27H56O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Propan-1-ol (C3H8O)",
                "Butan-1-ol (C4H10O)",
                "Pentanol (C5H12O)",
                "Hexanol (C6H14O)",
                "Heptanol (C7H16O)",
                "Octanol (C8H18O)",
                "Nonanol (C9H20O)",
                "Decanol (C10H22O)",
                "Undecanol (C11H24O)",
                "Dodecanol (C12H26O)",
                "Tridecanol (C13H28O)",
                "Tetradecanol (C14H30O)",
                "Pentadecanol (C15H32O)",
                "Hexadecanol (C16H34O)",
                "Heptadecanol (C17H36O)",
                "Octadecanol (C18H38O)",
                "Nonadecanol (C19H40O)",
                "Docosanol (C22H46O)",
                "Tricosanol (C23H48O)",
                "Tetracosanol (C24H50O)",
                "Pentacosanol (C25H52O)",
                "Hexacosanol (C26H54O)"
            ],
            "mismatches": [
                "Eicosanol (C20H42O)",
                "Heneicosanol (C21H44O)",
                "Heptacosanol (C27H56O)"
            ],
            "true_referents": [
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "1,21-Heneicosanediol",
                "1,7-decanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-O-hexacosyl oleate",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "butan-1-ol",
                "decanol",
                "docosan-6-ol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "nonadecanol",
                "nonan-3-ol",
                "nonanol",
                "octadecanol",
                "octan-4-ol",
                "octanol",
                "pentacosan-5-ol",
                "pentacosanol",
                "pentadecan-5-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propan-1-ol",
                "propan-2-ol",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-4-ol",
                "undecanol"
            ],
            "TP": 22,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propanol (PrOH)",
            "Butanol (BuOH)",
            "Pentanol (PeOH)",
            "Hexanol (HeOH)",
            "Heptanol (HpOH)",
            "Octanol (OcOH)",
            "Nonanol (NoOH)",
            "Decanol (DeOH)",
            "Undecanol (UnOH)",
            "Dodecanol (DoOH)",
            "Tridecanol (TrOH)",
            "Tetradecanol (TeOH)",
            "Pentadecanol (PeOH)",
            "Hexadecanol (HeOH)",
            "Heptadecanol (HpOH)",
            "Octadecanol (OcOH)",
            "Nonadecanol (NoOH)",
            "Eicosanol (EiOH)",
            "Heneicosanol (HeOH)",
            "Docosanol (DoOH)",
            "Tricosanol (TrOH)",
            "Tetracosanol (TeOH)",
            "Pentacosanol (PeOH)",
            "Hexacosanol (HeOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Propanol (PrOH)",
                "Pentanol (PeOH)",
                "Hexanol (HeOH)",
                "Heptanol (HpOH)",
                "Octanol (OcOH)",
                "Nonanol (NoOH)",
                "Decanol (DeOH)",
                "Undecanol (UnOH)",
                "Dodecanol (DoOH)",
                "Tridecanol (TrOH)",
                "Tetradecanol (TeOH)",
                "Pentadecanol (PeOH)",
                "Hexadecanol (HeOH)",
                "Heptadecanol (HpOH)",
                "Octadecanol (OcOH)",
                "Nonadecanol (NoOH)",
                "Docosanol (DoOH)",
                "Tricosanol (TrOH)",
                "Tetracosanol (TeOH)",
                "Pentacosanol (PeOH)",
                "Hexacosanol (HeOH)"
            ],
            "mismatches": [
                "Butanol (BuOH)",
                "Eicosanol (EiOH)",
                "Heneicosanol (HeOH)"
            ],
            "true_referents": [
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "2-hydroxyethyl octadecanoate",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "4-Hydroxy-6-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "6-Hydroxy-4-nonadecanone",
                "butyl butanoate",
                "butyl octanoate",
                "decanol",
                "docosan-6-ol",
                "docosanol",
                "dodecanol",
                "dodecenol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonan-3-ol",
                "nonan-4-ol",
                "nonanol",
                "octadecanol",
                "octanol",
                "pentacosanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propan-1-ol",
                "propyl decanoate",
                "propyl hexanoate",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosan-1-ol",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "n-propanol",
            "isobutanol",
            "n-butanol",
            "2-methyl-1-propanol",
            "2-methyl-2-propanol",
            "n-pentanol",
            "isopentanol",
            "neopentanol",
            "n-hexanol",
            "isohexanol",
            "2-ethyl-1-butanol",
            "3-methyl-1-pentanol",
            "2,2-dimethyl-1-propanol",
            "n-heptanol",
            "n-octanol",
            "n-nonanol",
            "n-decanol",
            "n-undecanol",
            "n-dodecanol",
            "n-tridecanol",
            "n-tetradecanol",
            "n-pentadecanol",
            "n-hexadecanol",
            "n-heptadecanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "n-heptanol",
                "n-octanol",
                "n-nonanol",
                "n-decanol",
                "n-undecanol",
                "n-dodecanol",
                "n-tridecanol",
                "n-tetradecanol",
                "n-pentadecanol",
                "n-hexadecanol",
                "n-heptadecanol"
            ],
            "mismatches": [
                "n-propanol",
                "isobutanol",
                "n-butanol",
                "2-methyl-1-propanol",
                "2-methyl-2-propanol",
                "n-pentanol",
                "isopentanol",
                "neopentanol",
                "n-hexanol",
                "isohexanol",
                "2-ethyl-1-butanol",
                "3-methyl-1-pentanol",
                "2,2-dimethyl-1-propanol"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,3-decanediol",
                "1,7-decanediol",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "butyl butanoate",
                "butyl octanoate",
                "decanol",
                "dodecanol",
                "dodecenol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "isopropyl dodecanoate",
                "isopropyl ester",
                "n-butyl oleate",
                "nonan-3-ol",
                "nonan-4-ol",
                "nonanol",
                "octadecanol",
                "octanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentan-3-ol",
                "pentanol",
                "propyl decanoate",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tridecanol",
                "undecan-1-ol",
                "undecan-5-ol",
                "undecanol"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "1-Propanol (n-Propanol)",
            "2-Propanol (Isopropanol)",
            "1-Butanol (n-Butanol)",
            "2-Butanol (sec-Butanol)",
            "2-Methyl-2-propanol (tert-Butanol)",
            "1-Pentanol (n-Pentanol)",
            "2-Pentanol",
            "3-Methyl-1-butanol",
            "3-Methyl-2-butanol",
            "1-Hexanol (n-Hexanol)",
            "2-Hexanol",
            "3-Hexanol",
            "1-Heptanol (n-Heptanol)",
            "2-Heptanol",
            "1-Octanol (n-Octanol)",
            "2-Octanol",
            "1-Nonanol (n-Nonanol)",
            "2-Nonanol",
            "1-Decanol (n-Decanol)",
            "2-Decanol",
            "1-Dodecanol (Dodecanol)",
            "1-Tetradecanol (Tetradecanol)",
            "1-Hexadecanol (Hexadecanol)",
            "1-Octacosanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1-Pentanol (n-Pentanol)",
                "2-Pentanol",
                "1-Hexanol (n-Hexanol)",
                "2-Hexanol",
                "3-Hexanol",
                "1-Heptanol (n-Heptanol)",
                "1-Octanol (n-Octanol)",
                "2-Octanol",
                "1-Nonanol (n-Nonanol)",
                "2-Nonanol",
                "1-Decanol (n-Decanol)",
                "2-Decanol",
                "1-Dodecanol (Dodecanol)",
                "1-Tetradecanol (Tetradecanol)",
                "1-Hexadecanol (Hexadecanol)",
                "1-Octacosanol"
            ],
            "mismatches": [
                "1-Propanol (n-Propanol)",
                "2-Propanol (Isopropanol)",
                "1-Butanol (n-Butanol)",
                "2-Butanol (sec-Butanol)",
                "2-Methyl-2-propanol (tert-Butanol)",
                "3-Methyl-1-butanol",
                "3-Methyl-2-butanol"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,3-decanediol",
                "1,7-decanediol",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "6-oxo-nonan-1-ol",
                "Isopropyl propionate",
                "butyl butanoate",
                "decan-2-ol",
                "decanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecenol",
                "heptadecanol",
                "heptanol",
                "hexadecanol",
                "hexan-2-ol",
                "hexan-3-ol",
                "hexanol",
                "hexyl 2-methylbutanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isopropyl ester",
                "n-butyl oleate",
                "nonan-2-ol",
                "nonan-4-ol",
                "nonanol",
                "octacosan-1-ol",
                "octan-2-ol",
                "octanol",
                "pentan-1-ol",
                "pentan-2-ol",
                "pentanol",
                "propan-1-ol",
                "secondary fatty alcohol",
                "tetradecanol",
                "tetradecyl tetradecanoate"
            ],
            "TP": 16,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "1-Propanol (n-propyl alcohol)",
            "2-Propanol (isopropyl alcohol)",
            "1-Butanol (n-butanol)",
            "2-Butanol (sec-butanol)",
            "2-Methyl-1-propanol (isobutanol)",
            "tert-Butanol",
            "1-Pentanol (n-pentanol)",
            "3-Pentanol",
            "1-Hexanol",
            "1-Heptanol",
            "1-Octanol",
            "1-Nonanol",
            "1-Decanol",
            "1-Undecanol",
            "1-Dodecanol (lauryl alcohol)",
            "1-Tetradecanol (myristyl alcohol)",
            "1-Hexadecanol (cetyl alcohol)",
            "1-Octadecanol (stearyl alcohol)",
            "1-Eicosanol",
            "1-Docosanol (behenyl alcohol)",
            "1-Tetracosanol (lignoceryl alcohol)",
            "1-Hexacosanol (ceryl alcohol)",
            "1-Octacosanol",
            "1-Triacontanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1-Pentanol (n-pentanol)",
                "3-Pentanol",
                "1-Hexanol",
                "1-Heptanol",
                "1-Octanol",
                "1-Nonanol",
                "1-Decanol",
                "1-Undecanol",
                "1-Dodecanol (lauryl alcohol)",
                "1-Tetradecanol (myristyl alcohol)",
                "1-Hexadecanol (cetyl alcohol)",
                "1-Octadecanol (stearyl alcohol)",
                "1-Docosanol (behenyl alcohol)",
                "1-Tetracosanol (lignoceryl alcohol)",
                "1-Hexacosanol (ceryl alcohol)",
                "1-Octacosanol",
                "1-Triacontanol"
            ],
            "mismatches": [
                "1-Propanol (n-propyl alcohol)",
                "2-Propanol (isopropyl alcohol)",
                "1-Butanol (n-butanol)",
                "2-Butanol (sec-butanol)",
                "2-Methyl-1-propanol (isobutanol)",
                "tert-Butanol",
                "1-Eicosanol"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,3-decanediol",
                "1,7-decanediol",
                "1-O-dodecylglycerol",
                "1-O-hexacosyl oleate",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "3S,7S-dimethyl-2S-tetradecanol",
                "4-Hydroxy-6-eicosanone",
                "5-Hydroxy-7-eicosanone",
                "8E-octadecenyl heptadecanoate",
                "Isopropyl propionate",
                "butyl butanoate",
                "butyl octanoate",
                "decanol",
                "docosan-3-ol",
                "docosanol",
                "dodecanol",
                "dodecyl dodecanoate",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl 2-methylbutanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isopropyl ester",
                "n-butyl oleate",
                "nonan-3-ol",
                "nonan-5-ol",
                "nonanol",
                "octacosan-1-ol",
                "octadecanol",
                "octanol",
                "pentadecan-3-ol",
                "pentan-1-ol",
                "pentan-3-ol",
                "pentanol",
                "propan-1-ol",
                "propyl acetate",
                "secondary fatty alcohol",
                "tetracosanol",
                "tetradecanol",
                "triacontan-1-ol",
                "tricosanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "1-Propanol (n-propanol)",
            "2-Propanol (isopropanol)",
            "1-Butanol (n-butanol)",
            "2-Butanol (sec-butanol)",
            "2-Methyl-1-propanol (isobutanol)",
            "1-Pentanol (n-pentanol)",
            "1-Hexanol (n-hexanol)",
            "1-Heptanol (n-heptanol)",
            "1-Octanol (n-octanol)",
            "1-Nonanol (n-nonanol)",
            "1-Decanol (n-decanol)",
            "1-Undecanol (n-undecanol)",
            "1-Dodecanol (n-dodecanol)",
            "1-Tridecanol (n-tridecanol)",
            "1-Tetradecanol (n-tetradecanol)",
            "1-Pentadecanol (n-pentadecanol)",
            "1-Hexadecanol (cetyl alcohol)",
            "1-Heptadecanol (n-heptadecanol)",
            "1-Octadecanol (stearyl alcohol)",
            "1-Nonadecanol (n-nonadecanol)",
            "1-Eicosanol (arachidyl alcohol)",
            "1-Heneicosanol (n-heneicosanol)",
            "1-Docosanol (behenyl alcohol)",
            "1-Tetracosanol (lignoceryl alcohol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "propan-1-ol",
                "pentan-1-ol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "undecanol",
                "dodecanol",
                "tridecanol",
                "tetradecanol",
                "pentadecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "docosanol",
                "tetracosanol"
            ],
            "mismatches": [
                "2-Propanol (isopropanol)",
                "1-Butanol (n-butanol)",
                "2-Butanol (sec-butanol)",
                "2-Methyl-1-propanol (isobutanol)",
                "1-Eicosanol (arachidyl alcohol)",
                "1-Heneicosanol (n-heneicosanol)"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,21-Heneicosanediol",
                "1,3-decanediol",
                "1,7-decanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "6-oxo-nonan-1-ol",
                "8-Hydroxy-6-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "Isopropyl propionate",
                "butyl butanoate",
                "decanol",
                "docosan-3-ol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl 2-methylbutanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isopropyl ester",
                "n-butyl oleate",
                "nonadecanol",
                "nonan-4-ol",
                "nonanol",
                "nonyl palmitate",
                "octadecanol",
                "octanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propan-1-ol",
                "secondary fatty alcohol",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propanol (C3H7OH)",
            "Butanol (C4H9OH)",
            "Pentanol (C5H11OH)",
            "Hexanol (C6H13OH)",
            "Heptanol (C7H15OH)",
            "Octanol (C8H17OH)",
            "Nonanol (C9H19OH)",
            "Decanol (C10H21OH)",
            "Undecanol (C11H23OH)",
            "Dodecanol (C12H25OH)",
            "Tridecanol (C13H27OH)",
            "Tetradecanol (C14H29OH)",
            "Pentadecanol (C15H31OH)",
            "Hexadecanol (C16H33OH)",
            "Heptadecanol (C17H35OH)",
            "Octadecanol (C18H37OH)",
            "Nonadecanol (C19H39OH)",
            "Eicosanol (C20H41OH)",
            "Heneicosanol (C21H43OH)",
            "Docosanol (C22H45OH)",
            "Tricosanol (C23H47OH)",
            "Tetracosanol (C24H49OH)",
            "Pentacosanol (C25H51OH)",
            "Hexacosanol (C26H53OH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pentanol (C5H11OH)",
                "Hexanol (C6H13OH)",
                "Heptanol (C7H15OH)",
                "Octanol (C8H17OH)",
                "Nonanol (C9H19OH)",
                "Decanol (C10H21OH)",
                "Undecanol (C11H23OH)",
                "Dodecanol (C12H25OH)",
                "Tridecanol (C13H27OH)",
                "Tetradecanol (C14H29OH)",
                "Pentadecanol (C15H31OH)",
                "Hexadecanol (C16H33OH)",
                "Heptadecanol (C17H35OH)",
                "Octadecanol (C18H37OH)",
                "Nonadecanol (C19H39OH)",
                "Docosanol (C22H45OH)",
                "Tricosanol (C23H47OH)",
                "Tetracosanol (C24H49OH)",
                "Pentacosanol (C25H51OH)",
                "Hexacosanol (C26H53OH)"
            ],
            "mismatches": [
                "Propanol (C3H7OH)",
                "Butanol (C4H9OH)",
                "Eicosanol (C20H41OH)",
                "Heneicosanol (C21H43OH)"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,7-decanediol",
                "1-O-(2R-hydroxy-eicosanyl)-sn-glycerol",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3,7-dimethyl-3-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "3S,7S-dimethyl-2S-tetradecanol",
                "4-Hydroxy-6-docosanone",
                "4-Hydroxy-6-eicosanone",
                "4-Hydroxy-6-heneicosanone",
                "4-Hydroxy-6-tetracosanone",
                "6-Hydroxy-4-heneicosanone",
                "6-oxo-nonan-1-ol",
                "8-Hydroxy-6-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "9-Hydroxytridecyl docosanoate",
                "butyl butanoate",
                "butyl octanoate",
                "decanol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecyl dodecanoate",
                "heptadecanol",
                "heptanol",
                "hexacosan-6-ol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonan-4-ol",
                "nonanol",
                "octadecanol",
                "octanol",
                "pentacosanol",
                "pentadecan-5-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propyl decanoate",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosanol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propanol (Prop)",
            "Butanol (But)",
            "Pentanol (Pent)",
            "Hexanol (Hex)",
            "Heptanol (Hept)",
            "Octanol (Oct)",
            "Nonanol (Non)",
            "Decanol (Dec)",
            "Undecanol (Und)",
            "Dodecanol (Dod)",
            "Tridecanol (Tri)",
            "Tetradecanol (Tet)",
            "Pentadecanol (Pen)",
            "Hexadecanol (Hex)",
            "Heptadecanol (Hep)",
            "Octadecanol (Oca)",
            "Nonadecanol (Noa)",
            "Eicosanol (Eic)",
            "Heneicosanol (Hen)",
            "Docosanol (Doc)",
            "Tricosanol (Tri)",
            "Tetracosanol (Tet)",
            "Pentacosanol (Pen)",
            "Hexacosanol (Hex)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "butanol",
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "undecanol",
                "dodecanol",
                "tridecanol",
                "tetradecanol",
                "pentadecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "docosanol",
                "tricosanol",
                "tetracosanol",
                "pentacosanol",
                "hexacosanol"
            ],
            "mismatches": [
                "propanol",
                "eicosanol",
                "heneicosanol"
            ],
            "true_referents": [
                "(2S)-2-heptanol",
                "1,21-Heneicosanediol",
                "1-O-tetracosyl oleate",
                "1-octadecyl-heptadecanoate",
                "2-butyl-1-octanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "4-Hydroxy-6-eicosanone",
                "5-Hydroxy-7-eicosanone",
                "6-Hydroxy-4-heneicosanone",
                "8E-octadecenyl heptadecanoate",
                "Henicosane-6,8-diol",
                "Z-10-Pentadecenol",
                "butan-1-ol",
                "butyl butanoate",
                "decan-1-ol",
                "decan-3-ol",
                "decanol",
                "docosan-3-ol",
                "docosanol",
                "dodecan-1-ol",
                "dodecanol",
                "dodecenol",
                "heptadecanol",
                "heptanol",
                "hexacosanol",
                "hexadecanol",
                "hexanol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "nonadecanol",
                "nonan-1-ol",
                "nonan-2-ol",
                "nonanol",
                "nonyl palmitate",
                "octadecanol",
                "octan-1-ol",
                "octanol",
                "pentacosan-1-ol",
                "pentacosanol",
                "pentadecan-1-ol",
                "pentadecanol",
                "pentan-1-ol",
                "pentanol",
                "propyl acetate",
                "propyl decanoate",
                "tetracosanol",
                "tetradecanol",
                "tetradecyl tetradecanoate",
                "tricosan-3-ol",
                "tricosanol",
                "tridecan-3-ol",
                "tridecanol",
                "undecan-1-ol",
                "undecan-6-ol",
                "undecanol"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Oleyl alcohol (OLY)",
            "Linoleyl alcohol (LNO)",
            "Ceramide (CER)",
            "Palmitoleyl alcohol (PLO)",
            "Squalene (SQ)",
            "Cholesterol ester (CHE)",
            "Octadecanol (OD)",
            "Eicosanol (EOS)",
            "Docosanol (DOS)",
            "Tetracosanol (TCS)",
            "Hexacosanol (HCS)",
            "Octacosanol (OCS)",
            "Triacontanol (TCS)",
            "Dotriacontanol (DTS)",
            "Tetracontanol (TTS)",
            "Pentacosanol (PCS)",
            "Hexatriacontanol (HTS)",
            "Heptacosanol (HPS)",
            "Octatriacontanol (OTS)",
            "Nonacosanol (NCS)",
            "Triacentanol (TIS)",
            "Tetratriacontanol (TTS)",
            "Pentatriacontanol (PTS)",
            "Hexatriacontanol (HTS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Palmitoleyl alcohol",
                "Docosanol",
                "Hexacosanol",
                "Tetracosanol",
                "Pentacosanol"
            ],
            "mismatches": [
                "Oleyl alcohol (OLY)",
                "Linoleyl alcohol (LNO)",
                "Ceramide (CER)",
                "Squalene (SQ)",
                "Cholesterol ester (CHE)",
                "Octadecanol (OD)",
                "Eicosanol (EOS)",
                "Octacosanol (OCS)",
                "Triacontanol (TCS)",
                "Dotriacontanol (DTS)",
                "Tetracontanol (TTS)",
                "Heptacosanol (HPS)",
                "Octatriacontanol (OTS)",
                "Nonacosanol (NCS)",
                "Triacentanol (TIS)",
                "Tetratriacontanol (TTS)",
                "Pentatriacontanol (PTS)",
                "Hexatriacontanol (HTS)"
            ],
            "true_referents": [
                "1,16-hexadecanediol",
                "1-Stearoylglycerol",
                "1-octadecyl-heptadecanoate",
                "15-Nonacosanol",
                "3-Hydroxy-1-phenyl-1-eicosanone",
                "30-methyldotriacontan-1-ol",
                "32-methyltetratriacontan-1-ol",
                "4-Hydroxy-6-eicosanone",
                "5-Hydroxy-7-eicosanone",
                "Linolenyl laurate",
                "Linolenyl oleate",
                "Linoleyl linoleate",
                "Octacosyl triacontanoate",
                "Stearyl linoleate",
                "Tritriacontyl octacosanoate",
                "docosan-6-ol",
                "docosanol",
                "dotriacontan-1-ol",
                "heptanol",
                "hexacosanol",
                "nonacosan-10-ol",
                "octacosan-1-ol",
                "octadecanol",
                "oleyl oleate",
                "palmitoleyl alcohol",
                "palmitoleyl oleate",
                "pentacosanol",
                "pentanol",
                "stearyl oleate",
                "tetracosanol",
                "tetratriacontan-1-ol",
                "triacontan-1-ol",
                "tricosanol",
                "tridecanol"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": [
            "Propan-1-ol (1-PrOH)",
            "Butan-1-ol (1-BuOH)",
            "Pentan-1-ol (1-PeOH)",
            "Hexan-1-ol (1-HexOH)",
            "Heptan-1-ol (1-HepOH)",
            "Octan-1-ol (1-OctOH)",
            "Nonan-1-ol (1-NonOH)",
            "Decan-1-ol (1-DecOH)",
            "Dodecan-1-ol (1-DodecOH)",
            "Tridecan-1-ol (1-TridecOH)",
            "Tetradecan-1-ol (1-TetradecOH)",
            "Pentadecan-1-ol (1-PentadecOH)",
            "Hexadecan-1-ol (1-HexadecOH)",
            "Heptadecan-1-ol (1-HeptadecOH)",
            "Octadecan-1-ol (1-OctadecOH)",
            "Nonadecan-1-ol (1-NonadecOH)",
            "Icosan-1-ol (1-IcosOH)",
            "Heneicosan-1-ol (1-HeneicosOH)",
            "Docosan-1-ol (1-DocosOH)",
            "Tricosan-1-ol (1-TricosOH)",
            "Tetracosan-1-ol (1-TetracosOH)",
            "Pentacosan-1-ol (1-PentacosOH)",
            "Hexacosan-1-ol (1-HexacosOH)",
            "Heptacosan-1-ol (1-HeptacosOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "propan-1-ol",
                "butan-1-ol",
                "pentan-1-ol",
                "hexan-1-ol",
                "heptan-1-ol",
                "octan-1-ol",
                "decan-1-ol",
                "dodecan-1-ol",
                "docosan-1-ol",
                "tricosan-1-ol",
                "tetracosan-1-ol",
                "pentacosan-1-ol",
                "hexacosan-1-ol",
                "heptacosan-1-ol"
            ],
            "mismatches": [
                "nonan-1-ol",
                "tridecan-1-ol",
                "tetradecan-1-ol",
                "pentadecan-1-ol",
                "hexadecan-1-ol",
                "heptadecan-1-ol",
                "octadecan-1-ol",
                "nonadecan-1-ol",
                "icosan-1-ol",
                "heneicosan-1-ol"
            ],
            "true_referents": [
                "(2R)-octan-2-ol",
                "(2S)-octan-2-ol",
                "2-butyl-1-octanol",
                "6-Hydroxy-4-heneicosanone",
                "butan-1-ol",
                "butyl butanoate",
                "decan-1-ol",
                "decan-3-ol",
                "decan-5-ol",
                "docosan-1-ol",
                "dodecan-1-ol",
                "dodecan-4-ol",
                "dodecan-5-ol",
                "henicosan-3-ol",
                "heptacosan-1-ol",
                "heptadecan-1-ol",
                "heptan-1-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "hexacosan-1-ol",
                "hexadecan-1-ol",
                "hexan-1-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "icosan-1-ol",
                "nonadecan-1-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octadecan-1-ol",
                "octan-1-ol",
                "pentacosan-1-ol",
                "pentadecan-1-ol",
                "pentan-1-ol",
                "pentan-2-ol",
                "propan-1-ol",
                "propan-2-ol",
                "tetracosan-1-ol",
                "tetradecan-1-ol",
                "tricosan-1-ol",
                "tridecan-1-ol"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "fatty alcohol",
        "domain": "chemistry",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]