[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (EtOH)",
            "Propanol (PrOH)",
            "Butanol (BuOH)",
            "Pentanol (PeOH)",
            "Hexanol (HexOH)",
            "Heptanol (HeptOH)",
            "Octanol (OctOH)",
            "Nonanol (NonOH)",
            "Decanol (DecOH)",
            "Undecanol (UndeOH)",
            "Dodecanol (DodecOH)",
            "Tridecanol (TridecOH)",
            "Tetradecanol (TetradecOH)",
            "Pentadecanol (PentadecOH)",
            "Hexadecanol (HexadecOH)",
            "Heptadecanol (HeptadecOH)",
            "Octadecanol (OctadecOH)",
            "Nonadecanol (NonadecOH)",
            "Eicosanol (EicosaOH)",
            "Docosanol (DocosaOH)",
            "Behenol (BehenOH)",
            "Lignoceryl alcohol (LignocerylOH)",
            "Ceryl alcohol (CerylOH)",
            "Montanyl alcohol (MontanylOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethanol-d6",
                "propan-1-ol",
                "pentan-1-ol",
                "undecan-1-ol",
                "dodecan-1-ol",
                "pentadecan-1-ol"
            ],
            "mismatches": [
                "Butanol (BuOH)",
                "Hexanol (HexOH)",
                "Heptanol (HeptOH)",
                "Octanol (OctOH)",
                "Nonanol (NonOH)",
                "Decanol (DecOH)",
                "Tridecanol (TridecOH)",
                "Tetradecanol (TetradecOH)",
                "Hexadecanol (HexadecOH)",
                "Heptadecanol (HeptadecOH)",
                "Octadecanol (OctadecOH)",
                "Nonadecanol (NonadecOH)",
                "Eicosanol (EicosaOH)",
                "Docosanol (DocosaOH)",
                "Behenol (BehenOH)",
                "Lignoceryl alcohol (LignocerylOH)",
                "Ceryl alcohol (CerylOH)",
                "Montanyl alcohol (MontanylOH)"
            ],
            "true_referents": [
                "(E)-cinnamyl alcohol",
                "1-O-dodecylglycerol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl octadecanoate",
                "2-methylbenzyl alcohol",
                "20-hydroxyicosanoic acid",
                "3-methylbenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "Lignoceroyl-EA",
                "N-(docosanoyl)ethanolamine",
                "Octadecadienoic acid, methyl ester",
                "Pentadecanoyl-EA",
                "Pentane-1,5-diol",
                "all-trans-undecaprenol",
                "butyl butanoate",
                "chrysanthemol",
                "decan-1-ol",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl arachidonate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "ethyl octanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "kahweol",
                "methanol",
                "methyl behenate",
                "methyl heptadecanoate",
                "methyl nonadecanoate",
                "methyl nonanoate",
                "methyl tetradecanoate",
                "methyl tridecanoate",
                "nonyl palmitate",
                "pentadecan-1-ol",
                "pentan-1-ol",
                "propan-1-ol",
                "propenol",
                "sinapyl alcohol",
                "tetradecyl tetradecanoate",
                "undecan-1-ol"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "1-Propanol (C3H7OH)",
            "1-Butanol (C4H9OH)",
            "1-Pentanol (C5H11OH)",
            "1-Hexanol (C6H13OH)",
            "1-Heptanol (C7H15OH)",
            "1-Octanol (C8H17OH)",
            "1-Nonanol (C9H19OH)",
            "1-Decanol (C10H21OH)",
            "1-Undecanol (C11H23OH)",
            "1-Dodecanol (C12H25OH)",
            "1-Tetradecanol (C14H29OH)",
            "1-Pentadecanol (C15H31OH)",
            "1-Hexadecanol (C16H33OH)",
            "1-Heptadecanol (C17H35OH)",
            "1-Octadecanol (C18H37OH)",
            "1-Pentanol (C5H11OH)",
            "1-Nonanol (C9H19OH)",
            "1-Butanol, 2-methyl- (2-Methyl-1-butanol)",
            "1-Pentanol, 3-methyl- (3-Methyl-1-pentanol)",
            "1-Hexanol, 2-methyl- (2-Methyl-1-hexanol)",
            "1-Heptanol, 4-methyl- (4-Methyl-1-heptanol)",
            "1-Octanol, 3-ethyl- (3-Ethyl-1-octanol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "ethanol"
            ],
            "mismatches": [
                "1-Propanol (C3H7OH)",
                "1-Butanol (C4H9OH)",
                "1-Pentanol (C5H11OH)",
                "1-Hexanol (C6H13OH)",
                "1-Heptanol (C7H15OH)",
                "1-Octanol (C8H17OH)",
                "1-Nonanol (C9H19OH)",
                "1-Decanol (C10H21OH)",
                "1-Undecanol (C11H23OH)",
                "1-Dodecanol (C12H25OH)",
                "1-Tetradecanol (C14H29OH)",
                "1-Pentadecanol (C15H31OH)",
                "1-Hexadecanol (C16H33OH)",
                "1-Heptadecanol (C17H35OH)",
                "1-Octadecanol (C18H37OH)",
                "1-Butanol, 2-methyl- (2-Methyl-1-butanol)",
                "1-Pentanol, 3-methyl- (3-Methyl-1-pentanol)",
                "1-Hexanol, 2-methyl- (2-Methyl-1-hexanol)",
                "1-Heptanol, 4-methyl- (4-Methyl-1-heptanol)",
                "1-Octanol, 3-ethyl- (3-Ethyl-1-octanol)"
            ],
            "true_referents": [
                "(2R)-2,6-dimethylheptan-1-ol",
                "(2S)-2,6-dimethylheptan-1-ol",
                "(3,4-dimethoxyphenyl)methanol",
                "(S)-2-methylbutan-1-ol",
                "1,5-dodecanediol",
                "1,7-decanediol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-Methyl-2-buten-1-ol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl octadecanoate",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl hexanoate",
                "3-ethoxy-1-propanol",
                "3-methylpentanol",
                "6-oxo-nonan-1-ol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "ethyl octanoate",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl 4,9-dimethyldecanoate",
                "methyl heptadecanoate",
                "methyl hexanoate",
                "methyl undecanoate",
                "pentadecan-1-ol",
                "tetradecyl tetradecanoate",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 2,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "Propan-1-ol (C3H7OH)",
            "Butan-1-ol (C4H9OH)",
            "Pentan-1-ol (C5H11OH)",
            "Hexan-1-ol (C6H13OH)",
            "Heptan-1-ol (C7H15OH)",
            "Octan-1-ol (C8H17OH)",
            "Nonan-1-ol (C9H19OH)",
            "Decan-1-ol (C10H21OH)",
            "Dodecan-1-ol (C12H25OH)",
            "Tetradecan-1-ol (C14H29OH)",
            "Hexadecan-1-ol (C16H33OH)",
            "Octadecan-1-ol (C18H37OH)",
            "Eicosan-1-ol (C20H41OH)",
            "Docosan-1-ol (C22H45OH)",
            "Tetracosan-1-ol (C24H49OH)",
            "Heneicosan-1-ol (C21H43OH)",
            "Tricosan-1-ol (C23H47OH)",
            "Pentacosan-1-ol (C25H51OH)",
            "Cyclohexanemethanol",
            "3-Methylbutan-1-ol",
            "2-Methylpropan-1-ol",
            "2-Ethylhexan-1-ol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methanol (CH3OH)",
                "Propan-1-ol (C3H7OH)",
                "Butan-1-ol (C4H9OH)",
                "Pentan-1-ol (C5H11OH)",
                "Hexan-1-ol (C6H13OH)",
                "Heptan-1-ol (C7H15OH)",
                "Octan-1-ol (C8H17OH)",
                "Nonan-1-ol (C9H19OH)",
                "Decan-1-ol (C10H21OH)",
                "Dodecan-1-ol (C12H25OH)",
                "Tetradecan-1-ol (C14H29OH)",
                "Hexadecan-1-ol (C16H33OH)",
                "Octadecan-1-ol (C18H37OH)",
                "Docosan-1-ol (C22H45OH)",
                "Tetracosan-1-ol (C24H49OH)",
                "Tricosan-1-ol (C23H47OH)",
                "Pentacosan-1-ol (C25H51OH)",
                "2-Ethylhexan-1-ol"
            ],
            "mismatches": [
                "Ethanol (C2H5OH)",
                "Eicosan-1-ol (C20H41OH)",
                "Heneicosan-1-ol (C21H43OH)",
                "Cyclohexanemethanol",
                "3-Methylbutan-1-ol",
                "2-Methylpropan-1-ol"
            ],
            "true_referents": [
                "(13Z)-docosen-1-ol",
                "(2-methyl-4,5-ditridecyl-1,4-cyclohexadienyl)methanol",
                "(2E,4E)-2,4-hexadien-1-ol",
                "(3,4-dimethoxyphenyl)methanol",
                "(E)-3-decen-1-ol",
                "(R)-2-methylbutan-1-ol",
                "(S)-2-aminopropan-1-ol",
                "(S)-2-methylbutan-1-ol",
                "2,6-dimethylheptan-1-ol",
                "2-Buten-1-ol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-aminopropan-1-ol",
                "2-butyl-1-octanol",
                "2-ethylhexan-1-ol",
                "2-hexen-1-ol",
                "2-methylbutan-1-ol",
                "2-methylpropane-1,2-diol",
                "20-methylhenicosan-1-ol",
                "3,7,11-trimethyldodecan-1-ol",
                "4-methylcyclohexanemethanol",
                "6-oxo-nonan-1-ol",
                "Cyclohex-2-enylmethanol",
                "Pentane-1,5-diol",
                "butan-1-ol",
                "decan-1-ol",
                "docosan-1-ol",
                "dodecan-1-ol",
                "ethanol-d6",
                "ethanols",
                "ethyl 2-hexenoate",
                "ethyl 9-decenoate",
                "ethyl nonanoate",
                "henicosan-1-ol",
                "heptacosan-1-ol",
                "heptadecan-1-ol",
                "heptan-1-ol",
                "hexacosan-1-ol",
                "hexadecan-1-ol",
                "hexan-1-ol",
                "methanol",
                "methanol-d1",
                "nonan-1-ol",
                "octacosan-1-ol",
                "octadecan-1-ol",
                "octan-1-ol",
                "pentacosan-1-ol",
                "pentadecan-1-ol",
                "pentan-1-ol",
                "propan-1-ol",
                "propan-1-ols",
                "tetracosan-1-ol",
                "tetradecan-1-ol",
                "tricosan-1-ol"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (MeOH)",
            "Ethanol (EtOH)",
            "1-Propanol (1-PrOH)",
            "2-Methyl-1-propanol (Isobutanol)",
            "1-Butanol (1-BuOH)",
            "2-Butanol (sec-Butanol)",
            "3-Methyl-1-butanol (Isoamyl alcohol)",
            "1-Pentanol (1-PentOH)",
            "2-Pentanol",
            "3-Pentanol",
            "2-Methyl-2-butanol (tert-Amyl alcohol)",
            "1-Hexanol (1-HexOH)",
            "1-Octanol (1-OctOH)",
            "1-Decanol (1-DecOH)",
            "1-Dodecanol (Lauryl alcohol)",
            "Glycerol (Glycerol)",
            "Serinol",
            "Sphingosine",
            "Cholesterol (side chain alcohol)",
            "Vitamin D3 (Calciferol, hydroxylated)",
            "Myristyl alcohol",
            "Cetyl alcohol",
            "Stearyl alcohol",
            "Linoleyl alcohol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "isobutanol"
            ],
            "mismatches": [
                "Methanol (MeOH)",
                "Ethanol (EtOH)",
                "1-Propanol (1-PrOH)",
                "1-Butanol (1-BuOH)",
                "2-Butanol (sec-Butanol)",
                "3-Methyl-1-butanol (Isoamyl alcohol)",
                "1-Pentanol (1-PentOH)",
                "2-Pentanol",
                "3-Pentanol",
                "2-Methyl-2-butanol (tert-Amyl alcohol)",
                "1-Hexanol (1-HexOH)",
                "1-Octanol (1-OctOH)",
                "1-Decanol (1-DecOH)",
                "1-Dodecanol (Lauryl alcohol)",
                "Glycerol (Glycerol)",
                "Serinol",
                "Sphingosine",
                "Cholesterol (side chain alcohol)",
                "Vitamin D3 (Calciferol, hydroxylated)",
                "Myristyl alcohol",
                "Cetyl alcohol",
                "Stearyl alcohol",
                "Linoleyl alcohol"
            ],
            "true_referents": [
                "(+)-pinoresinol",
                "(3,4-dimethoxyphenyl)methanol",
                "(S)-2-methylbutan-1-ol",
                "(S)-leucinol(1+)",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "13-hydroxy-alpha-tocopherol",
                "13-hydroxy-gamma-tocopherol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl butanoate",
                "3,4-dimethylbenzyl alcohol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3-methylpentanol",
                "N-(omega-hydroxytriacontanoyl)sphingosine",
                "Pentane-1,5-diol",
                "Ser-Tyr",
                "Unsaturated alcohol",
                "all-trans-3-hydroxyretinol",
                "arachidyl palmitate",
                "butyl butanoate",
                "dodecyl dodecanoate",
                "dodecyl palmitate",
                "ethanol-d6",
                "ethanols",
                "ethyl decanoate",
                "ethyl ester",
                "ethyl isobutyrate",
                "ethyl linoleate",
                "ethyl linolenate",
                "ethyl myristate",
                "glycerone derivative",
                "glycerone phosphate(2-)",
                "hexane-1,6-diol",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "isobutanol",
                "long-chain primary fatty alcohol",
                "methanol",
                "methanol-d1",
                "myristyl palmitate",
                "octan-1-ol",
                "propan-1-ol",
                "short-chain primary fatty alcohol",
                "stearyl oleate",
                "stearyl palmitate"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "Propan-1-ol (C3H7OH)",
            "Butan-1-ol (C4H9OH)",
            "Pentan-1-ol (C5H11OH)",
            "Hexan-1-ol (C6H13OH)",
            "Heptan-1-ol (C7H15OH)",
            "Octan-1-ol (C8H17OH)",
            "Nonan-1-ol (C9H19OH)",
            "Decan-1-ol (C10H21OH)",
            "Undecan-1-ol (C11H23OH)",
            "Dodecan-1-ol (C12H25OH)",
            "Tridecan-1-ol (C13H27OH)",
            "Tetradecan-1-ol (C14H29OH)",
            "Pentadecan-1-ol (C15H31OH)",
            "Hexadecan-1-ol (C16H33OH)",
            "Heptadecan-1-ol (C17H35OH)",
            "Octadecan-1-ol (C18H37OH)",
            "Nonadecan-1-ol (C19H39OH)",
            "Eicosan-1-ol (C20H41OH)",
            "Prop-2-en-1-ol (Allyl alcohol)",
            "But-3-en-1-ol (Crotyl alcohol)",
            "2-Methylpropan-1-ol (Isobutanol)",
            "3-Methylbutan-1-ol (Isoamyl alcohol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methanol (CH3OH)",
                "Propan-1-ol (C3H7OH)",
                "Butan-1-ol (C4H9OH)",
                "Pentan-1-ol (C5H11OH)",
                "Hexan-1-ol (C6H13OH)",
                "Heptan-1-ol (C7H15OH)",
                "Octan-1-ol (C8H17OH)",
                "Nonan-1-ol (C9H19OH)",
                "Decan-1-ol (C10H21OH)",
                "Undecan-1-ol (C11H23OH)",
                "Dodecan-1-ol (C12H25OH)",
                "Tridecan-1-ol (C13H27OH)",
                "Tetradecan-1-ol (C14H29OH)",
                "Pentadecan-1-ol (C15H31OH)",
                "Hexadecan-1-ol (C16H33OH)",
                "Heptadecan-1-ol (C17H35OH)",
                "Octadecan-1-ol (C18H37OH)",
                "Nonadecan-1-ol (C19H39OH)",
                "Prop-2-en-1-ol (Allyl alcohol)",
                "But-3-en-1-ol (Crotyl alcohol)"
            ],
            "mismatches": [
                "Ethanol (C2H5OH)",
                "Eicosan-1-ol (C20H41OH)",
                "2-Methylpropan-1-ol (Isobutanol)",
                "3-Methylbutan-1-ol (Isoamyl alcohol)"
            ],
            "true_referents": [
                "(2E,4E)-2,4-hexadien-1-ol",
                "(3,4-dimethoxyphenyl)methanol",
                "(E)-3-decen-1-ol",
                "(R)-2-methylbutan-1-ol",
                "(S)-2-methylbutan-1-ol",
                "2,6-dimethylheptan-1-ol",
                "2-Buten-1-ol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-Methyl-3-buten-1-ol",
                "2-butyl-1-octanol",
                "2-ethylhexan-1-ol",
                "2-methylbutan-1-ol",
                "2-methylpropane-1,2-diol",
                "20-methylhenicosan-1-ol",
                "3,7,11-trimethyldodecan-1-ol",
                "3-Buten-1-ol",
                "6-oxo-nonan-1-ol",
                "Pentane-1,5-diol",
                "allyl alcohol",
                "butan-1-ol",
                "crotyl alcohol",
                "decan-1-ol",
                "dodecan-1-ol",
                "ethanol-d6",
                "ethanols",
                "ethyl 9-decenoate",
                "ethyl nonanoate",
                "heptadecan-1-ol",
                "heptan-1-ol",
                "hexadecan-1-ol",
                "hexan-1-ol",
                "methanol",
                "methanol-d1",
                "nonadecan-1-ol",
                "nonan-1-ol",
                "octacosan-1-ol",
                "octadecan-1-ol",
                "octan-1-ol",
                "pentadecan-1-ol",
                "pentan-1-ol",
                "propan-1-ol",
                "propan-1-ols",
                "tetradecan-1-ol",
                "tridecan-1-ol",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (C2H5OH)",
            "Methanol (CH3OH)",
            "1-Propanol (C3H7OH)",
            "1-Butanol (C4H9OH)",
            "1-Pentanol (C5H11OH)",
            "1-Hexanol (C6H13OH)",
            "1-Heptanol (C7H15OH)",
            "1-Octanol (C8H17OH)",
            "1-Nonanol (C9H19OH)",
            "1-Decanol (C10H21OH)",
            "1-Undecanol (C11H23OH)",
            "1-Dodecanol (C12H25OH)",
            "2-Butanol (C4H10O) - not primary but included for clarity",
            "Benzyl alcohol (C6H5CH2OH)",
            "2-Pentanol (C5H12O) - not primary but included for clarity",
            "2-Butanol (C4H10O) - not primary but included for clarity",
            "1-Phenylethanol (C8H10O)",
            "1-Nonanol (C9H20O)",
            "1-Butanol (C4H10O)",
            "2-Methyl-1-butanol (C5H12O)",
            "3-Methyl-1-butanol (C5H12O)",
            "2-Methyl-2-butanol (C5H12O) - not primary but included for clarity",
            "1-Propyl alcohol (n-propanol)",
            "1-Butyl alcohol (n-butanol)",
            "1-Pentanol (n-pentanol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "2-phenylethanol",
                "dodecan-1-ol",
                "undecan-1-ol"
            ],
            "mismatches": [
                "ethanol",
                "1-propanol",
                "1-butanol",
                "1-pentanol",
                "1-hexanol",
                "1-heptanol",
                "1-octanol",
                "1-nonanol",
                "1-decanol",
                "2-butanol",
                "benzyl alcohol",
                "2-pentanol",
                "1-phenylethanol",
                "2-methyl-1-butanol",
                "3-methyl-1-butanol",
                "2-methyl-2-butanol",
                "1-propyl alcohol",
                "1-butyl alcohol",
                "1-pentanol"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "1,5-dodecanediol",
                "1,7-decanediol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-Methyl-3-buten-1-ol",
                "2-butyl-1-octanol",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl decanoate",
                "2-methylpropane-1,2-diol",
                "2-phenylethanol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "6-oxo-nonan-1-ol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl undecanoate",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 4,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (MeOH)",
            "Ethanol (EtOH)",
            "1-Propanol (1-PrOH)",
            "1-Butanol (1-BuOH)",
            "1-Pentanol (1-PeOH)",
            "1-Hexanol (1-HexOH)",
            "1-Heptanol (1-HeptOH)",
            "1-Octanol (1-OctOH)",
            "1-Nonanol (1-NonOH)",
            "1-Decanol (1-DecOH)",
            "1-Undecanol (1-UndecOH)",
            "1-Dodecanol (1-DodOH)",
            "1-Tridecanol (1-TridOH)",
            "1-Tetradecanol (1-TetradOH)",
            "1-Pentadecanol (1-PentadOH)",
            "1-Hexadecanol (1-HexadOH)",
            "1-Heptadecanol (1-HeptadOH)",
            "1-Octadecanol (1-OctadOH)",
            "1-Nonadecanol (1-NonadOH)",
            "1-Eicosanol (1-EicosOH)",
            "1-Heneicosanol (1-HeneicOH)",
            "1-Docosanol (1-DocosOH)",
            "1-Tricosanol (1-TricOH)",
            "1-Tetracosanol (1-TetracOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Methanol (MeOH)",
                "Ethanol (EtOH)",
                "1-Propanol (1-PrOH)",
                "1-Butanol (1-BuOH)",
                "1-Pentanol (1-PeOH)",
                "1-Hexanol (1-HexOH)",
                "1-Heptanol (1-HeptOH)",
                "1-Octanol (1-OctOH)",
                "1-Nonanol (1-NonOH)",
                "1-Decanol (1-DecOH)",
                "1-Undecanol (1-UndecOH)",
                "1-Dodecanol (1-DodOH)",
                "1-Tridecanol (1-TridOH)",
                "1-Tetradecanol (1-TetradOH)",
                "1-Pentadecanol (1-PentadOH)",
                "1-Hexadecanol (1-HexadOH)",
                "1-Heptadecanol (1-HeptadOH)",
                "1-Octadecanol (1-OctadOH)",
                "1-Nonadecanol (1-NonadOH)",
                "1-Eicosanol (1-EicosOH)",
                "1-Heneicosanol (1-HeneicOH)",
                "1-Docosanol (1-DocosOH)",
                "1-Tricosanol (1-TricOH)",
                "1-Tetracosanol (1-TetracOH)"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "(3R)-3,13-dihydroxytridecanoic acid",
                "1,2-dodecanediol",
                "1,4-dodecanediol",
                "1,9-decanediol",
                "13-Docosenoic acid, methyl ester",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl hexadecanoate",
                "2-hydroxyethyl octadecanoate",
                "2-isopropyl-5-methyl-1-heptanol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "6-oxo-nonan-1-ol",
                "Methyl Hexacosanoate",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "docosan-1-ol",
                "dodecan-1-ol",
                "ethanol-d6",
                "ethanols",
                "ethyl (4Z,7Z,10Z,13Z,16Z)-henicosapentaenoate",
                "ethyl (4Z,7Z,10Z,13Z,16Z,19Z)-docosahexaenoate",
                "ethyl arachidonate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl 4,10-dimethyldodecanoate",
                "methyl henicosanoate",
                "methyl heptadecanoate",
                "methyl tetracosanoate",
                "methyl tricosanoate",
                "methyl undecanoate",
                "octan-1-ol",
                "pentadecan-1-ol",
                "pentan-1-ol",
                "propan-1-ol",
                "tetradecyl tetradecanoate",
                "tricosan-1-ol",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol",
            "Ethanol",
            "1-Propanol",
            "2-Propanol",
            "1-Butanol",
            "2-Butanol",
            "2-Methyl-2-propanol",
            "1-Pentanol",
            "2-Pentanol",
            "3-Pentanol",
            "1-Hexanol",
            "2-Hexanol",
            "3-Hexanol",
            "1-Heptanol",
            "2-Heptanol",
            "1-Octanol",
            "2-Octanol",
            "1-Nonanol",
            "2-Nonanol",
            "1-Decanol",
            "2-Decanol",
            "1-Dodecanol",
            "1-Tetradecanol",
            "1-Hexadecanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methanol",
                "Ethanol"
            ],
            "mismatches": [
                "1-Propanol",
                "2-Propanol",
                "1-Butanol",
                "2-Butanol",
                "2-Methyl-2-propanol",
                "1-Pentanol",
                "2-Pentanol",
                "3-Pentanol",
                "1-Hexanol",
                "2-Hexanol",
                "3-Hexanol",
                "1-Heptanol",
                "2-Heptanol",
                "1-Octanol",
                "2-Octanol",
                "1-Nonanol",
                "2-Nonanol",
                "1-Decanol",
                "2-Decanol",
                "1-Dodecanol",
                "1-Tetradecanol",
                "1-Hexadecanol"
            ],
            "true_referents": [
                "(+)-albicanol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl hexadecanoate",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl decanoate",
                "2-methylpropane-1,2-diol",
                "3-methylpentanol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol",
                "ethanols",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl hexanoate",
                "methyl tetradecanoate",
                "naphthylmethanol",
                "octan-1-ol",
                "pentan-1-ol",
                "propyl decanoate",
                "tetradecyl tetradecanoate"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH4O)",
            "Ethanol (C2H5OH)",
            "1-Propanol (n-Propanol)",
            "2-Methyl-1-propanol (Isobutanol)",
            "1-Butanol (n-Butanol)",
            "2-Methyl-1-butanol (Isopentyl alcohol)",
            "3-Methyl-1-butanol (Active amyl alcohol)",
            "1-Pentanol (n-Pentanol)",
            "2-Methyl-1-pentanol",
            "1-Hexanol (n-Hexanol)",
            "2-Methyl-1-hexanol",
            "1-Heptanol",
            "1-Octanol (n-Octanol)",
            "1-Nonanol (n-Nonanol)",
            "1-Decanol (n-Decanol)",
            "Benzyl alcohol (C6H5CH2OH)",
            "Allyl alcohol (CH2=CHCH2OH)",
            "Cinnamyl alcohol",
            "Phenethyl alcohol",
            "1-Phenyl-1-ethanol",
            "2-Phenyl-1-propanol",
            "3-Phenyl-1-propanol",
            "4-Methyl-1-pentanol",
            "3-Methyl-1-hexanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "isobutanol",
                "allyl alcohol",
                "cinnamyl alcohol"
            ],
            "mismatches": [
                "ethanol",
                "1-propanol",
                "2-methyl-1-butanol",
                "3-methyl-1-butanol",
                "1-pentanol",
                "2-methyl-1-pentanol",
                "1-hexanol",
                "2-methyl-1-hexanol",
                "1-heptanol",
                "1-octanol",
                "1-nonanol",
                "1-decanol",
                "benzyl alcohol",
                "phenethyl alcohol",
                "1-phenyl-1-ethanol",
                "2-phenyl-1-propanol",
                "3-phenyl-1-propanol",
                "4-methyl-1-pentanol",
                "3-methyl-1-hexanol"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(E)-cinnamyl alcohol",
                "(S)-2-methylbutan-1-ol",
                "(Z)-cinnamyl alcohol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-(2-hydroxyphenyl)ethanol",
                "2-(4-hydroxyphenyl)ethanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl butanoate",
                "2-methylbutyl hexanoate",
                "2-phenylethanol",
                "3,5-dimethylbenzyl alcohol",
                "3-Bromo-1-propanol",
                "3-Cyclohexene-1-ethanol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3-methylbutyl hexanoate",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "4-methylpentan-1-ol",
                "6-oxo-nonan-1-ol",
                "Methyl 5-methylhexanoate",
                "N-(decanoyl)ethanolamine",
                "N-(hexanoyl)ethanolamine",
                "N-(octanoyl)ethanolamine",
                "Pentane-1,5-diol",
                "allyl alcohol",
                "cinnamyl alcohol",
                "ethanol-d6",
                "ethanols",
                "ethyl heptanoate",
                "ethyl nonanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isobutanol",
                "isopentenyl alcohol",
                "methanol",
                "methanol-d1",
                "methyl 3-phenylpropanoate",
                "methyl hexanoate",
                "n-butyl oleate",
                "octan-1-ol",
                "pentan-1-ol",
                "phenethyl acetate",
                "phenethyl isobutyrate",
                "primary allylic alcohol"
            ],
            "TP": 4,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (CH3CH2OH)",
            "Methanol (CH3OH)",
            "1-Propanol (CH3CH2CH2OH)",
            "1-Butanol (CH3(CH2)3OH)",
            "1-Pentanol (CH3(CH2)4OH)",
            "1-Hexanol (CH3(CH2)5OH)",
            "1-Heptanol (CH3(CH2)6OH)",
            "1-Octanol (CH3(CH2)7OH)",
            "Allyl alcohol (CH2=CHCH2OH)",
            "Benzyl alcohol (C6H5CH2OH)",
            "Glycerol (HOCH2CH(OH)CH2OH)",
            "Sorbitol (HOCH2(CHOH)4CH2OH)",
            "Mannitol (HOCH2(CHOH)4CH2OH)",
            "Xylitol (HOCH2(CHOH)3CH2OH)",
            "Erythritol (HOCH2(CHOH)2CH2OH)",
            "Propargyl alcohol (HC\u2261CCH2OH)",
            "Cinnamyl alcohol (C6H5CH=CHCH2OH)",
            "Furfuryl alcohol (C4H3OCH2OH)",
            "Geraniol ((CH3)2C=CHCH2CH2C(CH3)=CHCH2OH)",
            "Citronellol ((CH3)2C=CHCH2CH2CH(CH3)CH2CH2OH)",
            "Cholesterol (C27H45OH)",
            "Retinol (Vitamin A alcohol)",
            "Serinol (HOCH2CH(NH2)CH2OH)",
            "Ethanolamine (HOCH2CH2NH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methanol (CH3OH)",
                "Allyl alcohol (CH2=CHCH2OH)",
                "Cinnamyl alcohol (C6H5CH=CHCH2OH)",
                "Furfuryl alcohol (C4H3OCH2OH)",
                "Geraniol ((CH3)2C=CHCH2CH2C(CH3)=CHCH2OH)",
                "Retinol (Vitamin A alcohol)",
                "Ethanolamine (HOCH2CH2NH2)"
            ],
            "mismatches": [
                "Ethanol (CH3CH2OH)",
                "1-Propanol (CH3CH2CH2OH)",
                "1-Butanol (CH3(CH2)3OH)",
                "1-Pentanol (CH3(CH2)4OH)",
                "1-Hexanol (CH3(CH2)5OH)",
                "1-Heptanol (CH3(CH2)6OH)",
                "1-Octanol (CH3(CH2)7OH)",
                "Benzyl alcohol (C6H5CH2OH)",
                "Glycerol (HOCH2CH(OH)CH2OH)",
                "Sorbitol (HOCH2(CHOH)4CH2OH)",
                "Mannitol (HOCH2(CHOH)4CH2OH)",
                "Xylitol (HOCH2(CHOH)3CH2OH)",
                "Erythritol (HOCH2(CHOH)2CH2OH)",
                "Propargyl alcohol (HC\u2261CCH2OH)",
                "Citronellol ((CH3)2C=CHCH2CH2CH(CH3)CH2CH2OH)",
                "Cholesterol (C27H45OH)",
                "Serinol (HOCH2CH(NH2)CH2OH)"
            ],
            "true_referents": [
                "(2S)-2,6-dimethylheptan-1-ol",
                "(3,4-dimethoxyphenyl)methanol",
                "(E)-cinnamyl alcohol",
                "(Z)-cinnamyl alcohol",
                "2,3,4-Trimethyl-1-pentanol",
                "2,6-dimethylheptan-1-ol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl octadecanoate",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "3,5-dimethoxy-4-hydroxybenzyl alcohol-4-O-beta-D-glucopyranoside",
                "3-Cyclopentyl-1-propanol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3-methylbutyl 2-hydroxypropanoate",
                "4-(hydroxymethyl)-2-propylfuran-3-carboxylic acid",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "4alpha-hydroxymethyl-5alpha-cholest-7-en-3beta-ol",
                "4beta-(hydroxymethyl)-4alpha-methyl-5alpha-cholest-7-en-3beta-ol",
                "6-[3]-ladderane-1-hexanol",
                "N-(2-hydroxyethyl)-beta-alanine",
                "N-(decanoyl)ethanolamine",
                "Pentane-1,5-diol",
                "all-trans-retinol",
                "allyl alcohol",
                "cinnamyl alcohol",
                "diethyl 2-methyl-3-hydroxysuccinate",
                "ethanol-d6",
                "ethanolamine",
                "ethanols",
                "ethyl (11Z)-docosenoate",
                "ethyl (R)-3-hydroxybutanoate",
                "ethyl (S)-3-hydroxyhexanoate",
                "ethyl 2-hydroxypropanoate",
                "ethyl octanoate",
                "furfuryl alcohol",
                "geraniol",
                "glycerone derivative",
                "hexyl hexanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl 3-(2-phenoxy-6-quinolyl)alaninate",
                "methyl N-(2,6-dimethylphenyl)-N-(methoxyacetyl)alaninate",
                "primary allylic alcohol",
                "retinol",
                "retinyl acetate",
                "tetrahydrofurfuryl alcohol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (MeOH)",
            "Ethanol (EtOH)",
            "1-Propanol (n-PrOH)",
            "1-Butanol (n-BuOH)",
            "1-Pentanol (n-AmOH)",
            "1-Hexanol (n-HexOH)",
            "1-Heptanol (n-HepOH)",
            "1-Octanol (n-OctOH)",
            "1-Nonanol",
            "1-Decanol",
            "1-Undecanol",
            "1-Dodecanol",
            "1-Tridecanol",
            "1-Tetradecanol",
            "1-Pentadecanol",
            "1-Hexadecanol",
            "1-Heptadecanol",
            "1-Octadecanol",
            "1-Nonadecanol",
            "1-Eicosanol",
            "1-Heneicosanol",
            "1-Docosanol",
            "1-Tricosanol",
            "1-Tetracosanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Methanol (MeOH)",
                "Ethanol (EtOH)",
                "1-Propanol (n-PrOH)",
                "1-Butanol (n-BuOH)",
                "1-Pentanol (n-AmOH)",
                "1-Hexanol (n-HexOH)",
                "1-Heptanol (n-HepOH)",
                "1-Octanol (n-OctOH)",
                "1-Nonanol",
                "1-Decanol",
                "1-Undecanol",
                "1-Dodecanol",
                "1-Tridecanol",
                "1-Tetradecanol",
                "1-Pentadecanol",
                "1-Hexadecanol",
                "1-Heptadecanol",
                "1-Octadecanol",
                "1-Nonadecanol",
                "1-Eicosanol",
                "1-Heneicosanol",
                "1-Docosanol",
                "1-Tricosanol",
                "1-Tetracosanol"
            ],
            "true_referents": [
                "(+)-albicanol",
                "(3,4-dimethoxyphenyl)methanol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-O-dodecylglycerol",
                "13-Docosenoic acid, methyl ester",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl hexadecanoate",
                "2-hydroxyethyl octadecanoate",
                "3-methoxy-1-butanol",
                "Methyl Hexacosanoate",
                "N-(docosanoyl)ethanolamine",
                "N-(hexanoyl)ethanolamine",
                "Pentadecanoyl-EA",
                "Pentane-1,5-diol",
                "Tricosanoyl-EA",
                "all-trans-undecaprenol",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl (4Z,7Z,10Z,13Z,16Z)-henicosapentaenoate",
                "ethyl 3-hydroxytridecanoate",
                "ethyl arachidonate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "ethyl octanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl arachidonate",
                "methyl henicosanoate",
                "methyl heptadecanoate",
                "methyl nonadecanoate",
                "methyl tetracosanoate",
                "methyl tetradecanoate",
                "methyl tricosanoate",
                "methyl tridecanoate",
                "pentadecan-1-ol",
                "propan-1-ol",
                "tetracosan-1-ol",
                "tetradecyl tetradecanoate",
                "tricosan-1-ol",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (CH3CH2OH)",
            "1-Propanol (CH3CH2CH2OH)",
            "1-Butanol (CH3(CH2)2CH2OH)",
            "1-Pentanol (CH3(CH2)3CH2OH)",
            "1-Hexanol (CH3(CH2)4CH2OH)",
            "1-Heptanol (CH3(CH2)5CH2OH)",
            "1-Octanol (CH3(CH2)6CH2OH)",
            "1-Nonanol (CH3(CH2)7CH2OH)",
            "1-Decanol (CH3(CH2)8CH2OH)",
            "1-Undecanol (CH3(CH2)9CH2OH)",
            "1-Dodecanol (CH3(CH2)10CH2OH)",
            "Benzyl alcohol (C6H5CH2OH)",
            "2-Phenylethanol (C6H5CH2CH2OH)",
            "3-Phenyl-1-propanol (C6H5CH2CH2CH2OH)",
            "Cyclohexanemethanol (C6H11CH2OH)",
            "2-Methylcyclohexanemethanol ((CH3)C6H10CH2OH)",
            "2-Ethylhexan-1-ol (CH3(CH2)3CH(C2H5)CH2OH)",
            "Isobutanol ((CH3)2CHCH2OH)",
            "tert-Butanol ((CH3)3COH)",
            "Allyl alcohol (CH2=CHCH2OH)",
            "2-Propen-1-ol (CH2=CHCH2OH)",
            "3-Buten-1-ol (CH2=CHCH2CH2OH)",
            "2-Buten-1-ol (CH3CH=CHCH2OH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "2-phenylethanol",
                "2-ethylhexan-1-ol",
                "isobutanol",
                "allyl alcohol",
                "3-buten-1-ol",
                "2-buten-1-ol"
            ],
            "mismatches": [
                "ethanol",
                "1-propanol",
                "1-butanol",
                "1-pentanol",
                "1-hexanol",
                "1-heptanol",
                "1-octanol",
                "1-nonanol",
                "1-decanol",
                "1-undecanol",
                "1-dodecanol",
                "benzyl alcohol",
                "3-phenyl-1-propanol",
                "cyclohexanemethanol",
                "2-methylcyclohexanemethanol",
                "tert-butanol",
                "2-propen-1-ol"
            ],
            "true_referents": [
                "(2-methyl-4,5-ditridecyl-1,4-cyclohexadienyl)methanol",
                "(2E,4E)-2,4-hexadien-1-ol",
                "(3,4-dimethoxyphenyl)methanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "(S)-2-methylbutan-1-ol",
                "1-hydroxy-5-phenyl-3-pentanone",
                "2,3,4-Trimethyl-1-pentanol",
                "2-(2-hydroxyphenyl)ethanol",
                "2-Buten-1-ol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-Methyl-2-buten-1-ol",
                "2-Methyl-3-buten-1-ol",
                "2-butyl-1-octanol",
                "2-ethylhexan-1-ol",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-phenoxyethanol",
                "2-phenylethanol",
                "3-Buten-1-ol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "4-methylcyclohexanemethanol",
                "Cyclohex-2-enylmethanol",
                "Methyl 9-undecenoate",
                "Pentane-1,5-diol",
                "allyl alcohol",
                "ethanol-d6",
                "ethanols",
                "ethyl (R)-3-hydroxybutanoate",
                "ethyl (R)-3-hydroxyhexanoate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isobutanol",
                "methanol",
                "methanol-d1",
                "methyl 4,10-dimethyldodecanoate",
                "methyl 4,9-dimethyldecanoate",
                "primary allylic alcohol",
                "propan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (MeOH)",
            "Ethanol (EtOH)",
            "1-Propanol (1-PrOH)",
            "1-Butanol (1-BuOH)",
            "1-Pentanol (1-PeOH)",
            "1-Hexanol (1-HexOH)",
            "1-Heptanol (1-HepOH)",
            "1-Octanol (1-OctOH)",
            "1-Nonanol (1-NonOH)",
            "1-Decanol (1-DecOH)",
            "1-Undecanol (1-UndOH)",
            "1-Dodecanol (1-DodOH)",
            "1-Tridecanol (1-TridOH)",
            "1-Tetradecanol (1-TetradOH)",
            "1-Pentadecanol (1-PentadOH)",
            "1-Hexadecanol (1-HexadOH)",
            "1-Heptadecanol (1-HeptadOH)",
            "1-Octadecanol (1-OctadOH)",
            "1-Nonadecanol (1-NonadOH)",
            "1-Eicosanol (1-EicosOH)",
            "1-Heneicosanol (1-HeneicosOH)",
            "1-Docosanol (1-DocosOH)",
            "1-Tricosanol (1-TricosOH)",
            "1-Tetracosanol (1-TetracosOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "propan-1-ol",
                "pentan-1-ol",
                "tricosan-1-ol"
            ],
            "mismatches": [
                "ethanol",
                "1-butanol",
                "1-pentanol",
                "1-hexanol",
                "1-heptanol",
                "1-octanol",
                "1-nonanol",
                "1-decanol",
                "1-undecanol",
                "1-dodecanol",
                "1-tridecanol",
                "1-tetradecanol",
                "1-pentadecanol",
                "1-hexadecanol",
                "1-heptadecanol",
                "1-octadecanol",
                "1-nonadecanol",
                "1-eicosanol",
                "1-heneicosanol",
                "1-docosanol",
                "1-tetracosanol"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "(3R)-3,13-dihydroxytridecanoic acid",
                "1,2-dodecanediol",
                "1,4-dodecanediol",
                "1,9-decanediol",
                "13-Docosenoic acid, methyl ester",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl hexadecanoate",
                "2-hydroxyethyl octadecanoate",
                "2-methyl-2-hydroxy-1-propanol",
                "3,5-dimethoxy-4-hydroxybenzyl alcohol-4-O-beta-D-glucopyranoside",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "6-oxo-nonan-1-ol",
                "Pentane-1,5-diol",
                "all-trans-undecaprenol",
                "butyl butanoate",
                "docosan-1-ol",
                "dodecan-1-ol",
                "ethanol-d6",
                "ethanols",
                "ethyl (4Z,7Z,10Z,13Z,16Z)-henicosapentaenoate",
                "ethyl (4Z,7Z,10Z,13Z,16Z,19Z)-docosahexaenoate",
                "ethyl arachidonate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "heptan-1-ol",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl 4,10-dimethyldodecanoate",
                "methyl henicosanoate",
                "methyl heptadecanoate",
                "methyl tetracosanoate",
                "octan-1-ol",
                "pentadecan-1-ol",
                "pentan-1-ol",
                "propan-1-ol",
                "tetracosan-1-ol",
                "tetradecyl tetradecanoate",
                "tricosan-1-ol",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 4,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (EtOH)",
            "Glycerol",
            "Glyceraldehyde",
            "Dihydroxyacetone",
            "Sorbitol",
            "Xylitol",
            "Arabinose",
            "Rhamnose",
            "Fucose",
            "Galactose",
            "Glucose",
            "Mannose",
            "Fructose",
            "Ribose",
            "Adipic acid",
            "Pentaerythritol",
            "Cetyl alcohol",
            "Stearyl alcohol",
            "Oleyl alcohol",
            "Linoleyl alcohol",
            "Linolenyl alcohol",
            "Eicosanoid",
            "Prostaglandin",
            "Cholesterol",
            "Erythritol",
            "Xylaric acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dihydroxyacetone",
                "Pentaerythritol"
            ],
            "mismatches": [
                "Ethanol (EtOH)",
                "Glycerol",
                "Glyceraldehyde",
                "Sorbitol",
                "Xylitol",
                "Arabinose",
                "Rhamnose",
                "Fucose",
                "Galactose",
                "Glucose",
                "Mannose",
                "Fructose",
                "Ribose",
                "Adipic acid",
                "Cetyl alcohol",
                "Stearyl alcohol",
                "Oleyl alcohol",
                "Linoleyl alcohol",
                "Linolenyl alcohol",
                "Eicosanoid",
                "Prostaglandin",
                "Cholesterol",
                "Erythritol",
                "Xylaric acid"
            ],
            "true_referents": [
                "(3S,4R)-Ketose 1-phosphate",
                "(beta-D-glucopyranosyloxymethyl)deoxyuridine",
                "(beta-D-glucopyranosyloxymethyl)deoxyuridine 5'-monophosphate",
                "11beta-prostaglandin F2alpha ethanolamide",
                "3,5-dimethoxy-4-hydroxybenzyl alcohol-4-O-beta-D-glucopyranoside",
                "4-amino-4-deoxy-alpha-L-arabinopyranosyl undecaprenyl phosphate",
                "8-demethyl-8-(2-O-methyl-alpha-L-rhamnosyl)tetracenomycin C",
                "8-demethyl-8-(alpha-L-rhamnosyl)tetracenomycin C",
                "Adifoline",
                "Dimethyl adipate",
                "Methyl Hexacosanoate",
                "Methyl stearate",
                "aspartame",
                "bis(2-ethylhexyl) adipate",
                "dihydroxyacetone",
                "ethanol-d6",
                "ethanols",
                "ethyl (11Z)-docosenoate",
                "ethyl arachidonate",
                "ethyl butyrate",
                "ethyl ester",
                "ethyl glyoxylate",
                "ethyl isobutyrate",
                "ethyl linoleate",
                "ethyl linolenate",
                "ethyl sorbate",
                "glycerone derivative",
                "glycidol",
                "glycolic acid",
                "hydroxyacetone",
                "isopentenyl alcohol",
                "methanol",
                "methyl 9-(alpha-D-galactosyloxy)nonanoate",
                "methyl D-glucopyranuronate",
                "methyl arachidate",
                "methyl arachidonate",
                "methyl beta-D-glucopyranuronate",
                "methyl ester",
                "methyl pyruvate",
                "oleyl acetate",
                "oleyl oleate",
                "pentaerythritol",
                "pentaerythritol dinitrate",
                "pentyl acetate",
                "phosphoglycolohydroxamic acid",
                "propyl butyrate",
                "prostaglandin H2 1-ethanolamide",
                "retinol",
                "stearyl oleate",
                "stearyl palmitate",
                "triethylene glycol"
            ],
            "TP": 2,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (MeOH)",
            "Ethanol (EtOH)",
            "1-Propanol (n-PrOH)",
            "Isopropanol (i-PrOH)",
            "1-Butanol (n-BuOH)",
            "Isobutanol (i-BuOH)",
            "1-Pentanol (n-PeOH)",
            "2-Methyl-1-propanol",
            "1-Hexanol (n-HexOH)",
            "1-Heptanol (n-HepOH)",
            "1-Octanol (n-OctOH)",
            "1-Nonanol (n-NonOH)",
            "1-Decanol (n-DecOH)",
            "Benzyl alcohol",
            "Furfuryl alcohol",
            "Cinnamyl alcohol",
            "Vanillyl alcohol",
            "Salicyl alcohol",
            "Mandelic acid",
            "Glycolic acid",
            "Lactic acid",
            "Retinol",
            "Cholesterol",
            "Ergosterol",
            "Sitosterol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "isobutanol",
                "furfuryl alcohol",
                "cinnamyl alcohol",
                "salicyl alcohol",
                "glycolic acid",
                "retinol"
            ],
            "mismatches": [
                "Methanol (MeOH)",
                "Ethanol (EtOH)",
                "1-Propanol (n-PrOH)",
                "Isopropanol (i-PrOH)",
                "1-Butanol (n-BuOH)",
                "1-Pentanol (n-PeOH)",
                "2-Methyl-1-propanol",
                "1-Hexanol (n-HexOH)",
                "1-Heptanol (n-HepOH)",
                "1-Octanol (n-OctOH)",
                "1-Nonanol (n-NonOH)",
                "1-Decanol (n-DecOH)",
                "Benzyl alcohol",
                "Vanillyl alcohol",
                "Mandelic acid",
                "Lactic acid",
                "Cholesterol",
                "Ergosterol",
                "Sitosterol"
            ],
            "true_referents": [
                "(24Z),26-hydroxydesmosterol",
                "(3,4-dimethoxyphenyl)methanol",
                "(3R,3aS,6aR)-hexahydrofuro[2,3-b]furan-3-yl glycolate",
                "(E)-cinnamyl alcohol",
                "(Z)-cinnamyl alcohol",
                "1,9-decanediol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl salicylate",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl decanoate",
                "2-methylpropane-1,2-diol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3beta-hydroxy-4alpha-hydroxymethyl-4beta-methylsteroid",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "6-oxo-nonan-1-ol",
                "Methyl stearate",
                "N-(hexanoyl)ethanolamine",
                "Pentane-1,5-diol",
                "\\{4-[(Vinyloxy)methyl]cyclohexyl\\}methanol",
                "all-trans-retinol",
                "butyl butanoate",
                "cinnamyl alcohol",
                "diethyl maleate",
                "ethanol-d6",
                "ethanols",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl decanoate",
                "ethyl glyoxylate",
                "ethyl heptanoate",
                "ethyl isobutyrate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "farnesol",
                "furfuryl alcohol",
                "gentisyl alcohol",
                "glycolic acid",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "isobutanol",
                "isobutyl acetate",
                "isobutyl decanoate",
                "isobutyl hexanoate",
                "methanol",
                "methanol-d1",
                "methyl arachidate",
                "methyl arachidonate",
                "methyl salicylate",
                "pentan-1-ol",
                "propan-1-ol",
                "retinol",
                "retinyl acetate",
                "salicyl alcohol",
                "tetrahydrofurfuryl alcohol",
                "veratryl alcohol methyl ether"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Propan-1-ol",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane",
            "1-Propanol",
            "1-Hydroxypropane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Propan-1-ol",
                "1-Propanol"
            ],
            "mismatches": [
                "1-Hydroxypropane"
            ],
            "true_referents": [
                "3-methylbutyl 2-hydroxypropanoate",
                "ethyl 2-hydroxypropanoate",
                "hexyl propanoate",
                "propan-1-ol",
                "propan-1-ols",
                "propyl decanoate"
            ],
            "TP": 2,
            "FP": 1,
            "FN": 0
        }
    }
]