[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (Isopropanol)",
            "1-Propanol",
            "2-Methyl-2-propanol (Tertiary Butyl Alcohol)",
            "2-Methyl-1-propanol",
            "2,2-Dimethyl-1-propanol",
            "2,2-Dimethyl-1,3-propanediol (Pinacol)",
            "2,2-Dimethyl-1,3-propanediol (Pinacolone)",
            "2,2-Dimethyl-1,3-propanediol (Pinacolone Derivatives)",
            "2,2-Dimethyl-1,3-propanediol (Pinacolone Derivative)",
            "1,1-Dimethyl-1-propanol",
            "1,1-Dimethyl-2-propanol",
            "1,1-Dimethyl-3-propanol",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivatives)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)",
            "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "2-Propanol (Isopropanol)",
                "1-Propanol",
                "2-Methyl-2-propanol (Tertiary Butyl Alcohol)",
                "2-Methyl-1-propanol",
                "2,2-Dimethyl-1-propanol",
                "2,2-Dimethyl-1,3-propanediol (Pinacol)",
                "2,2-Dimethyl-1,3-propanediol (Pinacolone)",
                "2,2-Dimethyl-1,3-propanediol (Pinacolone Derivatives)",
                "2,2-Dimethyl-1,3-propanediol (Pinacolone Derivative)",
                "1,1-Dimethyl-1-propanol",
                "1,1-Dimethyl-2-propanol",
                "1,1-Dimethyl-3-propanol",
                "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol)",
                "2,2-Dimethyl-1-propanol (Di-t-butyl Alcohol Derivative)"
            ],
            "true_referents": [
                "(S)-2-methylbutan-1-ol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl decanoate",
                "2-methylene-1,4-butanediol",
                "2-methylpropane-1,2-diol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "hexyl propanoate",
                "propyl decanoate"
            ],
            "TP": 0,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (EtOH)",
            "1-Propanol (n-PrOH)",
            "2-Propanol (Isopropanol, i-PrOH)",
            "1-Butanol (n-Butanol, n-BuOH)",
            "2-Butanol (Sec-Butanol, s-BuOH)",
            "1-Pentanol (n-Pentanol, n-Pentyl alcohol)",
            "2-Pentanol (Methylbutan-2-ol)",
            "1-Hexanol (n-Hexanol, n-Hexyl alcohol)",
            "2-Hexanol (Methylpentan-2-ol)",
            "1-Heptanol (n-Heptanol, n-Heptyl alcohol)",
            "2-Heptanol (Methylhexan-2-ol)",
            "1-Octanol (n-Octanol, n-Octyl alcohol)",
            "2-Octanol (Methylheptan-2-ol)",
            "1-Nonanol (n-Nonanol, n-Nonyl alcohol)",
            "2-Nonanol (Methyloctan-2-ol)",
            "1-Decanol (n-Decanol, n-Decyl alcohol)",
            "2-Decanol (Methylnonan-2-ol)",
            "1-Undecanol (n-Undecanol, n-Undecyl alcohol)",
            "2-Undecanol (Methyldecan-2-ol)",
            "1-Dodecanol (n-Dodecanol, n-Dodecyl alcohol)",
            "2-Dodecanol (Methylundecan-2-ol)",
            "1-Tridecanol (n-Tridecanol, n-Tridecyl alcohol)",
            "2-Tridecanol (Methyldodecan-2-ol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ethanol (EtOH)",
                "1-Propanol (n-PrOH)",
                "2-Propanol (Isopropanol, i-PrOH)",
                "1-Butanol (n-Butanol, n-BuOH)",
                "2-Butanol (Sec-Butanol, s-BuOH)",
                "1-Pentanol (n-Pentanol, n-Pentyl alcohol)",
                "2-Pentanol (Methylbutan-2-ol)",
                "1-Hexanol (n-Hexanol, n-Hexyl alcohol)",
                "2-Hexanol (Methylpentan-2-ol)",
                "1-Heptanol (n-Heptanol, n-Heptyl alcohol)",
                "2-Heptanol (Methylhexan-2-ol)",
                "1-Octanol (n-Octanol, n-Octyl alcohol)",
                "2-Octanol (Methylheptan-2-ol)",
                "1-Nonanol (n-Nonanol, n-Nonyl alcohol)",
                "2-Nonanol (Methyloctan-2-ol)",
                "1-Decanol (n-Decanol, n-Decyl alcohol)",
                "2-Decanol (Methylnonan-2-ol)",
                "1-Undecanol (n-Undecanol, n-Undecyl alcohol)",
                "2-Undecanol (Methyldecan-2-ol)",
                "1-Dodecanol (n-Dodecanol, n-Dodecyl alcohol)",
                "2-Dodecanol (Methylundecan-2-ol)",
                "1-Tridecanol (n-Tridecanol, n-Tridecyl alcohol)",
                "2-Tridecanol (Methyldodecan-2-ol)"
            ],
            "true_referents": [
                "(2R)-2,6-dimethylheptan-1-ol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "(6S)-6-methyloctan-1-ol",
                "(S)-2-methylbutan-1-ol",
                "1,2-dodecanediol",
                "11-methyldodecan-1-ol",
                "2,3,4-Trimethyl-1-pentanol",
                "2,6-dimethylheptan-1-ol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-Methylenebutan-1-ol",
                "2-butyl-1-octanol",
                "2-ethylhexan-1-ol",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutan-1-ol",
                "2-methylbutyl butanoate",
                "2-methylpropane-1,2-diol",
                "3,7,11-trimethyldodecan-1-ol",
                "3-methoxy-1-butanol",
                "4-methylpentan-1-ol",
                "6-oxo-nonan-1-ol",
                "9-methyldecan-1-ol",
                "N-(decanoyl)ethanolamine",
                "N-(dodecanoyl)ethanolamine",
                "N-(hexanoyl)ethanolamine",
                "N-(tetradecanoyl)ethanolamine",
                "Pentane-1,5-diol",
                "Unsaturated alcohol",
                "butyl butanoate",
                "decan-1-ol",
                "dodecan-1-ol",
                "ethanol-d6",
                "ethanols",
                "ethyl dodec-2-enoate",
                "ethyl heptanoate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "hexan-1-ol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "methanol",
                "octan-1-ol",
                "propan-1-ol",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 0,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "1-Propanol (C3H7OH)",
            "2-Propanol (C3H7OH)",
            "1-Butanol (C4H9OH)",
            "2-Butanol (C4H9OH)",
            "Isobutanol (C4H9OH)",
            "Tert-Butanol (C4H9OH)",
            "1-Pentanol (C5H11OH)",
            "2-Pentanol (C5H11OH)",
            "3-Pentanol (C5H11OH)",
            "Cyclopentanol (C5H9OH)",
            "1-Hexanol (C6H13OH)",
            "2-Hexanol (C6H13OH)",
            "3-Hexanol (C6H13OH)",
            "Cyclohexanol (C6H11OH)",
            "1-Heptanol (C7H15OH)",
            "2-Heptanol (C7H15OH)",
            "3-Heptanol (C7H15OH)",
            "4-Heptanol (C7H15OH)",
            "1-Octanol (C8H17OH)",
            "2-Octanol (C8H17OH)",
            "3-Octanol (C8H17OH)",
            "4-Octanol (C8H17OH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Isobutanol"
            ],
            "mismatches": [
                "Methanol (CH3OH)",
                "Ethanol (C2H5OH)",
                "1-Propanol (C3H7OH)",
                "2-Propanol (C3H7OH)",
                "1-Butanol (C4H9OH)",
                "2-Butanol (C4H9OH)",
                "Tert-Butanol (C4H9OH)",
                "1-Pentanol (C5H11OH)",
                "2-Pentanol (C5H11OH)",
                "3-Pentanol (C5H11OH)",
                "Cyclopentanol (C5H9OH)",
                "1-Hexanol (C6H13OH)",
                "2-Hexanol (C6H13OH)",
                "3-Hexanol (C6H13OH)",
                "Cyclohexanol (C6H11OH)",
                "1-Heptanol (C7H15OH)",
                "2-Heptanol (C7H15OH)",
                "3-Heptanol (C7H15OH)",
                "4-Heptanol (C7H15OH)",
                "1-Octanol (C8H17OH)",
                "2-Octanol (C8H17OH)",
                "3-Octanol (C8H17OH)",
                "4-Octanol (C8H17OH)"
            ],
            "true_referents": [
                "(1S,2S)-3-oxo-2-(2Z-pentenyl)cyclopentane-1-butyric acid methyl ester",
                "(2-methyl-4,5-ditridecyl-1,4-cyclohexadienyl)methanol",
                "(3,4-dimethoxyphenyl)methanol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "3-Cyclohexene-1-ethanol",
                "3-Cyclopentyl-1-propanol",
                "3-ethoxy-1-propanol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl 3-oxohexanoate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl isobutyrate",
                "ethyl octanoate",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "isobutanol",
                "isobutyl acetate",
                "methanol",
                "methanol-d1"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (EtOH)",
            "2-Propanol (IPA)",
            "1-Butanol (BuOH)",
            "2-Butanol (sec-BuOH)",
            "3-Methyl-1-Butanol (isoamyl alcohol)",
            "2-Methyl-2-Propanol (tert-Butyl alcohol)",
            "1-Pentanol (Amyl alcohol)",
            "2-Pentanol",
            "3-Pentanol",
            "2-Methyl-1-Butanol",
            "3-Methyl-2-Butanol",
            "1-Hexanol",
            "2-Hexanol",
            "3-Hexanol",
            "Cyclohexanol (CyOH)",
            "4-Methyl-2-Pentanol",
            "2-Ethyl-1-Butanol",
            "1-Heptanol",
            "2-Heptanol",
            "3-Heptanol",
            "1-Octanol",
            "2-Octanol",
            "2,2-Dimethyl-1-Propanol (Neopentyl alcohol)",
            "3-Ethyl-3-Pentanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ethanol (EtOH)",
                "2-Propanol (IPA)",
                "1-Butanol (BuOH)",
                "2-Butanol (sec-BuOH)",
                "3-Methyl-1-Butanol (isoamyl alcohol)",
                "2-Methyl-2-Propanol (tert-Butyl alcohol)",
                "1-Pentanol (Amyl alcohol)",
                "2-Pentanol",
                "3-Pentanol",
                "2-Methyl-1-Butanol",
                "3-Methyl-2-Butanol",
                "1-Hexanol",
                "2-Hexanol",
                "3-Hexanol",
                "Cyclohexanol (CyOH)",
                "4-Methyl-2-Pentanol",
                "2-Ethyl-1-Butanol",
                "1-Heptanol",
                "2-Heptanol",
                "3-Heptanol",
                "1-Octanol",
                "2-Octanol",
                "2,2-Dimethyl-1-Propanol (Neopentyl alcohol)",
                "3-Ethyl-3-Pentanol"
            ],
            "true_referents": [
                "(S)-2-methylbutan-1-ol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-ethoxyethanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl butanoate",
                "2-methylbutyl decanoate",
                "2-methylpropane-1,2-diol",
                "3,4-dimethylbenzyl alcohol",
                "3-Cyclohexene-1-ethanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3-methylbutyl octanoate",
                "3-methylpentanol",
                "4-methylpentan-1-ol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl 3-oxohexanoate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl octanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "methanol",
                "methyl hexanoate",
                "octan-1-ol",
                "propyl decanoate"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "Propanol (C3H7OH)",
            "Butanol (C4H9OH)",
            "Isopropanol (C3H8O)",
            "Pentanol (C5H11OH)",
            "Hexanol (C6H13OH)",
            "Heptanol (C7H15OH)",
            "Octanol (C8H17OH)",
            "Nonanol (C9H19OH)",
            "Decanol (C10H21OH)",
            "Undecanol (C11H23OH)",
            "Dodecanol (C12H25OH)",
            "Tridecanol (C13H27OH)",
            "Tetradecanol (C14H29OH)",
            "Pentadecanol (C15H31OH)",
            "Hexadecanol (C16H33OH)",
            "Heptadecanol (C17H35OH)",
            "Octadecanol (C18H37OH)",
            "Nonadecanol (C19H39OH)",
            "Eicosanol (C20H41OH)",
            "Isobutanol (C4H10O)",
            "Isopentanol (C5H12O)",
            "Neopentanol (C5H12O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Isobutanol"
            ],
            "mismatches": [
                "Methanol (CH3OH)",
                "Ethanol (C2H5OH)",
                "Propanol (C3H7OH)",
                "Butanol (C4H9OH)",
                "Isopropanol (C3H8O)",
                "Pentanol (C5H11OH)",
                "Hexanol (C6H13OH)",
                "Heptanol (C7H15OH)",
                "Octanol (C8H17OH)",
                "Nonanol (C9H19OH)",
                "Decanol (C10H21OH)",
                "Undecanol (C11H23OH)",
                "Dodecanol (C12H25OH)",
                "Tridecanol (C13H27OH)",
                "Tetradecanol (C14H29OH)",
                "Pentadecanol (C15H31OH)",
                "Hexadecanol (C16H33OH)",
                "Heptadecanol (C17H35OH)",
                "Octadecanol (C18H37OH)",
                "Nonadecanol (C19H39OH)",
                "Eicosanol (C20H41OH)",
                "Isopentanol (C5H12O)",
                "Neopentanol (C5H12O)"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "1,5-dodecanediol",
                "1,7-decanediol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl octadecanoate",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylpropane-1,2-diol",
                "3-ethoxy-1-propanol",
                "3-methylpentanol",
                "5-hydroxypentan-2-one",
                "6-oxo-nonan-1-ol",
                "9R-hydroxy-10E,12E-octadecadienoic acid, methyl ester",
                "Methyl 9,11-epidioxy-12,15-dihydroperoxy-5,7,13-eicosatrienoate",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl 3-hydroxytridecanoate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl hexanoate",
                "ethyl isobutyrate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "ethyl octanoate",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "isobutanol",
                "isobutyl acetate",
                "methanol",
                "methanol-d1",
                "methyl 4,9-dimethyldecanoate",
                "methyl 5-hydroperoxy-6,8,9,11-bisepidioxy-12,14-eicosadienoate",
                "methyl 6,8-epidioxy-5,15-dihydroperoxy-9,11,13-eicosatrienoate",
                "methyl heptadecanoate",
                "methyl undecanoate",
                "pentadecan-1-ol",
                "tetradecyl tetradecanoate",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (EtOH)",
            "Propan-1-ol (1-Propanol)",
            "Butan-1-ol (1-Butanol)",
            "Pentanol (Pentyl alcohol)",
            "Hexan-1-ol (1-Hexanol)",
            "Heptan-1-ol (1-Heptanol)",
            "Octan-1-ol (1-Octanol)",
            "Nonan-1-ol (1-Nonanol)",
            "Decan-1-ol (1-Decanol)",
            "Cyclopropanol (Cyclopropyl alcohol)",
            "Cyclobutanol (Cyclobutyl alcohol)",
            "Cyclopentanol (Cyclopentyl alcohol)",
            "Cyclohexanol (Cyclohexyl alcohol)",
            "Phenol (Hydroxybenzene)",
            "Glycerol (Glycerin)",
            "2-Propanol (Isopropanol)",
            "2-Butanol (Sec-butanol)",
            "3-Pentanol (3-Pentanol)",
            "2-Pentanol (2-Pentanol)",
            "2-Hexanol (2-Hexanol)",
            "3-Hexanol (3-Hexanol)",
            "3-Octanol (3-Octanol)",
            "1-Butanol (Butyl alcohol)",
            "1-Pentanol (Pentyl alcohol)",
            "1-Hexanol (Hexyl alcohol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Propan-1-ol (1-Propanol)",
                "Butan-1-ol (1-Butanol)",
                "Hexan-1-ol (1-Hexanol)",
                "Heptan-1-ol (1-Heptanol)",
                "Octan-1-ol (1-Octanol)",
                "Nonan-1-ol (1-Nonanol)",
                "Decan-1-ol (1-Decanol)"
            ],
            "mismatches": [
                "Ethanol (EtOH)",
                "Pentanol (Pentyl alcohol)",
                "Cyclopropanol (Cyclopropyl alcohol)",
                "Cyclobutanol (Cyclobutyl alcohol)",
                "Cyclopentanol (Cyclopentyl alcohol)",
                "Cyclohexanol (Cyclohexyl alcohol)",
                "Phenol (Hydroxybenzene)",
                "Glycerol (Glycerin)",
                "2-Propanol (Isopropanol)",
                "2-Butanol (Sec-butanol)",
                "3-Pentanol (3-Pentanol)",
                "2-Pentanol (2-Pentanol)",
                "2-Hexanol (2-Hexanol)",
                "3-Hexanol (3-Hexanol)",
                "3-Octanol (3-Octanol)",
                "1-Butanol (Butyl alcohol)",
                "1-Pentanol (Pentyl alcohol)",
                "1-Hexanol (Hexyl alcohol)"
            ],
            "true_referents": [
                "(1S,2S)-3-oxo-2-(2Z-pentenyl)cyclopentane-1-butyric acid methyl ester",
                "(2-methyl-4,5-ditridecyl-1,4-cyclohexadienyl)methanol",
                "(E)-3-decen-1-ol",
                "1-O-dodecylglycerol",
                "2,3,4-Trimethyl-1-pentanol",
                "2,6-dimethylheptan-1-ol",
                "2-(cyclohex-2-en-1-yl)ethanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-ethylhexan-1-ol",
                "2-hexen-1-ol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl butanoate",
                "2-methylbutyl hexanoate",
                "2-methylpropane-1,2-diol",
                "3-Cyclohexene-1-ethanol",
                "3-Cyclopentyl-1-propanol",
                "3-ethoxy-1-propanol",
                "3-methylbutyl hexanoate",
                "4-chlorobutanol",
                "6-oxo-nonan-1-ol",
                "Pentane-1,5-diol",
                "butan-1-ol",
                "butyl butanoate",
                "decan-1-ol",
                "ethanol-d6",
                "ethanols",
                "ethyl 3,4-dihydroxybenzoate",
                "ethyl 3-hexenoate",
                "ethyl hydroxy(phenyl)acetate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "glycerone derivative",
                "heptan-1-ol",
                "hexan-1-ol",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isopentenyl alcohol",
                "methanol",
                "nonan-1-ol",
                "octacosan-1-ol",
                "octan-1-ol",
                "pentyl propanoate",
                "propan-1-ol",
                "propan-1-ols",
                "triethylene glycol"
            ],
            "TP": 7,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "Propanol (C3H7OH)",
            "Butanol (C4H9OH)",
            "Pentanol (C5H11OH)",
            "Hexanol (C6H13OH)",
            "Heptanol (C7H15OH)",
            "Octanol (C8H17OH)",
            "Nonanol (C9H19OH)",
            "Decanol (C10H21OH)",
            "Undecanol (C11H23OH)",
            "Dodecanol (C12H25OH)",
            "Tridecanol (C13H27OH)",
            "Tetradecanol (C14H29OH)",
            "Pentadecanol (C15H31OH)",
            "Hexadecanol (C16H33OH)",
            "Heptadecanol (C17H35OH)",
            "Octadecanol (C18H37OH)",
            "Nonadecanol (C19H39OH)",
            "Eicosanol (C20H41OH)",
            "Heneicosanol (C21H43OH)",
            "Docosanol (C22H45OH)",
            "Tricosanol (C23H47OH)",
            "Tetracosanol (C24H49OH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "undecan-1-ol",
                "dodecan-1-ol",
                "pentadecan-1-ol"
            ],
            "mismatches": [
                "ethanol",
                "propanol",
                "butanol",
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "tridecanol",
                "tetradecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "eicosanol",
                "heneicosanol",
                "docosanol",
                "tricosanol",
                "tetracosanol"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "1,5-dodecanediol",
                "1,7-decanediol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl octadecanoate",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "3,5-dimethoxy-4-hydroxybenzyl alcohol-4-O-beta-D-glucopyranoside",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "6-oxo-nonan-1-ol",
                "9R-hydroxy-10E,12E-octadecadienoic acid, methyl ester",
                "Methyl 9,11-epidioxy-12,15-dihydroperoxy-5,7,13-eicosatrienoate",
                "Methyl Hexacosanoate",
                "N-(docosanoyl)ethanolamine",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl (11Z)-docosenoate",
                "ethyl (4Z,7Z,10Z,13Z,16Z)-henicosapentaenoate",
                "ethyl 3-hydroxytridecanoate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "ethyl octanoate",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl 4,9-dimethyldecanoate",
                "methyl 5-hydroperoxy-6,8,9,11-bisepidioxy-12,14-eicosadienoate",
                "methyl 6,8-epidioxy-5,15-dihydroperoxy-9,11,13-eicosatrienoate",
                "methyl henicosanoate",
                "methyl heptadecanoate",
                "methyl tetracosanoate",
                "methyl tricosanoate",
                "methyl undecanoate",
                "pentadecan-1-ol",
                "tetradecyl tetradecanoate",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": "[\n  \"ethanol (CH3CH2OH)\",\n  \"glycerol (CH2OHCHOHCH2OH)\",\n  \"isopropanol (CH3CHOHCH3)\",\n  \"propylene glycol (CH3CHOHCH2OH)\",\n  \"butanol (CH3CH2CH2OH)\",\n  \"tert-butanol (CH3)3COH\",\n  \"pentanol (CH3CH2CH2CH2OH)\",\n  \"hexanol (CH3CH2CH2CH2CH2OH)\",\n  \"heptanol (CH3CH2CH2CH2CH2CH2OH)\",\n  \"octanol (CH3CH2CH2CH2CH2CH2CH2OH)\",\n  \"nonanol (CH3CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"decanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"undecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"dodecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"tridecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"tetradecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"pentadecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"hexadecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"heptadecanol (CH3CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2CH2OH)\",\n  \"octadecanol (CH3CH2CH2CH2",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (MeOH)",
            "Ethanol (EtOH)",
            "1-Propanol",
            "1-Butanol",
            "1-Pentanol",
            "1-Hexanol",
            "1-Heptanol",
            "1-Octanol",
            "1-Nonanol",
            "1-Decanol",
            "Benzyl Alcohol",
            "Glycerol",
            "1,3-Propanediol",
            "Trimethylolmethane",
            "1,2-Ethanediol",
            "2-Methyl-1-Propanol",
            "3-Methyl-1-Butanol",
            "1,4-Butanediol",
            "1,5-Pentanediol",
            "Cyclohexanol",
            "1,2-Hydroxypropane",
            "1,3-Hydroxybutane",
            "1,2,3-Propanetriol",
            "1,4-Dihydroxybutane"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Methanol (MeOH)",
                "Ethanol (EtOH)",
                "1-Propanol",
                "1-Butanol",
                "1-Pentanol",
                "1-Hexanol",
                "1-Heptanol",
                "1-Octanol",
                "1-Nonanol",
                "1-Decanol",
                "Benzyl Alcohol",
                "Glycerol",
                "1,3-Propanediol",
                "Trimethylolmethane",
                "1,2-Ethanediol",
                "2-Methyl-1-Propanol",
                "3-Methyl-1-Butanol",
                "1,4-Butanediol",
                "1,5-Pentanediol",
                "Cyclohexanol",
                "1,2-Hydroxypropane",
                "1,3-Hydroxybutane",
                "1,2,3-Propanetriol",
                "1,4-Dihydroxybutane"
            ],
            "true_referents": [
                "(+)-albicanol",
                "(3,4-dimethoxyphenyl)methanol",
                "1,11-dodecanediol",
                "1,2-dodecanediol",
                "1,3-dihydroxybutan-2-one",
                "1,3-dodecanediol",
                "1,5-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2,3,4-Trimethyl-1-pentanol",
                "2,4-dihydroxybutanoic acid",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-Methyl-3-buten-1-ol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl decanoate",
                "2-methylene-1,4-butanediol",
                "2-methylpropane-1,2-diol",
                "3,4-dihydroxybutyric acid",
                "3-Cyclohexene-1-ethanol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3-methylbutyl 2-hydroxypropanoate",
                "3-methylbutyl octanoate",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "Pentane-1,5-diol",
                "Trimethylolpropane",
                "butyl butanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl (R)-3-hydroxybutanoate",
                "ethyl 2-hydroxypropanoate",
                "ethyl 3-hydroxybutyrate",
                "ethyl cyclohexanecarboxylate",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "glycerone derivative",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl ester",
                "methyl hexanoate",
                "octan-1-ol",
                "pentan-1-ol",
                "propyl decanoate",
                "triethylene glycol",
                "triethylene glycol monomethyl ether"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "1-Propanol (CH3CH2CH2OH)",
            "2-Propanol (Isopropanol, IPA)",
            "1-Butanol (n-Butanol)",
            "2-Butanol (sec-Butanol)",
            "2-Methyl-1-propanol (Isobutanol)",
            "tert-Butanol (2-Methyl-2-propanol)",
            "1-Pentanol (n-Pentanol)",
            "2-Pentanol",
            "3-Pentanol",
            "2-Methyl-1-butanol",
            "3-Methyl-1-butanol (Isopentanol)",
            "2-Methyl-2-butanol",
            "3-Methyl-2-butanol",
            "1-Hexanol",
            "2-Hexanol",
            "3-Hexanol",
            "2-Methyl-1-pentanol",
            "4-Methyl-2-pentanol",
            "1-Heptanol",
            "1-Octanol",
            "1-Nonanol",
            "1-Decanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "ethanols",
                "isobutanol",
                "pentan-1-ol"
            ],
            "mismatches": [
                "1-Propanol (CH3CH2CH2OH)",
                "2-Propanol (Isopropanol, IPA)",
                "1-Butanol (n-Butanol)",
                "2-Butanol (sec-Butanol)",
                "tert-Butanol (2-Methyl-2-propanol)",
                "2-Pentanol",
                "3-Pentanol",
                "2-Methyl-1-butanol",
                "3-Methyl-1-butanol (Isopentanol)",
                "2-Methyl-2-butanol",
                "3-Methyl-2-butanol",
                "1-Hexanol",
                "2-Hexanol",
                "3-Hexanol",
                "2-Methyl-1-pentanol",
                "4-Methyl-2-pentanol",
                "1-Heptanol",
                "1-Octanol",
                "1-Nonanol",
                "1-Decanol"
            ],
            "true_referents": [
                "(+)-albicanol",
                "(3,4-dimethoxyphenyl)methanol",
                "(R)-2-methylbutan-1-ol",
                "(S)-2-methylbutan-1-ol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutyl acetate",
                "2-methylbutyl butanoate",
                "2-methylbutyl decanoate",
                "2-methylpropane-1,2-diol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbutyl octanoate",
                "3-methylpentanol",
                "4-methylpentan-1-ol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl decanoate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isobutanol",
                "isobutyl acetate",
                "methanol",
                "methanol-d1",
                "methyl hexanoate",
                "n-butyl oleate",
                "octan-1-ol",
                "pentan-1-ol"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "1-Propanol (n-Propanol)",
            "2-Propanol (Isopropanol, IPA)",
            "1-Butanol (n-Butanol)",
            "2-Butanol (sec-Butanol)",
            "2-Methyl-1-propanol (Isobutanol)",
            "2-Methyl-2-propanol (tert-Butanol)",
            "1-Pentanol (n-Pentanol)",
            "2-Pentanol",
            "3-Pentanol",
            "2-Methyl-1-butanol (Isopentanol)",
            "3-Methyl-1-butanol (Isoamyl alcohol)",
            "2-Methyl-2-butanol",
            "3-Methyl-2-butanol",
            "2,2-Dimethyl-1-propanol (Neopentyl alcohol)",
            "1-Hexanol (n-Hexanol)",
            "2-Hexanol",
            "3-Hexanol",
            "2-Methyl-1-pentanol",
            "3-Methyl-1-pentanol",
            "4-Methyl-1-pentanol",
            "2-Methyl-2-pentanol",
            "3-Methyl-2-pentanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "isobutanol",
                "pentan-1-ol"
            ],
            "mismatches": [
                "ethanol",
                "1-propanol",
                "2-propanol",
                "1-butanol",
                "2-butanol",
                "2-methyl-2-propanol",
                "2-pentanol",
                "3-pentanol",
                "2-methyl-1-butanol",
                "3-methyl-1-butanol",
                "2-methyl-2-butanol",
                "3-methyl-2-butanol",
                "2,2-dimethyl-1-propanol",
                "1-hexanol",
                "2-hexanol",
                "3-hexanol",
                "2-methyl-1-pentanol",
                "3-methyl-1-pentanol",
                "4-methyl-1-pentanol",
                "2-methyl-2-pentanol",
                "3-methyl-2-pentanol"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(S)-2-methylbutan-1-ol",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "2-methylbutan-1-ol",
                "2-methylbutyl acetate",
                "2-methylbutyl butanoate",
                "2-methylbutyl decanoate",
                "2-methylpropane-1,2-diol",
                "3,4-dimethylbenzyl alcohol",
                "3-ethoxy-1-propanol",
                "3-methoxy-1-butanol",
                "3-methylbenzyl alcohol",
                "3-methylbutyl octanoate",
                "3-methylpentanol",
                "4-methylpentan-1-ol",
                "N-(hexanoyl)ethanolamine",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl hexanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isobutanol",
                "isobutyl acetate",
                "methanol",
                "methanol-d1",
                "n-butyl oleate",
                "pentan-1-ol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (CH3CH2OH)",
            "Isopropanol (CH3CHOHCH3)",
            "tert-Butanol ((CH3)3COH)",
            "Cyclohexanol (C6H11OH)",
            "Phenol (C6H5OH)",
            "Benzyl alcohol (C6H5CH2OH)",
            "Glycerol (C3H8O3)",
            "Ethylene glycol (C2H6O2)",
            "Propylene glycol (C3H8O2)",
            "Butanol (C4H9OH)",
            "Pentanol (C5H11OH)",
            "Hexanol (C6H13OH)",
            "Heptanol (C7H15OH)",
            "Octanol (C8H17OH)",
            "Nonanol (C9H19OH)",
            "Decanol (C10H21OH)",
            "Undecanol (C11H23OH)",
            "Dodecanol (C12H25OH)",
            "Tridecanol (C13H27OH)",
            "Tetradecanol (C14H29OH)",
            "Pentadecanol (C15H31OH)",
            "Hexadecanol (C16H33OH)",
            "Cholesterol (C27H46O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Methanol (CH3OH)",
                "Undecanol (C11H23OH)",
                "Dodecanol (C12H25OH)",
                "Pentadecanol (C15H31OH)"
            ],
            "mismatches": [
                "Ethanol (CH3CH2OH)",
                "Isopropanol (CH3CHOHCH3)",
                "tert-Butanol ((CH3)3COH)",
                "Cyclohexanol (C6H11OH)",
                "Phenol (C6H5OH)",
                "Benzyl alcohol (C6H5CH2OH)",
                "Glycerol (C3H8O3)",
                "Ethylene glycol (C2H6O2)",
                "Propylene glycol (C3H8O2)",
                "Butanol (C4H9OH)",
                "Pentanol (C5H11OH)",
                "Hexanol (C6H13OH)",
                "Heptanol (C7H15OH)",
                "Octanol (C8H17OH)",
                "Nonanol (C9H19OH)",
                "Decanol (C10H21OH)",
                "Tridecanol (C13H27OH)",
                "Tetradecanol (C14H29OH)",
                "Hexadecanol (C16H33OH)",
                "Cholesterol (C27H46O)"
            ],
            "true_referents": [
                "(2-methyl-4,5-ditridecyl-1,4-cyclohexadienyl)methanol",
                "(3,4-dimethoxyphenyl)methanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "1,5-dodecanediol",
                "1,7-decanediol",
                "1-O-dodecylglycerol",
                "1-octadecylglycerone 3-phosphate",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methylpropane-1,2-diol",
                "3-Cyclohexene-1-ethanol",
                "3-methylbenzyl alcohol",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "4alpha-hydroxymethyl-5alpha-cholest-7-en-3beta-ol",
                "4beta-(hydroxymethyl)-4alpha-methyl-5alpha-cholest-7-en-3beta-ol",
                "6-oxo-nonan-1-ol",
                "Pentane-1,5-diol",
                "Trimethylolpropane",
                "butyl butanoate",
                "dodecan-1-ol",
                "dodecyl dodecanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl (R)-3-hydroxybutanoate",
                "ethyl 3-hydroxytridecanoate",
                "ethyl 3-oxohexanoate",
                "ethyl decanoate",
                "ethyl glyoxylate",
                "ethyl heptanoate",
                "ethyl hexadecanoate",
                "ethyl hexanoate",
                "ethyl hydroxy(phenyl)acetate",
                "ethyl nonanoate",
                "ethyl octanoate",
                "glycerone derivative",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "methanol",
                "methanol-d1",
                "methyl 4,9-dimethyldecanoate",
                "methyl undecanoate",
                "pentadecan-1-ol",
                "propenol",
                "propyl acetate",
                "tetradecyl tetradecanoate",
                "triethylene glycol",
                "undecan-1-ol",
                "undecane-1,11-diol"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Methanol (CH3OH)",
            "Ethanol (C2H5OH)",
            "Propanol (C3H7OH)",
            "Butanol (C4H9OH)",
            "Pentanol (C5H11OH)",
            "Hexanol (C6H13OH)",
            "Heptanol (C7H15OH)",
            "Octanol (C8H17OH)",
            "Ethylene glycol (C2H6O2)",
            "Glycerol (C3H8O3)",
            "Erythritol (C4H10O4)",
            "Xylitol (C5H12O5)",
            "Mannitol (C6H14O6)",
            "Sorbitol (C6H14O6)",
            "Dulcitol (C6H14O6)",
            "Inositol (C6H12O6)",
            "Ribitol (C5H12O5)",
            "Arabitol (C5H12O5)",
            "Galactitol (C6H14O6)",
            "Allyl alcohol (C3H6O)",
            "Benzyl alcohol (C7H8O)",
            "Phenol (C6H5OH)",
            "Salicyl alcohol (C6H4(OH)CH2OH)",
            "Cholesterol (C27H46O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "methanol",
                "allyl alcohol",
                "salicyl alcohol"
            ],
            "mismatches": [
                "ethanol",
                "propanol",
                "butanol",
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "ethylene glycol",
                "glycerol",
                "erythritol",
                "xylitol",
                "mannitol",
                "sorbitol",
                "dulcitol",
                "inositol",
                "ribitol",
                "arabitol",
                "galactitol",
                "benzyl alcohol",
                "phenol",
                "cholesterol"
            ],
            "true_referents": [
                "(24R)-24-[(alpha-L-ascarosyl)oxy]-N-(2-hydroxyethyl)-2-methyl-3-oxopentacosanamide",
                "(3,4-dimethoxyphenyl)methanol",
                "(3S,4R)-Ketose 1-phosphate",
                "1-O-dodecylglycerol",
                "1-octadecylglycerone 3-phosphate",
                "16-(beta-D-glucopyranosyloxy)hexadecanoic acid",
                "18-hydroxylinoleic acid",
                "2,3,4-Trimethyl-1-pentanol",
                "2-(3,4-dihydroxyphenyl)-ethyl-O-beta-D-glucopyranoside",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-hydroxyethyl salicylate",
                "2-isopropyl-5-methyl-1-heptanol",
                "2-methyl-2-hydroxy-1-propanol",
                "3-ethoxy-1-propanol",
                "3-methylbenzyl alcohol",
                "3-methylbutyl 2-hydroxypropanoate",
                "4-amino-4-deoxy-alpha-L-arabinopyranosyl undecaprenyl phosphate",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "4alpha-hydroxymethyl-5alpha-cholest-7-en-3beta-ol",
                "4alpha-phorbol 12,13-didecanoate",
                "4beta-(hydroxymethyl)-4alpha-methyl-5alpha-cholest-7-en-3beta-ol",
                "5-(2-methoxy-2-oxoethyl)uridine 5'-monophosphate",
                "D-erythrulose",
                "L-erythrulose",
                "N-icosanoyl-sn-glycero-3-phosphoethanolamine",
                "Pentane-1,5-diol",
                "allyl alcohol",
                "butyl butanoate",
                "diethyl (2R,3R)-2-hydroxy-3-methylsuccinate",
                "diethyl 2-methyl-3-hydroxysuccinate",
                "erythrulose",
                "ethanol-d6",
                "ethanols",
                "ethyl (11Z)-docosenoate",
                "ethyl glyoxylate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl hydroxy(phenyl)acetate",
                "ethyl octanoate",
                "glycerone derivative",
                "hexane-1,6-diol",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl octanoate",
                "hexyl propanoate",
                "methanol",
                "methanol-d1",
                "methyl 13-sophorosyloxydocosanoate",
                "methyl 9-(alpha-D-galactosyloxy)nonanoate",
                "methyl uridin-5-yloxyacetate",
                "primary allylic alcohol",
                "propenol",
                "salicyl alcohol",
                "triethylene glycol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Allopregnanolone (ALLO)",
            "Altrindole",
            "Arachidonic acid",
            "Betamethasone",
            "Biotin",
            "Cortisol",
            "Cortisone",
            "Dexamethasone",
            "Digoxin",
            "Estradiol",
            "Estrone",
            "Fluocinolone",
            "Fluorometholone",
            "Hydrocortisone",
            "Hydroxyapatite",
            "Hydroxychloroquine",
            "Hydroxyprogesterone",
            "Hydroxyurea",
            "Lansoprazole",
            "Methylprednisolone",
            "Mifepristone",
            "Prednisolone",
            "Prednisone",
            "Progesterone",
            "Rifampicin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Betamethasone",
                "Cortisol",
                "Cortisone",
                "Hydroxychloroquine",
                "Prednisolone",
                "Prednisone"
            ],
            "mismatches": [
                "Allopregnanolone (ALLO)",
                "Altrindole",
                "Arachidonic acid",
                "Biotin",
                "Dexamethasone",
                "Digoxin",
                "Estradiol",
                "Estrone",
                "Fluocinolone",
                "Fluorometholone",
                "Hydrocortisone",
                "Hydroxyapatite",
                "Hydroxyprogesterone",
                "Hydroxyurea",
                "Lansoprazole",
                "Methylprednisolone",
                "Mifepristone",
                "Progesterone",
                "Rifampicin"
            ],
            "true_referents": [
                "(+)-lariciresinol",
                "(R)-lavandulol",
                "(R)-oxamniquine",
                "(S)-monastrol",
                "(S)-oxamniquine",
                "11beta,17alpha,21-trihydroxypregnenolone",
                "17alpha,21-dihydroxypregnenolone",
                "21-hydroxypregnenolone",
                "3-hydroxypyruvic acid",
                "3beta-hydroxy-4alpha-hydroxymethyl-4beta-methylsteroid",
                "3beta-hydroxy-4beta-hydroxymethyl-4alpha-methylsteroid",
                "4-hydroxymethylsteroid",
                "5-hydroxymethyluracil",
                "6-methylprednisolone",
                "amlodipine",
                "betamethasone",
                "betamethasone acetate",
                "clocortolone",
                "corticosterone",
                "cortisol",
                "cortisol 21-acetate",
                "cortisone",
                "eplerenone",
                "ethyl arachidonate",
                "flumethasone",
                "flumethasone pivalate",
                "fluocinolone acetonide",
                "fluthiacet-methyl",
                "hydroxyacetone",
                "hydroxyacetone phosphate",
                "hydroxychloroquine",
                "hydroxypyruvaldehyde",
                "levesquamide",
                "methyl arachidonate",
                "methylprednisolone acetate",
                "metronidazole",
                "monapinone E",
                "prednisolone",
                "prednisone",
                "retinol",
                "retinyl acetate",
                "retinyl palmitate",
                "spirapril",
                "tetrahydrocortisol",
                "triamcinolone",
                "vindoline"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            "Ethanol (EtOH)",
            "Isopropyl alcohol",
            "Glycerol",
            "1-Propanol",
            "2-Propanol",
            "Cyclohexanol",
            "Methanol (MeOH)",
            "1-Butanol",
            "2-Butanol",
            "tert-Butyl alcohol",
            "1-Pentanol",
            "2-Pentanol",
            "3-Pentanol",
            "Neopentyl alcohol",
            "1-Hexanol",
            "2-Hexanol",
            "1-Heptanol",
            "2-Heptanol",
            "1-Octanol",
            "2-Octanol",
            "Benzyl alcohol",
            "Furfuryl alcohol",
            "Lactic acid",
            "Menthol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Furfuryl alcohol"
            ],
            "mismatches": [
                "Ethanol (EtOH)",
                "Isopropyl alcohol",
                "Glycerol",
                "1-Propanol",
                "2-Propanol",
                "Cyclohexanol",
                "Methanol (MeOH)",
                "1-Butanol",
                "2-Butanol",
                "tert-Butyl alcohol",
                "1-Pentanol",
                "2-Pentanol",
                "3-Pentanol",
                "Neopentyl alcohol",
                "1-Hexanol",
                "2-Hexanol",
                "1-Heptanol",
                "2-Heptanol",
                "1-Octanol",
                "2-Octanol",
                "Benzyl alcohol",
                "Lactic acid",
                "Menthol"
            ],
            "true_referents": [
                "(3,4-dimethoxyphenyl)methanol",
                "(3R,3aS,6aR)-hexahydrofuro[2,3-b]furan-3-yl glycolate",
                "1-neopentylpyrraline",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "2-butyl-1-octanol",
                "2-methyl-2-hydroxy-1-propanol",
                "3-Cyclohexene-1-ethanol",
                "3-methylbenzyl alcohol",
                "3-methylpentanol",
                "4-carboxybenzyl alcohol",
                "4-ethylbenzyl alcohol",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "ethanol-d6",
                "ethanols",
                "ethyl (2R)-lactate",
                "ethyl (2S)-lactate",
                "ethyl cyclohexanecarboxylate",
                "ethyl heptanoate",
                "ethyl hexanoate",
                "ethyl isobutyrate",
                "ethyl octanoate",
                "furfuryl alcohol",
                "geraniol",
                "glycerone derivative",
                "hexyl heptanoate",
                "hexyl hexanoate",
                "hexyl propanoate",
                "isopentenyl alcohol",
                "methanol",
                "methanol-d1",
                "methyl ester",
                "methyl hexanoate",
                "octan-1-ol",
                "pentan-1-ol",
                "pentyl propanoate",
                "propyl decanoate",
                "terpenol",
                "terpineol",
                "tetrahydrofurfuryl alcohol",
                "triethylene glycol"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "primary alcohol",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "ethanol",
                "Canonical name": "ethanol"
            },
            {
                "Referent": "propanol",
                "Canonical name": "propanol"
            },
            {
                "Referent": "butanol",
                "Canonical name": "butanol"
            },
            {
                "Referent": "pentanol",
                "Canonical name": "pentanol"
            },
            {
                "Referent": "hexanol",
                "Canonical name": "hexanol"
            },
            {
                "Referent": "heptanol",
                "Canonical name": "heptanol"
            },
            {
                "Referent": "octanol",
                "Canonical name": "octanol"
            },
            {
                "Referent": "nonanol",
                "Canonical name": "nonanol"
            },
            {
                "Referent": "decanol",
                "Canonical name": "decanol"
            },
            {
                "Referent": "undecanol",
                "Canonical name": "undecanol"
            },
            {
                "Referent": "dodecanol",
                "Canonical name": "dodecanol"
            },
            {
                "Referent": "tridecanol",
                "Canonical name": "tridecanol"
            },
            {
                "Referent": "tetradecanol",
                "Canonical name": "tetradecanol"
            },
            {
                "Referent": "pentadecanol",
                "Canonical name": "pentadecanol"
            },
            {
                "Referent": "hexadecanol",
                "Canonical name": "hexadecanol"
            },
            {
                "Referent": "heptadecanol",
                "Canonical name": "heptadecanol"
            },
            {
                "Referent": "octadecanol",
                "Canonical name": "octadecanol"
            },
            {
                "Referent": "nonadecanol",
                "Canonical name": "nonadecanol"
            },
            {
                "Referent": "eicosanol",
                "Canonical name": "eicosanol"
            },
            {
                "Referent": "docosanol",
                "Canonical name": "docosanol"
            },
            {
                "Referent": "tetracosanol",
                "Canonical name": "tetracosanol"
            },
            {
                "Referent": "pentacosanol",
                "Canonical name": "pentacosanol"
            },
            {
                "Referent": "hexacosanol",
                "Canonical name": "hexacosanol"
            },
            {
                "Referent": "heptacosanol",
                "Canonical name": "heptacosanol"
            },
            {
                "Referent": "octacosanol",
                "Canonical name": "octacosanol"
            },
            {
                "Referent": "nonacosanol",
                "Canonical name": "nonacosanol"
            },
            {
                "Referent": "triacontanol",
                "Canonical name": "triacontanol"
            },
            {
                "Referent": "tetracontanol",
                "Canonical name": "tetracontanol"
            },
            {
                "Referent": "pentacontanol",
                "Canonical name": "pentacontanol"
            },
            {
                "Referent": "hexacontanol",
                "Canonical name": "hexacontanol"
            },
            {
                "Referent": "heptacontanol",
                "Canonical name": "heptacontanol"
            },
            {
                "Referent": "octacontanol",
                "Canonical name": "octacontanol"
            },
            {
                "Referent": "nonacontanol",
                "Canonical name": "nonacontanol"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ethanol"
            ],
            "mismatches": [
                "propanol",
                "butanol",
                "pentanol",
                "hexanol",
                "heptanol",
                "octanol",
                "nonanol",
                "decanol",
                "undecanol",
                "dodecanol",
                "tridecanol",
                "tetradecanol",
                "pentadecanol",
                "hexadecanol",
                "heptadecanol",
                "octadecanol",
                "nonadecanol",
                "eicosanol",
                "docosanol",
                "tetracosanol",
                "pentacosanol",
                "hexacosanol",
                "heptacosanol",
                "octacosanol",
                "nonacosanol",
                "triacontanol",
                "tetracontanol",
                "pentacontanol",
                "hexacontanol",
                "heptacontanol",
                "octacontanol",
                "nonacontanol"
            ],
            "true_referents": [
                "(+)-albicanol",
                "(3R)-3,10-dihydroxydecanoic acid",
                "(9Z,12Z)-octadecadien-1-ol",
                "13-Docosenoic acid, methyl ester",
                "16-(beta-D-glucopyranosyloxy)hexadecanoic acid",
                "2,3,4-Trimethyl-1-pentanol",
                "2-Ethyl-4-methyl-1-pentanol",
                "6-oxo-nonan-1-ol",
                "7-Hexadecenoic acid, methyl ester",
                "9R-hydroxy-10E,12E-octadecadienoic acid, methyl ester",
                "Octadecadienoic acid, methyl ester",
                "Pentane-1,5-diol",
                "butyl butanoate",
                "ethanol",
                "ethanol-d6",
                "ethyl (4Z,7Z,10Z,13Z,16Z)-docosapentaenoate",
                "ethyl (4Z,7Z,10Z,13Z,16Z,19Z)-docosahexaenoate",
                "ethyl hexadecanoate",
                "ethyl nonanoate",
                "ethyl octadecanoate",
                "hexane-1,6-diol",
                "hexyl 2-methylbutanoate",
                "methanol",
                "methyl 4,10-dimethyldodecanoate",
                "methyl 4,9-dimethyldecanoate",
                "methyl arachidonate",
                "methyl hexanoate",
                "methyl nonadecanoate",
                "octan-1-ol",
                "propyl decanoate"
            ],
            "TP": 1,
            "FP": 32,
            "FN": 0
        }
    }
]