[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (IPA)",
            "2-Methyl-2-propanol (t-Amyl alcohol)",
            "2-Ethyl-1-hexanol",
            "2-Butanol",
            "3-Pentanol",
            "2-Methyl-1-propanol",
            "2-Methyl-2-butanol",
            "2-Methyl-1-butanol",
            "2,2-Dimethyl-1-propanol",
            "2-Phenylethanol",
            "2-Methyl-2-pentanol",
            "2,3-Dimethyl-2-butanol",
            "2-Methyl-3-butanol",
            "2-Heptanol",
            "2-Octanol",
            "2,2-Dimethyl-1-butanol",
            "2-Methyl-1-pentanol",
            "2,3-Dimethyl-1-butanol",
            "2-Ethyl-2-butanol",
            "2,2-Dimethyl-3-butanol",
            "2,2,3-Trimethyl-1-propanol",
            "2,2,4-Trimethyl-1-pentanol",
            "2,3,3-Trimethyl-1-butanol",
            "2,2,4-Trimethyl-2-pentanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "2-Propanol (IPA)",
                "2-Methyl-2-propanol (t-Amyl alcohol)",
                "2-Ethyl-1-hexanol",
                "2-Butanol",
                "3-Pentanol",
                "2-Methyl-1-propanol",
                "2-Methyl-2-butanol",
                "2-Methyl-1-butanol",
                "2,2-Dimethyl-1-propanol",
                "2-Phenylethanol",
                "2-Methyl-2-pentanol",
                "2,3-Dimethyl-2-butanol",
                "2-Methyl-3-butanol",
                "2-Heptanol",
                "2-Octanol",
                "2,2-Dimethyl-1-butanol",
                "2-Methyl-1-pentanol",
                "2,3-Dimethyl-1-butanol",
                "2-Ethyl-2-butanol",
                "2,2-Dimethyl-3-butanol",
                "2,2,3-Trimethyl-1-propanol",
                "2,2,4-Trimethyl-1-pentanol",
                "2,3,3-Trimethyl-1-butanol",
                "2,2,4-Trimethyl-2-pentanol"
            ],
            "true_referents": [
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "(S,S)-butane-2,3-diol",
                "1-(3,4-dimethoxyphenyl)ethane-1,2-diol",
                "1-bromo-2-propanol",
                "1-tert-Butoxy-2-propanol",
                "2,2,4-trimethyl-1,3-Pentanediol",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-methyl-5-nonanol",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "Isopropyl propionate",
                "butan-2-ol",
                "butane-2,3-diol",
                "heptan-2-ol",
                "meso-butane-2,3-diol",
                "octan-2-ol",
                "pentan-2-ol",
                "pentan-3-ol"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Butanol (C4H10O)",
            "2-Pentanol (C5H12O)",
            "2-Hexanol (C6H14O)",
            "2-Heptanol (C7H16O)",
            "2-Octanol (C8H18O)",
            "2-Nonanol (C9H20O)",
            "2-Decanol (C10H22O)",
            "2-Methyl-1-propanol (Isoamyl alcohol, C4H10O)",
            "2-Methyl-2-propanol (Tert-Butyl alcohol, C4H10O)",
            "2-Methyl-2-butanol (C5H12O)",
            "2-Ethyl-1-hexanol (C8H18O)",
            "3-Pentanol (C5H12O)",
            "3-Hexanol (C6H14O)",
            "3-Heptanol (C7H16O)",
            "3-Octanol (C8H18O)",
            "3-Nonanol (C9H20O)",
            "3-Decanol (C10H22O)",
            "2,3-Butanediol (C4H10O2)",
            "2,3-Pentanediol (C5H12O2)",
            "2,3-Hexanediol (C6H14O2)",
            "2,3-Heptanediol (C7H16O2)",
            "2,3-Octanediol (C8H18O2)",
            "2,4-Pentanediol (C5H12O2)",
            "2,5-Hexanediol (C6H14O2)",
            "3,4-Hexanediol (C6H14O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Heptanol (C7H16O)",
                "2-Octanol (C8H18O)",
                "3-Pentanol (C5H12O)",
                "3-Heptanol (C7H16O)",
                "3-Octanol (C8H18O)",
                "2,3-Butanediol (C4H10O2)",
                "2,5-Hexanediol (C6H14O2)"
            ],
            "mismatches": [
                "2-Butanol (C4H10O)",
                "2-Pentanol (C5H12O)",
                "2-Hexanol (C6H14O)",
                "2-Nonanol (C9H20O)",
                "2-Decanol (C10H22O)",
                "2-Methyl-1-propanol (Isoamyl alcohol, C4H10O)",
                "2-Methyl-2-propanol (Tert-Butyl alcohol, C4H10O)",
                "2-Methyl-2-butanol (C5H12O)",
                "2-Ethyl-1-hexanol (C8H18O)",
                "3-Hexanol (C6H14O)",
                "3-Nonanol (C9H20O)",
                "3-Decanol (C10H22O)",
                "2,3-Pentanediol (C5H12O2)",
                "2,3-Hexanediol (C6H14O2)",
                "2,3-Heptanediol (C7H16O2)",
                "2,3-Octanediol (C8H18O2)",
                "2,4-Pentanediol (C5H12O2)",
                "3,4-Hexanediol (C6H14O2)"
            ],
            "true_referents": [
                "(2R)-octan-2-ol",
                "(2R,5R)-hexanediol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "(2S,5S)-hexanediol",
                "(3R,18R)-3,18-dihydroxynonadecanoic acid",
                "(R,R)-butane-2,3-diol",
                "(S,S)-butane-2,3-diol",
                "1,2-dodecanediol",
                "1,5-dodecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,9-decanediol",
                "1-tert-Butoxy-2-propanol",
                "2,2,4-trimethyl-1,3-Pentanediol",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-methyl-5-nonanol",
                "3-Hydroxy-2-pentanone",
                "3-Methylhexan-2-ol",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "butane-2,3-diol",
                "decan-2-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "hexan-3-ol",
                "hexane-2,5-diol",
                "isopropyl 3-hydroxybut-2-enoate",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "pentan-2-ol",
                "pentan-3-ol"
            ],
            "TP": 7,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (Isopropyl alcohol)",
            "2-Butanol",
            "2-Pentanol",
            "2-Hexanol",
            "2-Heptanol",
            "2-Octanol",
            "2-Nonanol",
            "2-Decanol",
            "3-Pentanol",
            "3-Hexanol",
            "3-Heptanol",
            "3-Octanol",
            "3-Nonanol",
            "3-Decanol",
            "4-Heptanol",
            "4-Octanol",
            "4-Nonanol",
            "5-Decanol",
            "Cyclohexanol",
            "Menthol",
            "Cholesterol",
            "Testosterone",
            "Estriol",
            "Progesterone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Butanol",
                "2-Pentanol",
                "2-Heptanol",
                "2-Octanol",
                "3-Pentanol",
                "3-Hexanol",
                "4-Heptanol",
                "Cyclohexanol",
                "Cholesterol"
            ],
            "mismatches": [
                "2-Propanol (Isopropyl alcohol)",
                "2-Hexanol",
                "2-Nonanol",
                "2-Decanol",
                "3-Heptanol",
                "3-Octanol",
                "3-Nonanol",
                "3-Decanol",
                "4-Octanol",
                "4-Nonanol",
                "5-Decanol",
                "Menthol",
                "Testosterone",
                "Estriol",
                "Progesterone"
            ],
            "true_referents": [
                "(+)-menthol",
                "(-)-menthol",
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-methyl-5-nonanol",
                "21-hydroxypregnenolone",
                "2beta-hydroxytestosterone",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "5-Methylhexan-3-ol",
                "6alpha-hydroxyestrone",
                "Isopropyl propionate",
                "androsterone",
                "butan-2-ol",
                "castasterone",
                "cholesterol",
                "cholesterol-2,2,3,4,4,6-d6",
                "cyclohexanol",
                "decan-2-ol",
                "decan-3-ol",
                "decan-5-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "heptan-4-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "isopropyl ester",
                "isopropyl salicylate",
                "lanosterol",
                "nonadecan-4-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "octan-4-ol",
                "pentadecan-2-ol",
                "pentadecan-4-ol",
                "pentan-2-ol",
                "pentan-3-ol",
                "pregnenolone"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (IPA)",
            "Cyclohexanol",
            "1-Phenylethanol",
            "3-Methyl-3-pentanol",
            "2-Methyl-2-butanol (tert-amyl alcohol)",
            "1-Propanol-2-ol",
            "4-Hydroxy-4-methyl-2-pentanone",
            "Benzyl alcohol (\u03b1-phenylmethanol)",
            "1-Cyclopropylethanol",
            "2-Ethyl-1-hexanol",
            "3-Carene-4-ol",
            "Menthol",
            "Isopinocampheol",
            "Bornyl alcohol",
            "Geraniol",
            "Nerol",
            "Citronellol",
            "\u03b1-Terpineol",
            "Linalool",
            "2-Methylcyclohexanol",
            "3-Hydroxy-3-methylbutan-2-one (Acetoin reduction product)",
            "1-(4-Chlorophenyl)ethanol",
            "1,2-Propanediol (after partial oxidation)",
            "Glycerol (after selective oxidation)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclohexanol",
                "3-Hydroxy-3-methylbutan-2-one"
            ],
            "mismatches": [
                "2-Propanol (IPA)",
                "1-Phenylethanol",
                "3-Methyl-3-pentanol",
                "2-Methyl-2-butanol (tert-amyl alcohol)",
                "1-Propanol-2-ol",
                "4-Hydroxy-4-methyl-2-pentanone",
                "Benzyl alcohol (\u03b1-phenylmethanol)",
                "1-Cyclopropylethanol",
                "2-Ethyl-1-hexanol",
                "3-Carene-4-ol",
                "Menthol",
                "Isopinocampheol",
                "Bornyl alcohol",
                "Geraniol",
                "Nerol",
                "Citronellol",
                "\u03b1-Terpineol",
                "Linalool",
                "2-Methylcyclohexanol",
                "1-(4-Chlorophenyl)ethanol",
                "1,2-Propanediol (after partial oxidation)",
                "Glycerol (after selective oxidation)"
            ],
            "true_referents": [
                "(+)-isodihydrocarveol",
                "(+)-menthol",
                "(-)-isodihydrocarveol",
                "(-)-menthol",
                "(1E)-1-(4-chlorophenyl)-4,4-dimethyl-2-(1H-1,2,4-triazol-1-yl)pent-1-en-3-ol",
                "(2R)-butan-2-ol",
                "(2R*,3R*)-1,2,3-Butanetriol",
                "(2S)-2-heptanol",
                "(4R)-4-hydroxypentanoic acid",
                "(9R)-9-hydroxydecanoic acid",
                "1,3-dichloropropan-2-ol",
                "1,3-dihydroxybutan-2-one",
                "1,6-Heptadien-4-ol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-(3,4-dimethoxyphenyl)ethane-1,2-diol",
                "1-(4-chlorophenyl)-2-[4-(4-fluorobenzyl)piperidin-1-yl]ethanol",
                "1-chloropropan-2-ol",
                "1-cyclopentylethanol",
                "1-tert-Butoxy-2-propanol",
                "2,2,4-trimethyl-1,3-Pentanediol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-hydroxy-pentan-3-one",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Hydroxy-3-methylbutan-2-one",
                "3-Methylhexan-2-ol",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "4-Methyl-4E-hepten-3-ol",
                "Isopropyl propionate",
                "Linalool oxide (trans-pyranoid)",
                "Linalool oxide III",
                "Nilvadipine",
                "butane-2,3-diol",
                "campesterol",
                "colterol",
                "cyclohexanol",
                "diphenylmethanol",
                "dodecan-4-ol",
                "ethyl 3-hydroxybutyrate",
                "ethyl hydroxy(phenyl)acetate",
                "hexane-2,5-diol",
                "isopropyl salicylate",
                "linalool oxide pyranoside",
                "odoratol",
                "pentan-3-ol",
                "pinocarveol",
                "propan-2-ol",
                "pyriculol",
                "terpentecin"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "Isopropanol (IPA)",
            "2-Butanol",
            "2-Pentanol",
            "2-Hexanol",
            "2-Heptanol",
            "2-Octanol",
            "2-Nonanol",
            "2-Decanol",
            "Cyclohexanol",
            "2-Methyl-2-butanol",
            "3-Pentanol",
            "3-Hexanol",
            "3-Heptanol",
            "3-Octanol",
            "3-Nonanol",
            "3-Decanol",
            "4-Methyl-2-pentanol",
            "4-Heptanol",
            "4-Octanol",
            "4-Nonanol",
            "4-Decanol",
            "2,3-Butanediol",
            "2-Methyl-1-butanol",
            "3-Methyl-2-butanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Butanol",
                "2-Pentanol",
                "2-Hexanol",
                "2-Heptanol",
                "2-Octanol",
                "Cyclohexanol",
                "3-Hexanol",
                "3-Methyl-2-butanol"
            ],
            "mismatches": [
                "Isopropanol (IPA)",
                "2-Nonanol",
                "2-Decanol",
                "2-Methyl-2-butanol",
                "3-Pentanol",
                "3-Heptanol",
                "3-Octanol",
                "3-Nonanol",
                "3-Decanol",
                "4-Methyl-2-pentanol",
                "4-Heptanol",
                "4-Octanol",
                "4-Nonanol",
                "4-Decanol",
                "2,3-Butanediol",
                "2-Methyl-1-butanol"
            ],
            "true_referents": [
                "(+/-)-4-Mercapto-4-methyl-2-pentanol",
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "(S,S)-butane-2,3-diol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-tert-Butoxy-2-propanol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-Methyloctan-4R-ol",
                "2-methyl-5-nonanol",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "5-Methylhexan-3-ol",
                "butan-2-ol",
                "butane-2,3-diol",
                "cyclohexanol",
                "decan-2-ol",
                "decan-3-ol",
                "decan-4-ol",
                "dodecan-4-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "heptan-4-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "isopropyl ester",
                "isopropyl palmitate",
                "meso-butane-2,3-diol",
                "nonadecan-4-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "octan-4-ol",
                "pentadecan-2-ol",
                "pentadecan-4-ol",
                "pentan-2-ol",
                "pentan-3-ol"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (IPA)",
            "2-Butanol (S-2-Butanol)",
            "3-Pentanol (3-Pentanol)",
            "2-Pentanol (2-Pentanol)",
            "3-Hexanol (3-Hexanol)",
            "2-Hexanol (2-Hexanol)",
            "3-Heptanol (3-Heptanol)",
            "2-Heptanol (2-Heptanol)",
            "3-Octanol (3-Octanol)",
            "2-Octanol (2-Octanol)",
            "2-Nonanol (2-Nonanol)",
            "3-Nonanol (3-Nonanol)",
            "2-Decanol (2-Decanol)",
            "3-Decanol (3-Decanol)",
            "2-Undecanol (2-Undecanol)",
            "3-Undecanol (3-Undecanol)",
            "2-Dodecanol (2-Dodecanol)",
            "3-Dodecanol (3-Dodecanol)",
            "2-Butyl-1-pentanol (2-Butyl-1-pentanol)",
            "2-Pentyl-1-butanol (2-Pentyl-1-butanol)",
            "2-Phenyl-1-propanol (2-Phenyl-1-propanol)",
            "3-Phenyl-1-propanol (3-Phenyl-1-propanol)",
            "2-Cyclopentanol (2-Cyclopentanol)",
            "2-Cyclohexanol (2-Cyclohexanol)",
            "2-Methyl-2-butanol (Tert-amyl alcohol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(2S)-butan-2-ol",
                "3-methyl-2-pentanol",
                "3-methyl-2-butanol",
                "hexan-3-ol",
                "hexan-2-ol",
                "heptan-3-ol",
                "heptan-2-ol",
                "octan-3-ol",
                "octan-2-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "decan-2-ol",
                "decan-3-ol",
                "undecan-2-ol",
                "undecan-3-ol",
                "dodecan-2-ol",
                "dodecan-3-ol"
            ],
            "mismatches": [
                "2-Propanol (IPA)",
                "2-Butyl-1-pentanol (2-Butyl-1-pentanol)",
                "2-Pentyl-1-butanol (2-Pentyl-1-butanol)",
                "2-Phenyl-1-propanol (2-Phenyl-1-propanol)",
                "3-Phenyl-1-propanol (3-Phenyl-1-propanol)",
                "2-Cyclopentanol (2-Cyclopentanol)",
                "2-Cyclohexanol (2-Cyclohexanol)",
                "2-Methyl-2-butanol (Tert-amyl alcohol)"
            ],
            "true_referents": [
                "(1S,4E,8E,12E)-2,2,5,9,13-pentamethylcyclopentadeca-4,8,12-trien-1-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-butan-2-ol",
                "(2S)-octan-2-ol",
                "(S)-3-hydroxy-2-oxo-3-phenylpropanoic acid",
                "(S)-4,5-dihydroxy-2-oxopentanal",
                "(S,S)-butane-2,3-diol",
                "1,2-bis(4-hydroxyphenyl)-2-propanol",
                "1,2-dodecanediol",
                "1,3-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-bromo-2-propanol",
                "1-cyclopentylethanol",
                "1-tert-Butoxy-2-propanol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-methyl-5-nonanol",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "5-Methylhexan-3-ol",
                "Isopropyl propionate",
                "cyclohexanol",
                "decan-2-ol",
                "decan-3-ol",
                "dodecan-2-ol",
                "dodecan-3-ol",
                "dodecan-5-ol",
                "dodecan-6-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "pentadecan-2-ol",
                "pentan-2-ol",
                "pentan-3-ol",
                "undecan-2-ol",
                "undecan-3-ol",
                "undecan-5-ol",
                "undecan-6-ol"
            ],
            "TP": 17,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "1-Propanol (PrOH)",
            "2-Propanol (Isopropanol)",
            "2-Butanol (sec-Butanol)",
            "2-Methyl-2-propanol (t-Butanol)",
            "2-Pentanol (sec-Pentanol)",
            "3-Pentanol (3-PentOH)",
            "2-Hexanol (sec-Hexanol)",
            "3-Hexanol (3-HexOH)",
            "2-Heptanol (sec-Heptanol)",
            "3-Heptanol (3-HeptOH)",
            "2-Octanol (sec-Octanol)",
            "3-Octanol (3-OctOH)",
            "2-Nonanol (sec-Nonanol)",
            "3-Nonanol (3-NonOH)",
            "2-Decanol (sec-Decanol)",
            "3-Decanol (3-DecOH)",
            "2-Undecanol (sec-Undecanol)",
            "3-Undecanol (3-UndecOH)",
            "2-Dodecanol (sec-Dodecanol)",
            "3-Dodecanol (3-DodecOH)",
            "2-Tridecanol (sec-Tridecanol)",
            "3-Tridecanol (3-TridecOH)",
            "2-Tetradecanol (sec-Tetradecanol)",
            "3-Tetradecanol (3-TetradecOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Propanol (Isopropanol)",
                "2-Butanol (sec-Butanol)",
                "2-Pentanol (sec-Pentanol)",
                "3-Pentanol (3-PentOH)",
                "2-Hexanol (sec-Hexanol)",
                "3-Hexanol (3-HexOH)",
                "2-Heptanol (sec-Heptanol)",
                "3-Heptanol (3-HeptOH)",
                "2-Octanol (sec-Octanol)",
                "3-Octanol (3-OctOH)",
                "2-Nonanol (sec-Nonanol)",
                "3-Nonanol (3-NonOH)",
                "2-Decanol (sec-Decanol)",
                "3-Decanol (3-DecOH)",
                "2-Undecanol (sec-Undecanol)",
                "3-Undecanol (3-UndecOH)",
                "2-Dodecanol (sec-Dodecanol)",
                "3-Dodecanol (3-DodecOH)"
            ],
            "mismatches": [
                "1-Propanol (PrOH)",
                "2-Methyl-2-propanol (t-Butanol)",
                "2-Tridecanol (sec-Tridecanol)",
                "3-Tridecanol (3-TridecOH)",
                "2-Tetradecanol (sec-Tetradecanol)",
                "3-Tetradecanol (3-TetradecOH)"
            ],
            "true_referents": [
                "(2R)-octan-2-ol",
                "(2R,5R)-hexanediol",
                "(2S)-2-heptanol",
                "(2S)-butan-2-ol",
                "(2S)-octan-2-ol",
                "(2S,5S)-hexanediol",
                "(3R,12R)-3,12-dihydroxytridecanoic acid",
                "(3R,9R)-3,9-dihydroxydecanoic acid",
                "1,2-dodecanediol",
                "1,3-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-Cyano-2-hydroxy-3-butene",
                "1-tert-Butoxy-2-propanol",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-methyl-5-nonanol",
                "3-Hydroxy-2-pentanone",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-hydroxyhexane-2,5-dione",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "Isopropyl propionate",
                "decan-2-ol",
                "decan-3-ol",
                "dodecan-2-ol",
                "dodecan-3-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "hexane-2,5-diol",
                "isopropyl ester",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "pentadecan-2-ol",
                "pentan-2-ol",
                "pentan-3-ol",
                "propan-2-ol",
                "sec-butyl butyrate",
                "tridecan-2-ol",
                "undecan-2-ol",
                "undecan-3-ol",
                "undecan-5-ol",
                "undecan-6-ol"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "Isopropanol (2-propanol)",
            "Butan-2-ol",
            "Pentan-2-ol",
            "Hexan-2-ol",
            "Heptan-2-ol",
            "Octan-2-ol",
            "Nonan-2-ol",
            "Decan-2-ol",
            "Undecan-2-ol",
            "Dodecan-2-ol",
            "Tridecan-2-ol",
            "Tetradecan-2-ol",
            "Pentadecan-2-ol",
            "Hexadecan-2-ol",
            "Heptadecan-2-ol",
            "Octadecan-2-ol",
            "Nonadecan-2-ol",
            "Eicosan-2-ol",
            "Docosan-2-ol",
            "Tetracosan-2-ol",
            "Hexacosan-2-ol",
            "Octacosan-2-ol",
            "Triacontan-2-ol",
            "Dotriacontan-2-ol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Butan-2-ol",
                "Pentan-2-ol",
                "Hexan-2-ol",
                "Heptan-2-ol",
                "Octan-2-ol",
                "Nonan-2-ol",
                "Decan-2-ol",
                "Undecan-2-ol",
                "Dodecan-2-ol",
                "Tridecan-2-ol",
                "Tetradecan-2-ol",
                "Pentadecan-2-ol",
                "Hexadecan-2-ol",
                "Heptadecan-2-ol",
                "Octadecan-2-ol",
                "Nonadecan-2-ol",
                "Docosan-2-ol",
                "Tetracosan-2-ol",
                "Hexacosan-2-ol"
            ],
            "mismatches": [
                "Isopropanol (2-propanol)",
                "Eicosan-2-ol",
                "Octacosan-2-ol",
                "Triacontan-2-ol",
                "Dotriacontan-2-ol"
            ],
            "true_referents": [
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-butan-2-ol",
                "(2S)-octan-2-ol",
                "Isopropyl propionate",
                "butan-2-ol",
                "decan-2-ol",
                "decan-3-ol",
                "decan-5-ol",
                "docosan-2-ol",
                "docosan-5-ol",
                "docosan-8-ol",
                "dodecan-2-ol",
                "dodecan-4-ol",
                "dodecan-5-ol",
                "heptadecan-2-ol",
                "heptadecan-5-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "heptan-4-ol",
                "hexacosan-2-ol",
                "hexacosan-5-ol",
                "hexacosan-8-ol",
                "hexadecan-2-ol",
                "hexadecan-5-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "isopropyl ester",
                "nonadecan-2-ol",
                "nonadecan-5-ol",
                "nonadecan-8-ol",
                "nonan-2-ol",
                "nonan-4-ol",
                "nonan-5-ol",
                "octadecan-2-ol",
                "octadecan-5-ol",
                "octadecan-8-ol",
                "octan-2-ol",
                "pentacosan-2-ol",
                "pentadecan-2-ol",
                "pentadecan-4-ol",
                "pentadecan-5-ol",
                "pentan-2-ol",
                "pentan-3-ol",
                "tetracosan-2-ol",
                "tetracosan-4-ol",
                "tetracosan-5-ol",
                "tetradecan-2-ol",
                "tetradecan-4-ol",
                "tetradecan-5-ol",
                "tricosan-2-ol",
                "tridecan-2-ol",
                "tridecan-3-ol",
                "tridecan-5-ol",
                "undecan-2-ol",
                "undecan-3-ol",
                "undecan-5-ol"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "Isopropanol (isopropyl alcohol)",
            "Cyclohexanol",
            "2-Butanol (sec-butanol)",
            "2-Pentanol",
            "3-Pentanol",
            "2-Hexanol",
            "3-Hexanol",
            "2-Heptanol",
            "3-Heptanol",
            "2-Octanol",
            "3-Octanol",
            "2-Nonanol",
            "3-Nonanol",
            "2-Decanol",
            "3-Decanol",
            "1-Phenylethanol",
            "Cyclopentanol",
            "Cyclopropanol",
            "4-Methyl-2-pentanol",
            "3-Methyl-2-butanol",
            "2-Methyl-3-butanol",
            "3-Methyl-3-pentanol",
            "2,3-Dimethyl-2-butanol",
            "2-Butyl-2-propanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclohexanol",
                "2-Heptanol",
                "3-Heptanol",
                "3-Methyl-2-butanol",
                "2-Pentanol",
                "3-Pentanol",
                "2-Hexanol",
                "3-Hexanol",
                "2-Octanol",
                "3-Octanol",
                "2-Nonanol",
                "3-Nonanol",
                "2-Decanol",
                "3-Decanol"
            ],
            "mismatches": [
                "Isopropanol (isopropyl alcohol)",
                "2-Butanol (sec-butanol)",
                "1-Phenylethanol",
                "Cyclopentanol",
                "Cyclopropanol",
                "4-Methyl-2-pentanol",
                "2-Methyl-3-butanol",
                "3-Methyl-3-pentanol",
                "2,3-Dimethyl-2-butanol",
                "2-Butyl-2-propanol"
            ],
            "true_referents": [
                "(+/-)-4-Mercapto-4-methyl-2-pentanol",
                "(1S,4E,8E,12E)-2,2,5,9,13-pentamethylcyclopentadeca-4,8,12-trien-1-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-butan-2-ol",
                "(2S)-octan-2-ol",
                "(S,S)-butane-2,3-diol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-(3,4-dimethoxyphenyl)ethane-1,2-diol",
                "1-bromo-2-propanol",
                "1-cyclopentylethanol",
                "1-tert-Butoxy-2-propanol",
                "2,2,4-trimethyl-1,3-Pentanediol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-Methyloctan-4R-ol",
                "2-methyl-5-nonanol",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "5-Methylhexan-3-ol",
                "Isopropyl propionate",
                "butane-2,3-diol",
                "cyclohexanol",
                "decan-2-ol",
                "decan-3-ol",
                "diphenylmethanol",
                "heptan-2-ol",
                "heptan-3-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "isopropyl ester",
                "isopropyl palmitate",
                "meso-butane-2,3-diol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "octan-4-ol",
                "pentadecan-2-ol",
                "pentan-2-ol",
                "pentan-3-ol",
                "sec-butyl butyrate"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "Isopropanol (IPA)",
            "2-Butanol",
            "Cyclohexanol",
            "Menthol",
            "Cholesterol",
            "2-Propanol",
            "sec-Butyl alcohol",
            "3-Pentanol",
            "2-Octanol",
            "Borneol",
            "Isoborneol",
            "Terpineol",
            "Linalool",
            "Geraniol",
            "Citronellol",
            "Testosterone",
            "Estradiol",
            "Cortisol",
            "Progesterone",
            "Ergosterol",
            "Camphor",
            "Fenchyl alcohol",
            "2-Methylbutan-2-ol",
            "3-Hexanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclohexanol",
                "Cholesterol",
                "Ergosterol"
            ],
            "mismatches": [
                "Isopropanol (IPA)",
                "2-Butanol",
                "Menthol",
                "2-Propanol",
                "sec-Butyl alcohol",
                "3-Pentanol",
                "2-Octanol",
                "Borneol",
                "Isoborneol",
                "Terpineol",
                "Linalool",
                "Geraniol",
                "Citronellol",
                "Testosterone",
                "Estradiol",
                "Cortisol",
                "Progesterone",
                "Camphor",
                "Fenchyl alcohol",
                "2-Methylbutan-2-ol",
                "3-Hexanol"
            ],
            "true_referents": [
                "(+)-isodihydrocarveol",
                "(+)-menthol",
                "(+)-neoisodihydrocarveol",
                "(-)-isodihydrocarveol",
                "(-)-menthol",
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-octan-2-ol",
                "1-bromo-2-propanol",
                "16beta-hydroxyestrone",
                "17beta-hydroxy-5-androsten-3-one",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-Methyloctan-4R-ol",
                "2-Methyloctan-4S-ol",
                "2-hydroxy-1-phenyl-1-propanone",
                "21-hydroxypregnenolone",
                "2beta-hydroxytestosterone",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-2-pentanone",
                "3-Hydroxy-3-methylbutan-2-one",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "5-Methylhexan-3-ol",
                "5beta-dihydrocortisol",
                "6alpha-hydroxyestrone",
                "Antcamphorol A",
                "Linalool oxide (trans-pyranoid)",
                "Linalool oxide III",
                "Nitrothal-isopropyl",
                "androsterone",
                "buddlenol B",
                "butan-2-ol",
                "campesterol",
                "castasterone",
                "cholesterol",
                "cholesterol-2,2,3,4,4,6-d6",
                "cyclohexanol",
                "dehydroergosterol",
                "ergosterol",
                "ganoderol B",
                "hexan-3-ol",
                "hypodiol",
                "isopropyl ester",
                "isopropyl palmitate",
                "isopropyl salicylate",
                "linalool oxide pyranoside",
                "octan-2-ol",
                "odoratol",
                "pentan-3-ol",
                "pregnenolone",
                "prostaglandin F1alpha alcohol",
                "pyriculol",
                "sec-butyl butyrate",
                "secondary fatty alcohol",
                "terpentecin",
                "tetrahydrocortisol",
                "vepaol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "Propan-2-ol (Isopropyl alcohol)",
            "Butan-2-ol (sec-Butyl alcohol)",
            "Pentan-2-ol (sec-Amyl alcohol)",
            "Hexan-2-ol",
            "Hexan-3-ol",
            "Heptan-2-ol",
            "Heptan-3-ol",
            "Heptan-4-ol",
            "Octan-2-ol",
            "Octan-3-ol",
            "Octan-4-ol",
            "Nonan-2-ol",
            "Nonan-3-ol",
            "Nonan-4-ol",
            "Nonan-5-ol",
            "Decan-2-ol",
            "Decan-3-ol",
            "Decan-4-ol",
            "Decan-5-ol",
            "Cyclohexanol",
            "2-Methylcyclohexanol",
            "3-Methylcyclohexanol",
            "4-Methylcyclohexanol",
            "2-Phenylethanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "propan-2-ol",
                "butan-2-ol",
                "pentan-2-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "heptan-4-ol",
                "octan-2-ol",
                "octan-3-ol",
                "octan-4-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "nonan-5-ol",
                "decan-2-ol",
                "decan-3-ol",
                "decan-4-ol",
                "decan-5-ol",
                "cyclohexanol"
            ],
            "mismatches": [
                "2-methylcyclohexanol",
                "3-methylcyclohexanol",
                "4-methylcyclohexanol",
                "2-phenylethanol"
            ],
            "true_referents": [
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-butan-2-ol",
                "(2S)-octan-2-ol",
                "1-(3,4-dimethoxyphenyl)ethane-1,2-diol",
                "1-Hexen-3-ol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-[(dimethylamino)methyl]-1-(3-methoxyphenyl)cyclohexanol",
                "2-hydroxy-1-phenyl-1-propanone",
                "3,3,5-trimethylcyclohexanol",
                "3-methyl-2-pentanol",
                "Isopropyl propionate",
                "butan-2-ol",
                "cyclohexanol",
                "decan-2-ol",
                "decan-3-ol",
                "decan-4-ol",
                "decan-5-ol",
                "heptan-2-ol",
                "heptan-3-ol",
                "heptan-4-ol",
                "hexan-2-ol",
                "hexan-3-ol",
                "nonan-2-ol",
                "nonan-3-ol",
                "nonan-4-ol",
                "nonan-5-ol",
                "octan-2-ol",
                "octan-3-ol",
                "octan-4-ol",
                "pentan-2-ol",
                "pentan-3-ol",
                "propan-2-ol"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "Isopropyl alcohol (IPA)",
            "2-Butanol",
            "2-Pentanol",
            "2-Hexanol",
            "2-Heptanol",
            "2-Octanol",
            "2-Nonanol",
            "2-Decanol",
            "Cyclohexanol",
            "Menthol",
            "Cholesterol",
            "Glycerol",
            "Ethylene glycol",
            "Propylene glycol",
            "1,2-Propanediol",
            "1,3-Propanediol",
            "1,2-Butanediol",
            "1,3-Butanediol",
            "1,4-Butanediol",
            "2,3-Butanediol",
            "Lactic acid",
            "Malic acid",
            "Tartaric acid",
            "Citric acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Butanol",
                "2-Hexanol",
                "2-Octanol",
                "Cyclohexanol",
                "Cholesterol",
                "2,3-Butanediol"
            ],
            "mismatches": [
                "Isopropyl alcohol (IPA)",
                "2-Pentanol",
                "2-Heptanol",
                "2-Nonanol",
                "2-Decanol",
                "Menthol",
                "Glycerol",
                "Ethylene glycol",
                "Propylene glycol",
                "1,2-Propanediol",
                "1,3-Propanediol",
                "1,2-Butanediol",
                "1,3-Butanediol",
                "1,4-Butanediol",
                "Lactic acid",
                "Malic acid",
                "Tartaric acid",
                "Citric acid"
            ],
            "true_referents": [
                "(+)-menthol",
                "(-)-menthol",
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "(R,R)-butane-2,3-diol",
                "(S,S)-butane-2,3-diol",
                "1,7-decanediol",
                "1,9-decanediol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-methyl-5-nonanol",
                "3,3,5-trimethylcyclohexanol",
                "3-(2-methylthioethyl)malic acid",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "Heptapropylene glycol",
                "Isopropyl propionate",
                "Pentapropylene glycol",
                "butan-2-ol",
                "butane-2,3-diol",
                "cholesterol",
                "cholesterol-2,2,3,4,4,6-d6",
                "cyclohexanol",
                "decan-2-ol",
                "ethyl (2R)-lactate",
                "ethyl 2-hydroxypropanoate",
                "ethyl hydroxy(phenyl)acetate",
                "heptan-2-ol",
                "hexan-2-ol",
                "hexane-2,5-diol",
                "isocitric acid",
                "isopropyl ester",
                "isopropyl palmitate",
                "isopropyl salicylate",
                "lactate ester",
                "meso-butane-2,3-diol",
                "methylisocitric acid",
                "nonan-2-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "pentadecan-2-ol",
                "pentan-2-ol"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (IPA)",
            "2-Butanol",
            "2-Pentanol",
            "2-Hexanol",
            "2-Heptanol",
            "2-Octanol",
            "2-Nonanol",
            "2-Decanol",
            "2-Undecanol",
            "2-Dodecanol",
            "2-Tridecanol",
            "2-Tetradecanol",
            "2-Pentadecanol",
            "2-Hexadecanol",
            "2-Heptadecanol",
            "2-Octadecanol",
            "2-Nonadecanol",
            "2-Eicosanol",
            "2-Heneicosanol",
            "2-Docosanol",
            "2-Tricosanol",
            "2-Tetracosanol",
            "2-Pentacosanol",
            "2-Hexacosanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Butanol",
                "2-Hexanol",
                "2-Octanol",
                "2-Nonanol",
                "2-Decanol",
                "2-Undecanol",
                "2-Dodecanol",
                "2-Tridecanol",
                "2-Pentadecanol",
                "2-Heneicosanol",
                "2-Docosanol",
                "2-Tricosanol",
                "2-Tetracosanol",
                "2-Pentacosanol",
                "2-Hexacosanol"
            ],
            "mismatches": [
                "2-Propanol (IPA)",
                "2-Pentanol",
                "2-Heptanol",
                "2-Tetradecanol",
                "2-Hexadecanol",
                "2-Heptadecanol",
                "2-Octadecanol",
                "2-Nonadecanol",
                "2-Eicosanol"
            ],
            "true_referents": [
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "(3R,12R)-3,12-dihydroxytridecanoic acid",
                "(7R,14S)-dihydroxy-(8E,10E,12Z,16Z,19Z)-docosapentaenoic acid",
                "(9R)-9-hydroxydecanoic acid",
                "1,2-dodecanediol",
                "1,7-decanediol",
                "1,9-decanediol",
                "12-(octadecanoyloxy)octadecanoic acid",
                "2-hydroxyoctadecanal",
                "2-methyl-5-nonanol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "Isopropyl propionate",
                "butan-2-ol",
                "cholesteryl heptadecanoate",
                "cholesteryl nonadecanoate",
                "decan-2-ol",
                "docosan-2-ol",
                "dodecan-2-ol",
                "dodecan-5-ol",
                "henicosan-2-ol",
                "henicosan-3-ol",
                "henicosan-6-ol",
                "heptan-2-ol",
                "hexacosan-2-ol",
                "hexacosan-6-ol",
                "hexacosan-8-ol",
                "hexan-2-ol",
                "hexane-2,5-diol",
                "nonan-2-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "pentacosan-2-ol",
                "pentacosan-5-ol",
                "pentacosan-6-ol",
                "pentadecan-2-ol",
                "pentadecan-4-ol",
                "pentadecan-5-ol",
                "pentan-2-ol",
                "prostaglandin E2",
                "prostaglandin E2 2-glyceryl ester",
                "tetracosan-12-ol",
                "tetracosan-2-ol",
                "tricosan-2-ol",
                "tricosan-8-ol",
                "tridecan-2-ol",
                "undecan-2-ol",
                "undecan-5-ol",
                "undecan-6-ol"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "1-Propanol (1-PrOH)",
            "2-Methyl-1-propanol (2-Me-1-PrOH)",
            "3-Methyl-1-butanol (3-Me-1-BuOH)",
            "4-Methyl-2-pentanol (4-Me-2-PenOH)",
            "5-Methyl-3-hexanol (5-Me-3-HexOH)",
            "Cyclohexanol",
            "Cyclopentanol",
            "Ethylene glycol (EG)",
            "Glycerol (Gly)",
            "Isopropanol (IPA)",
            "Menthyl alcohol",
            "Phenylethanol",
            "Tetrahydrofurfuryl alcohol",
            "Triethanolamine (TEA)",
            "1,2-Propanediol",
            "1,3-Propanediol",
            "1,4-Butanediol",
            "1,5-Pentanediol",
            "1,6-Hexanediol",
            "1,7-Heptanediol",
            "2,3-Butanediol",
            "2,4-Pentanediol",
            "2,5-Hexanediol",
            "2,6-Heptanediol",
            "2,7-Octanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyclohexanol",
                "2,5-hexanediol"
            ],
            "mismatches": [
                "1-Propanol (1-PrOH)",
                "2-Methyl-1-propanol (2-Me-1-PrOH)",
                "3-Methyl-1-butanol (3-Me-1-BuOH)",
                "4-Methyl-2-pentanol (4-Me-2-PenOH)",
                "5-Methyl-3-hexanol (5-Me-3-HexOH)",
                "Cyclopentanol",
                "Ethylene glycol (EG)",
                "Glycerol (Gly)",
                "Isopropanol (IPA)",
                "Menthyl alcohol",
                "Phenylethanol",
                "Tetrahydrofurfuryl alcohol",
                "Triethanolamine (TEA)",
                "1,2-Propanediol",
                "1,3-Propanediol",
                "1,4-Butanediol",
                "1,5-Pentanediol",
                "1,6-Hexanediol",
                "1,7-Heptanediol",
                "2,3-Butanediol",
                "2,4-Pentanediol",
                "2,6-Heptanediol",
                "2,7-Octanediol"
            ],
            "true_referents": [
                "(+/-)-4-Mercapto-4-methyl-2-pentanol",
                "(-)-epigallocatechin 3-gallate",
                "(-)-menthyl beta-D-glucoside",
                "(1S,4E,8E,12E)-2,2,5,9,13-pentamethylcyclopentadeca-4,8,12-trien-1-ol",
                "(2R,4S)-2-methyl-2,4-dihydroxydihydrofuran-3-one",
                "(2R,5R)-hexanediol",
                "(2S,5S)-hexanediol",
                "(3R,4S,1'R)-3-(1'-hydroxyethyl)-4-methyldihydrofuran-2(3H)-one",
                "(S,S)-butane-2,3-diol",
                "1,2-dodecanediol",
                "1,4-dodecanediol",
                "1,5-dodecanediol",
                "1,6-dodecanediol",
                "1,7-decanediol",
                "1,7-dodecanediol",
                "1,9-decanediol",
                "1-bromo-2-propanol",
                "1-cyclopentylethanol",
                "1-mononitroglycerol",
                "2,2,4-trimethyl-1,3-Pentanediol",
                "2-Hydroxy-2,6,6-trimethylcyclohexanone",
                "2-hydroxy-1-phenyl-1-propanone",
                "3,3,5-trimethylcyclohexanol",
                "3-Hydroxy-3-methylbutan-2-one",
                "3-Methylhexan-2-ol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "4-formyl-2-methoxyphenyl L-menthyl glutarate",
                "4S-Methylhexan-3S-ol",
                "5-Methylhexan-3-ol",
                "5-hydroxy-3-methylfuran-2(5H)-one",
                "Heptapropylene glycol",
                "Pentapropylene glycol",
                "Polypropylene glycol (m w 1,200-3,000)",
                "butane-2,3-diol",
                "campesterol",
                "cyclohexanol",
                "diphenylmethanol",
                "ethyl 3-hydroxybutyrate",
                "ethyl hydroxy(phenyl)acetate",
                "hexane-2,5-diol",
                "isopropyl ester",
                "isopropyl palmitate",
                "meso-butane-2,3-diol",
                "pentadecan-5-ol",
                "pentan-2-ol",
                "propan-2-ol"
            ],
            "TP": 2,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (Isopropyl alcohol)",
            "2-Butanol",
            "2-Pentanol",
            "2-Hexanol",
            "2-Heptanol",
            "2-Octanol",
            "2-Nonanol",
            "2-Decanol",
            "1-Phenylethanol",
            "1-Cyclohexylethanol",
            "Benzhydrol (Diphenylmethanol)",
            "2-Phenyl-2-propanol",
            "2-(2-Chlorophenyl)-2-propanol",
            "2-(4-Isobutylphenyl)-2-propanol (IBP)",
            "2-(2,4,4-Trimethyl-1-pentyl)-2-propanol (TXIB)",
            "2-(2-Hydroxy-5-nitrophenyl)-2-propanol",
            "2-(2-Methoxy-5-nitrophenyl)-2-propanol",
            "2-(2-Hydroxy-3-methylphenyl)-2-propanol",
            "2-(2-Methoxy-3-methylphenyl)-2-propanol",
            "2-(2-Hydroxy-4-methylphenyl)-2-propanol",
            "2-(2-Methoxy-4-methylphenyl)-2-propanol",
            "2-(2-Hydroxy-5-methylphenyl)-2-propanol",
            "2-(2-Methoxy-5-methylphenyl)-2-propanol",
            "2-(2-Hydroxy-6-methylphenyl)-2-propanol",
            "2-(2-Methoxy-6-methylphenyl)-2-propanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Butanol",
                "2-Pentanol",
                "2-Hexanol",
                "2-Heptanol",
                "2-Octanol",
                "Diphenylmethanol"
            ],
            "mismatches": [
                "2-Propanol (Isopropyl alcohol)",
                "2-Nonanol",
                "2-Decanol",
                "1-Phenylethanol",
                "1-Cyclohexylethanol",
                "2-Phenyl-2-propanol",
                "2-(2-Chlorophenyl)-2-propanol",
                "2-(4-Isobutylphenyl)-2-propanol (IBP)",
                "2-(2,4,4-Trimethyl-1-pentyl)-2-propanol (TXIB)",
                "2-(2-Hydroxy-5-nitrophenyl)-2-propanol",
                "2-(2-Methoxy-5-nitrophenyl)-2-propanol",
                "2-(2-Hydroxy-3-methylphenyl)-2-propanol",
                "2-(2-Methoxy-3-methylphenyl)-2-propanol",
                "2-(2-Hydroxy-4-methylphenyl)-2-propanol",
                "2-(2-Methoxy-4-methylphenyl)-2-propanol",
                "2-(2-Hydroxy-5-methylphenyl)-2-propanol",
                "2-(2-Methoxy-5-methylphenyl)-2-propanol",
                "2-(2-Hydroxy-6-methylphenyl)-2-propanol",
                "2-(2-Methoxy-6-methylphenyl)-2-propanol"
            ],
            "true_referents": [
                "(+)-dihydrocarveol",
                "(-)E-1-Chlorotridec-1-ene-6,8-diol",
                "(2R)-butan-2-ol",
                "(2R)-octan-2-ol",
                "(2R*,3R*)-1,2,3-Butanetriol",
                "(2S)-2-heptanol",
                "(2S)-octan-2-ol",
                "1,2-bis(4-hydroxyphenyl)-2-propanol",
                "1,2-bis(4-hydroxyphenyl)propan-2-ol",
                "1,3-dichloropropan-2-ol",
                "1,7-decanediol",
                "1,9-decanediol",
                "1-(3,4-dimethoxyphenyl)ethane-1,2-diol",
                "1-(4-methoxyphenyl)-2-\\{[4-(4-nitrophenyl)butan-2-yl]amino\\}ethanol",
                "1-bromo-2-propanol",
                "1-chloropropan-2-ol",
                "1-cyclopentylethanol",
                "1-tert-Butoxy-2-propanol",
                "2,2,4-trimethyl-1,3-Pentanediol",
                "2-hydroxy-1-phenyl-1-propanone",
                "2-methyl-5-nonanol",
                "3,3,5-trimethylcyclohexanol",
                "3-methyl-2-butanol",
                "3-methyl-2-pentanol",
                "4-(1-hydroxypropyl)-2-methoxy-6-(2-methoxy-4-propylphenoxy)phenol",
                "Isopropyl propionate",
                "butan-2-ol",
                "cyclohexanol",
                "decan-2-ol",
                "diphenylmethanol",
                "heptan-2-ol",
                "hexan-2-ol",
                "isopropyl 3-hydroxybut-2-enoate",
                "isopropyl ester",
                "nonan-2-ol",
                "nonan-4-ol",
                "octan-2-ol",
                "pentadecan-2-ol",
                "pentan-2-ol"
            ],
            "TP": 6,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "secondary alcohol",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Isopropyl alcohol",
                "Canonical name": "(CH3)2CHOH"
            },
            {
                "Referent": "Butyl alcohol",
                "Canonical name": "(CH3)3CHOH"
            },
            {
                "Referent": "Phenylmethyl alcohol",
                "Canonical name": "(CH3)2C6H5OH"
            },
            {
                "Referent": "Benzyl alcohol",
                "Canonical name": "(CH3)2C6H5CH2OH"
            },
            {
                "Referent": "Methylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H4CH2OH"
            },
            {
                "Referent": "Ethylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H4CH2CH2OH"
            },
            {
                "Referent": "Propylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H3CH2OH"
            },
            {
                "Referent": "Isopropylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H3CH2CH2OH"
            },
            {
                "Referent": "Butylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H2CH2OH"
            },
            {
                "Referent": "Phenylmethylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H4CH2CH2OH"
            },
            {
                "Referent": "Benzylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H3CH2CH2OH"
            },
            {
                "Referent": "Methylphenylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H4CH2CH2CH2OH"
            },
            {
                "Referent": "Ethylphenylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H4CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Propylphenylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H3CH2CH2CH2OH"
            },
            {
                "Referent": "Isopropylphenylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H3CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Butylphenylbenzyl alcohol",
                "Canonical name": "(CH3)2C6H2CH2CH2CH2OH"
            },
            {
                "Referent": "Phenylmethanol",
                "Canonical name": "(CH3)2CHOH"
            },
            {
                "Referent": "Benzylmethanol",
                "Canonical name": "(CH3)2CH2CH2OH"
            },
            {
                "Referent": "Methylbenzylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2OH"
            },
            {
                "Referent": "Ethylbenzylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Propylbenzylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Isopropylbenzylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Butylbenzylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Phenylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2OH"
            },
            {
                "Referent": "Benzylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Methylphenylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Ethylphenylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Propylphenylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Isopropylphenylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2CH2OH"
            },
            {
                "Referent": "Butylphenylmethanol",
                "Canonical name": "(CH3)2CH2CH2CH2CH2CH2CH2CH2OH"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Isopropyl alcohol",
                "Butyl alcohol",
                "Phenylmethyl alcohol",
                "Benzyl alcohol",
                "Methylbenzyl alcohol",
                "Ethylbenzyl alcohol",
                "Propylbenzyl alcohol",
                "Isopropylbenzyl alcohol",
                "Butylbenzyl alcohol",
                "Phenylmethylbenzyl alcohol",
                "Benzylbenzyl alcohol",
                "Methylphenylbenzyl alcohol",
                "Ethylphenylbenzyl alcohol",
                "Propylphenylbenzyl alcohol",
                "Isopropylphenylbenzyl alcohol",
                "Butylphenylbenzyl alcohol",
                "Phenylmethanol",
                "Benzylmethanol",
                "Methylbenzylmethanol",
                "Ethylbenzylmethanol",
                "Propylbenzylmethanol",
                "Isopropylbenzylmethanol",
                "Butylbenzylmethanol",
                "Methylphenylmethanol",
                "Ethylphenylmethanol",
                "Propylphenylmethanol",
                "Isopropylphenylmethanol",
                "Butylphenylmethanol"
            ],
            "true_referents": [
                "(+)-isodihydrocarveol",
                "(+/-)-4-Mercapto-4-methyl-2-pentanol",
                "(R,R)-butane-2,3-diol",
                "(S)-4,5-dihydroxypentane-2,3-dione",
                "(S,S)-butane-2,3-diol",
                "1,1,1,3,3,3-hexafluoropropan-2-ol",
                "2-methyl-5-nonanol",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-2-butanol",
                "diphenylmethanol",
                "isopropyl 3-hydroxybut-2-enoate"
            ],
            "TP": 0,
            "FP": 28,
            "FN": 0
        }
    }
]