[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Propanol (IPA)",
            "2-Methyl-2-propanol (t-Amyl alcohol)",
            "2-Methyl-1-butanol (tert-Amyl alcohol)",
            "2-Methyl-2-butanol (sec-Amyl alcohol)",
            "2-Methyl-2-pentanol",
            "2-Methyl-2-hexanol",
            "2-Methyl-2-heptanol",
            "2-Methyl-2-octanol",
            "2-Methyl-2-nonanol",
            "2-Methyl-2-decanol",
            "2-Ethyl-2-butanol",
            "2-Ethyl-2-hexanol",
            "2-Ethyl-2-octanol",
            "2-Ethyl-2-decanol",
            "2,2-Dimethyl-1-propanol",
            "2,2-Dimethyl-1-butanol",
            "2,2-Dimethyl-1-hexanol",
            "2,2-Dimethyl-1-octanol",
            "2,2-Dimethyl-1-decanol",
            "2,2-Dimethyl-3-pentanol",
            "2,2-Dimethyl-3-hexanol",
            "2,2-Dimethyl-3-heptanol",
            "2,2-Dimethyl-3-octanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "2-Propanol (IPA)",
                "2-Methyl-2-propanol (t-Amyl alcohol)",
                "2-Methyl-1-butanol (tert-Amyl alcohol)",
                "2-Methyl-2-butanol (sec-Amyl alcohol)",
                "2-Methyl-2-pentanol",
                "2-Methyl-2-hexanol",
                "2-Methyl-2-heptanol",
                "2-Methyl-2-octanol",
                "2-Methyl-2-nonanol",
                "2-Methyl-2-decanol",
                "2-Ethyl-2-butanol",
                "2-Ethyl-2-hexanol",
                "2-Ethyl-2-octanol",
                "2-Ethyl-2-decanol",
                "2,2-Dimethyl-1-propanol",
                "2,2-Dimethyl-1-butanol",
                "2,2-Dimethyl-1-hexanol",
                "2,2-Dimethyl-1-octanol",
                "2,2-Dimethyl-1-decanol",
                "2,2-Dimethyl-3-pentanol",
                "2,2-Dimethyl-3-hexanol",
                "2,2-Dimethyl-3-heptanol",
                "2,2-Dimethyl-3-octanol"
            ],
            "true_referents": [
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-methyl-3-heptanol",
                "6-amino-2-methyl-2-heptanol",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "tert-butanol"
            ],
            "TP": 0,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "1-Phenyl-2-propanol (CAS: 1569-60-0)",
            "2-Methyl-2-propanol (tert-Butyl alcohol, CAS: 75-65-0)",
            "2-Methyl-2-butanol (CAS: 75-85-4)",
            "2-Methyl-2-pentanol (CAS: 75-84-3)",
            "2-Methyl-2-hexanol (CAS: 589-35-5)",
            "3-Methyl-3-pentanol (CAS: 565-67-3)",
            "3,3-Dimethyl-2-butanol (CAS: 594-82-1)",
            "2,2-Dimethyl-3-pentanol (CAS: 565-68-4)",
            "3,3-Dimethyl-2-pentanol (CAS: 565-70-8)",
            "3-Ethyl-3-pentanol (CAS: 597-29-1)",
            "2,2,3-Trimethyl-3-pentanol (CAS: 1679-85-0)",
            "1-Phenylethanol (CAS: 60-12-8)",
            "2,3-Dimethyl-2-butanol (CAS: 75-84-3)",
            "2,2,3-Trimethyl-2-butanol (CAS: 594-82-1)",
            "3,3-Diethyl-2-butanol (CAS: 597-78-8)",
            "2,2-Dimethyl-3-pentanol (CAS: 565-69-5)",
            "2,3,3-Trimethyl-2-butanol (CAS: 594-82-1)",
            "3,3-Diethyl-2-butanol (CAS: 597-78-8)",
            "1-Phenyl-1-propanol (CAS: 1569-60-0)",
            "2,2-Dimethyl-3-hexanol (CAS: 597-80-2)",
            "3,3-Dimethyl-3-pentanol (CAS: 564-00-3)",
            "2,2,4-Trimethyl-3-pentanol (CAS: 1679-85-0)",
            "3,3-Diethyl-3-pentanol (CAS: 1679-86-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Methyl-2-butanol (CAS: 75-85-4)",
                "2-Methyl-2-propanol (tert-Butyl alcohol, CAS: 75-65-0)"
            ],
            "mismatches": [
                "1-Phenyl-2-propanol (CAS: 1569-60-0)",
                "2-Methyl-2-pentanol (CAS: 75-84-3)",
                "2-Methyl-2-hexanol (CAS: 589-35-5)",
                "3-Methyl-3-pentanol (CAS: 565-67-3)",
                "3,3-Dimethyl-2-butanol (CAS: 594-82-1)",
                "2,2-Dimethyl-3-pentanol (CAS: 565-68-4)",
                "3,3-Dimethyl-2-pentanol (CAS: 565-70-8)",
                "3-Ethyl-3-pentanol (CAS: 597-29-1)",
                "2,2,3-Trimethyl-3-pentanol (CAS: 1679-85-0)",
                "1-Phenylethanol (CAS: 60-12-8)",
                "2,3-Dimethyl-2-butanol (CAS: 75-84-3)",
                "2,2,3-Trimethyl-2-butanol (CAS: 594-82-1)",
                "3,3-Diethyl-2-butanol (CAS: 597-78-8)",
                "2,2-Dimethyl-3-pentanol (CAS: 565-69-5)",
                "2,3,3-Trimethyl-2-butanol (CAS: 594-82-1)",
                "1-Phenyl-1-propanol (CAS: 1569-60-0)",
                "2,2-Dimethyl-3-hexanol (CAS: 597-80-2)",
                "3,3-Dimethyl-3-pentanol (CAS: 564-00-3)",
                "2,2,4-Trimethyl-3-pentanol (CAS: 1679-85-0)",
                "3,3-Diethyl-3-pentanol (CAS: 1679-86-1)"
            ],
            "true_referents": [
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-3,7-octadiene-2,6-diol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-methyl-3-heptanol",
                "5-Methyl-5-pentacosanol",
                "6-amino-2-methyl-2-heptanol",
                "7-epi-ent-eudesmane-5,11-diol",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "ethylestrenol",
                "tert-butanol",
                "tris(4-chlorophenyl)methanol"
            ],
            "TP": 2,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-methyl-2-propanol (tert-butanol)",
            "2-methyl-2-butanol",
            "3-methyl-3-pentanol",
            "2,3-dimethyl-2-butanol",
            "2-methyl-2-pentanol",
            "2-ethyl-2-butanol",
            "2,4-dimethyl-2-pentanol",
            "2-methyl-2-hexanol",
            "3-ethyl-3-pentanol",
            "2,3,3-trimethyl-2-butanol",
            "2,2,3-trimethyl-3-pentanol",
            "2-methyl-2-heptanol",
            "2-ethyl-2-pentanol",
            "2,4-dimethyl-2-hexanol",
            "2,3,4-trimethyl-2-pentanol",
            "2,2,4-trimethyl-3-pentanol",
            "2,3,3-trimethyl-2-pentanol",
            "2,3,4-trimethyl-2-hexanol",
            "2-methyl-2-octanol",
            "2-ethyl-2-hexanol",
            "2,4-dimethyl-2-heptanol",
            "2,3,4-trimethyl-2-hexanol",
            "2,3,3-trimethyl-2-hexanol",
            "2,2,4-trimethyl-3-hexanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "tert-butanol"
            ],
            "mismatches": [
                "2-methyl-2-butanol",
                "3-methyl-3-pentanol",
                "2,3-dimethyl-2-butanol",
                "2-methyl-2-pentanol",
                "2-ethyl-2-butanol",
                "2,4-dimethyl-2-pentanol",
                "2-methyl-2-hexanol",
                "3-ethyl-3-pentanol",
                "2,3,3-trimethyl-2-butanol",
                "2,2,3-trimethyl-3-pentanol",
                "2-methyl-2-heptanol",
                "2-ethyl-2-pentanol",
                "2,4-dimethyl-2-hexanol",
                "2,3,4-trimethyl-2-pentanol",
                "2,2,4-trimethyl-3-pentanol",
                "2,3,3-trimethyl-2-pentanol",
                "2,3,4-trimethyl-2-hexanol",
                "2-methyl-2-octanol",
                "2-ethyl-2-hexanol",
                "2,4-dimethyl-2-heptanol",
                "2,3,4-trimethyl-2-hexanol",
                "2,3,3-trimethyl-2-hexanol",
                "2,2,4-trimethyl-3-hexanol"
            ],
            "true_referents": [
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-3-heptanol",
                "6-amino-2-methyl-2-heptanol",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "tert-butanol"
            ],
            "TP": 1,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Methyl-2-propanol (t-Butanol)",
            "3-Ethyl-3-pentanol",
            "2-Phenyl-2-propanol",
            "Cyclohexanol",
            "4-Methylcyclohexanol",
            "1-Methylcyclohexanol",
            "2-Ethyl-3-methyl-3-pentanol",
            "1,1-Dimethylcyclohexanol",
            "3-Ethyl-2-methyl-2-butanol",
            "1-Methyl-1-cyclohexanol",
            "2,2-Dimethyl-3-pentanol",
            "3-Hydroxy-3-methyl-2-butanone",
            "Cholesterol (a sterol)",
            "\u03b1-Terpineol",
            "\u03b2-Terpineol",
            "Linalool",
            "Geraniol",
            "Nerol",
            "Citronellol",
            "Menthol",
            "Isopulegol",
            "Bornyl alcohol",
            "Camphor (reduced form)",
            "\u03b1-Pinene hydrate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Phenyl-2-propanol",
                "1-Methylcyclohexanol",
                "\u03b2-Terpineol",
                "Linalool"
            ],
            "mismatches": [
                "2-Methyl-2-propanol (t-Butanol)",
                "3-Ethyl-3-pentanol",
                "Cyclohexanol",
                "4-Methylcyclohexanol",
                "2-Ethyl-3-methyl-3-pentanol",
                "1,1-Dimethylcyclohexanol",
                "3-Ethyl-2-methyl-2-butanol",
                "1-Methyl-1-cyclohexanol",
                "2,2-Dimethyl-3-pentanol",
                "3-Hydroxy-3-methyl-2-butanone",
                "Cholesterol (a sterol)",
                "\u03b1-Terpineol",
                "Geraniol",
                "Nerol",
                "Citronellol",
                "Menthol",
                "Isopulegol",
                "Bornyl alcohol",
                "Camphor (reduced form)",
                "\u03b1-Pinene hydrate"
            ],
            "true_referents": [
                "(+)-caryolan-1-ol",
                "(+)-cis-isohumulone",
                "(+)-isoafricanol",
                "(3R,6E)-nerolidol",
                "(3S)-3-hydroxy-3-methylglutaryl-CoA",
                "(6E)-nerolidol",
                "(R)-linalool",
                "(S)-9,10-Cyclo-p-menth-1-en-4-ol",
                "(S)-linalool",
                "(S)-mevalonolactone",
                "1-(1,4,5-trihydroxy-3-isocyanocyclopenten-2-enyl)-ethanol",
                "1-Methylcyclohexanol",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-[(dimethylamino)methyl]-1-(3-methoxyphenyl)cyclohexanol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "20(R),22(xi),24(S)-dammar-25(26)-ene-3beta,6alpha,12beta,20,22,24-hexanol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-hydroxy-3-methyl-2-oxopentanoic acid",
                "3-hydroxy-3-methylbut-1-ene",
                "3-hydroxy-3-methylglutaryl-CoA",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "4-terpineol",
                "Dihydrobungeanool",
                "beta-terpineol",
                "isowigtheone hydrate",
                "linalool",
                "myrcenol",
                "nerolidol",
                "tert-butanol",
                "tertiary allylic alcohol"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Methyl-2-propanol (TBA)",
            "2-Methyl-2-butanol",
            "2-Methyl-2-pentanol",
            "3-Methyl-3-pentanol",
            "3-Methyl-3-hexanol",
            "2,3-Dimethyl-2-butanol",
            "2,3-Dimethyl-3-pentanol",
            "2,4-Dimethyl-3-pentanol",
            "2-Ethyl-2-butanol",
            "2-Ethyl-2-pentanol",
            "2-Propyl-2-butanol",
            "2-Propyl-2-pentanol",
            "2-Phenyl-2-propanol",
            "2-Cyclohexyl-2-propanol",
            "2-Cyclopentyl-2-propanol",
            "2-(1-Cyclohexenyl)-2-propanol",
            "2-(1-Cyclopentenyl)-2-propanol",
            "2-(1-Methylcyclohexyl)-2-propanol",
            "2-(1-Methylcyclopentyl)-2-propanol",
            "2-(1-Phenylethyl)-2-propanol",
            "2-(1-Methylphenyl)-2-propanol",
            "2-(1-Ethylphenyl)-2-propanol",
            "2-(1-Isopropylphenyl)-2-propanol",
            "2-(1-tert-Butylphenyl)-2-propanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-phenylpropan-2-ol"
            ],
            "mismatches": [
                "2-Methyl-2-propanol (TBA)",
                "2-Methyl-2-butanol",
                "2-Methyl-2-pentanol",
                "3-Methyl-3-pentanol",
                "3-Methyl-3-hexanol",
                "2,3-Dimethyl-2-butanol",
                "2,3-Dimethyl-3-pentanol",
                "2,4-Dimethyl-3-pentanol",
                "2-Ethyl-2-butanol",
                "2-Ethyl-2-pentanol",
                "2-Propyl-2-butanol",
                "2-Propyl-2-pentanol",
                "2-Cyclohexyl-2-propanol",
                "2-Cyclopentyl-2-propanol",
                "2-(1-Cyclohexenyl)-2-propanol",
                "2-(1-Cyclopentenyl)-2-propanol",
                "2-(1-Methylcyclohexyl)-2-propanol",
                "2-(1-Methylcyclopentyl)-2-propanol",
                "2-(1-Phenylethyl)-2-propanol",
                "2-(1-Methylphenyl)-2-propanol",
                "2-(1-Ethylphenyl)-2-propanol",
                "2-(1-Isopropylphenyl)-2-propanol",
                "2-(1-tert-Butylphenyl)-2-propanol"
            ],
            "true_referents": [
                "(1-hydroxycyclopentyl)phenylacetic acid",
                "1-(1,4,5-trihydroxy-3-isocyanocyclopenten-2-enyl)-ethanol",
                "1-Methylcyclohexanol",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-(4-methoxyphenyl)propan-2-ol",
                "2-[(dimethylamino)methyl]-1-(3-methoxyphenyl)cyclohexanol",
                "2-[3-(2,2,3-trimethylcyclopent-3-enyl)cyclohex-3-enyl]propan-2-ol",
                "2-[4-(2,2,3-trimethylcyclopent-3-enyl)cyclohex-3-enyl]propan-2-ol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-methyl-3-heptanol",
                "6-amino-2-methyl-2-heptanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "tert-butanol"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Methyl-2-propanol (tert-Butanol)",
            "2-Pentanol",
            "2-Hexanol",
            "2-Octanol",
            "2-Nonanol",
            "2-Phenyl-2-propanol",
            "2-Butanol",
            "1,1-Dimethyl-2-propanol",
            "2-Methyl-3-pentanol",
            "2-Methyl-3-hexanol",
            "4-Methyl-2-pentanol",
            "2-Methyl-2-butanol",
            "1,1-Dimethyl-1-phenylethanol",
            "3-Methyl-3-pentanol",
            "2-Methyl-1-phenylpropan-1-ol",
            "2-Cyclohexyl-2-propanol",
            "1-Methyl-2-propanol",
            "1,1,1-Tris(hydroxymethyl)ethane",
            "3-Hydroxy-1,1-dimethyl-2-butanone",
            "1,1-Dimethyl-2-phenylethanol",
            "3-Methyl-3-hexanol",
            "2-Methyl-2-hexanol",
            "2-(4-Methylphenyl)-2-propanol",
            "2-(3,4-Dimethylphenyl)-2-propanol",
            "1,1-Diethyl-2-propanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-phenylpropan-2-ol",
                "tert-butanol"
            ],
            "mismatches": [
                "2-Methyl-2-propanol (tert-Butanol)",
                "2-Pentanol",
                "2-Hexanol",
                "2-Octanol",
                "2-Nonanol",
                "2-Phenyl-2-propanol",
                "2-Butanol",
                "1,1-Dimethyl-2-propanol",
                "2-Methyl-3-pentanol",
                "2-Methyl-3-hexanol",
                "4-Methyl-2-pentanol",
                "1,1-Dimethyl-1-phenylethanol",
                "3-Methyl-3-pentanol",
                "2-Methyl-1-phenylpropan-1-ol",
                "2-Cyclohexyl-2-propanol",
                "1-Methyl-2-propanol",
                "1,1,1-Tris(hydroxymethyl)ethane",
                "3-Hydroxy-1,1-dimethyl-2-butanone",
                "1,1-Dimethyl-2-phenylethanol",
                "3-Methyl-3-hexanol",
                "2-Methyl-2-hexanol",
                "2-(4-Methylphenyl)-2-propanol",
                "2-(3,4-Dimethylphenyl)-2-propanol",
                "1,1-Diethyl-2-propanol"
            ],
            "true_referents": [
                "(2S,3R)-3-hydroxybutane-1,2,3-tricarboxylic acid",
                "1-Methylcyclohexanol",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-(4-methoxyphenyl)propan-2-ol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-hydroxy-3-methylbut-1-ene",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-3-heptanol",
                "6-amino-2-methyl-2-heptanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "Bis[6-(3,4,7-trihydroxy-3, 7-dimethyloctenyl) ether",
                "[1-(2???-methylpropoxy)-2-hydroxy-2-methylpropoxy]butane",
                "tert-butanol"
            ],
            "TP": 4,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Methyl-2-butanol (2M2B)",
            "Tert-Amyl alcohol (TAA)",
            "Tert-Butyl alcohol (TBA)",
            "Tert-Pentyl alcohol (TPA)",
            "Tert-Octanol (TO)",
            "3-Methyl-3-pentanol (3M3P)",
            "2,2-Dimethyl-1-propanol (2,2-DM1P)",
            "3,3-Dimethyl-2-butanol (3,3-DM2B)",
            "2,2,3-Trimethylbutan-3-ol (2,2,3-TMB3O)",
            "2,2,4-Trimethylpentan-3-ol (2,2,4-TMP3O)",
            "2,2-Dimethyl-3-pentanol (2,2-DM3P)",
            "2,2,3-Trimethylpentan-3-ol (2,2,3-TMP3O)",
            "2,2,4,4-Tetramethylpentan-3-ol (2,2,4,4-TMP3O)",
            "2,2,3,3-Tetramethylbutan-2-ol (2,2,3,3-TMB2O)",
            "2,2,4,4-Tetramethylpentan-2-ol (2,2,4,4-TMP2O)",
            "2,2,3,3,4-Pentamethylpentan-3-ol (2,2,3,3,4-PMP3O)",
            "2,2,3,3,4,4-Hexamethylpentan-3-ol (2,2,3,3,4,4-HMP3O)",
            "2,2,3,3,4,4,5-Heptamethylhexan-3-ol (2,2,3,3,4,4,5-HMH3O)",
            "3,3-Dimethyl-2-pentanol (3,3-DM2P)",
            "2,2-Dimethyl-3-butanol (2,2-DM3B)",
            "3,3-Dimethyl-1-butanol (3,3-DM1B)",
            "2,2,3-Trimethylbutan-2-ol (2,2,3-TMB2O)",
            "2,2,3-Trimethylpentan-2-ol (2,2,3-TMP2O)",
            "2,2,4-Trimethylpentan-2-ol (2,2,4-TMP2O)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Methyl-2-butanol (2M2B)",
                "Tert-Butyl alcohol (TBA)"
            ],
            "mismatches": [
                "Tert-Amyl alcohol (TAA)",
                "Tert-Pentyl alcohol (TPA)",
                "Tert-Octanol (TO)",
                "3-Methyl-3-pentanol (3M3P)",
                "2,2-Dimethyl-1-propanol (2,2-DM1P)",
                "3,3-Dimethyl-2-butanol (3,3-DM2B)",
                "2,2,3-Trimethylbutan-3-ol (2,2,3-TMB3O)",
                "2,2,4-Trimethylpentan-3-ol (2,2,4-TMP3O)",
                "2,2-Dimethyl-3-pentanol (2,2-DM3P)",
                "2,2,3-Trimethylpentan-3-ol (2,2,3-TMP3O)",
                "2,2,4,4-Tetramethylpentan-3-ol (2,2,4,4-TMP3O)",
                "2,2,3,3-Tetramethylbutan-2-ol (2,2,3,3-TMB2O)",
                "2,2,4,4-Tetramethylpentan-2-ol (2,2,4,4-TMP2O)",
                "2,2,3,3,4-Pentamethylpentan-3-ol (2,2,3,3,4-PMP3O)",
                "2,2,3,3,4,4-Hexamethylpentan-3-ol (2,2,3,3,4,4-HMP3O)",
                "2,2,3,3,4,4,5-Heptamethylhexan-3-ol (2,2,3,3,4,4,5-HMH3O)",
                "3,3-Dimethyl-2-pentanol (3,3-DM2P)",
                "2,2-Dimethyl-3-butanol (2,2-DM3B)",
                "3,3-Dimethyl-1-butanol (3,3-DM1B)",
                "2,2,3-Trimethylbutan-2-ol (2,2,3-TMB2O)",
                "2,2,3-Trimethylpentan-2-ol (2,2,3-TMP2O)",
                "2,2,4-Trimethylpentan-2-ol (2,2,4-TMP2O)"
            ],
            "true_referents": [
                "1-(4-chlorophenyl)-4,4-dimethyl-3-(1H-1,2,4-triazol-1-ylmethyl)pentan-3-ol",
                "2,2,6,7-Tetramethylbicyclo[4.3.0]nona-1(9),4-diene-7,8-diol",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-3,7-octadiene-2,6-diol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2beta-methylhopan-22-ol",
                "3,7-Dimethyl-1,5(E),7-octatrien-3-ol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-methyl-3-heptanol",
                "4-Allyl-1,6-heptadiene-4-ol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "[1-(2???-methylpropoxy)-2-hydroxy-2-methylpropoxy]butane",
                "tert-butanol",
                "tert-butyl benzoate",
                "tert-butyl ester",
                "tertiary allylic alcohol"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "1-butanol (tert-butyl alcohol)",
            "2-butanol (sec-butyl alcohol)",
            "2-methyl-2-propanol (tert-pentyl alcohol)",
            "2-methyl-1-propanol (sec-pentyl alcohol)",
            "2-methyl-2-butanol (tert-hexyl alcohol)",
            "2-methyl-1-butanol (sec-hexyl alcohol)",
            "2-methyl-1-pentanol (sec-heptyl alcohol)",
            "2-methyl-2-pentanol (tert-heptyl alcohol)",
            "2-methyl-1-hexanol (sec-octyl alcohol)",
            "2-methyl-2-hexanol (tert-octyl alcohol)",
            "3-methyl-2-butanol (tert-amyl alcohol)",
            "3-methyl-1-butanol (sec-amyl alcohol)",
            "3-methyl-2-pentanol (tert-hexyl alcohol)",
            "3-methyl-1-pentanol (sec-hexyl alcohol)",
            "3-methyl-2-hexanol (tert-heptyl alcohol)",
            "3-methyl-1-hexanol (sec-heptyl alcohol)",
            "3-methyl-2-heptanol (tert-octyl alcohol)",
            "3-methyl-1-heptanol (sec-octyl alcohol)",
            "3-methyl-2-octanol (tert-nonyl alcohol)",
            "3-methyl-1-octanol (sec-nonyl alcohol)",
            "3-methyl-2-nonanol (tert-decyl alcohol)",
            "3-methyl-1-nonanol (sec-decyl alcohol)",
            "3-methyl-2-decanol (tert-undecyl alcohol)",
            "3-methyl-1-decanol (sec-undecyl alcohol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "1-butanol (tert-butyl alcohol)",
                "2-butanol (sec-butyl alcohol)",
                "2-methyl-2-propanol (tert-pentyl alcohol)",
                "2-methyl-1-propanol (sec-pentyl alcohol)",
                "2-methyl-2-butanol (tert-hexyl alcohol)",
                "2-methyl-1-butanol (sec-hexyl alcohol)",
                "2-methyl-1-pentanol (sec-heptyl alcohol)",
                "2-methyl-2-pentanol (tert-heptyl alcohol)",
                "2-methyl-1-hexanol (sec-octyl alcohol)",
                "2-methyl-2-hexanol (tert-octyl alcohol)",
                "3-methyl-2-butanol (tert-amyl alcohol)",
                "3-methyl-1-butanol (sec-amyl alcohol)",
                "3-methyl-2-pentanol (tert-hexyl alcohol)",
                "3-methyl-1-pentanol (sec-hexyl alcohol)",
                "3-methyl-2-hexanol (tert-heptyl alcohol)",
                "3-methyl-1-hexanol (sec-heptyl alcohol)",
                "3-methyl-2-heptanol (tert-octyl alcohol)",
                "3-methyl-1-heptanol (sec-octyl alcohol)",
                "3-methyl-2-octanol (tert-nonyl alcohol)",
                "3-methyl-1-octanol (sec-nonyl alcohol)",
                "3-methyl-2-nonanol (tert-decyl alcohol)",
                "3-methyl-1-nonanol (sec-decyl alcohol)",
                "3-methyl-2-decanol (tert-undecyl alcohol)",
                "3-methyl-1-decanol (sec-undecyl alcohol)"
            ],
            "true_referents": [
                "(S)-2-acetyl-2-hydroxybutanoic acid",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-methyl-3-heptanol",
                "5-Methyl-5-pentacosanol",
                "6-amino-2-methyl-2-heptanol",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "tert-butanol",
                "tert-butyl ester"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "tert-Butanol (tert-BuOH)",
            "tert-Pentanol",
            "tert-Hexanol",
            "2-Methyl-2-propanol",
            "2,2-Dimethyl-2-propanol",
            "2-Methyl-2-butanol",
            "2-Methyl-2-cyclohexanol",
            "2,2-Dimethylcyclohexanol",
            "Cholesterol",
            "Triphenylmethanol",
            "tert-Amyl alcohol",
            "tert-Ethyl alcohol",
            "tert-Nonyl alcohol",
            "3-Methyl-3-pentanol",
            "3,3-Dimethyl-1-butanol",
            "3,3-Diethyl-1-propanol",
            "2,2,4-Trimethyl-1-butanol",
            "2,2,6-Trimethyl-1-propanol",
            "2,2-Diethyl-2-propanol",
            "Laxogenin",
            "Sitosterol",
            "Neosporol",
            "Fluorotert-butanol",
            "tert-Octyl alcohol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "tert-butanol"
            ],
            "mismatches": [
                "tert-Pentanol",
                "tert-Hexanol",
                "2-Methyl-2-propanol",
                "2,2-Dimethyl-2-propanol",
                "2-Methyl-2-butanol",
                "2-Methyl-2-cyclohexanol",
                "2,2-Dimethylcyclohexanol",
                "Cholesterol",
                "Triphenylmethanol",
                "tert-Amyl alcohol",
                "tert-Ethyl alcohol",
                "tert-Nonyl alcohol",
                "3-Methyl-3-pentanol",
                "3,3-Dimethyl-1-butanol",
                "3,3-Diethyl-1-propanol",
                "2,2,4-Trimethyl-1-butanol",
                "2,2,6-Trimethyl-1-propanol",
                "2,2-Diethyl-2-propanol",
                "Laxogenin",
                "Sitosterol",
                "Neosporol",
                "Fluorotert-butanol",
                "tert-Octyl alcohol"
            ],
            "true_referents": [
                "(3S)-3-hydroxy-3-methylglutaryl-CoA",
                "(S)-mevalonolactone",
                "1,1'-dihydroxyneurosporene",
                "1-Methylcyclohexanol",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-[(dimethylamino)methyl]-1-(3-methoxyphenyl)cyclohexanol",
                "2-hydroxy-2-methylpropanal",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "3,7-dimethyl-3-octanol",
                "3-Methyl-1-penten-3-ol",
                "3-hydroxy-3-methylglutaryl-CoA",
                "3-methyl-3-heptanol",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "Mycosporine",
                "Presphaerol",
                "Punctaporonin L",
                "ethylestrenol",
                "fluorometholone",
                "fluorometholone acetate",
                "prostratin",
                "sesterfisherol",
                "tert-butanol",
                "tert-butyl benzoate",
                "tert-butyl ester",
                "tertiary allylic alcohol",
                "tridihexethyl",
                "tris(4-chlorophenyl)methanol"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "tert-Butanol (2-Methyl-2-propanol)",
            "2-Methyl-2-butanol",
            "3-Methyl-3-pentanol",
            "2-Phenyl-2-propanol",
            "Triphenylmethanol",
            "1-Adamantanol",
            "Linalool",
            "Terpinen-4-ol",
            "\u03b1-Terpineol",
            "Borneol",
            "Isoborneol",
            "Menthol",
            "Cholesterol",
            "Testosterone",
            "Cortisol",
            "Estradiol",
            "Progesterone",
            "Vitamin A (Retinol)",
            "Vitamin E (\u03b1-Tocopherol)",
            "Lanosterol",
            "Ergosterol",
            "Cycloartenol",
            "Ambroxol",
            "Propofol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "tert-Butanol (2-Methyl-2-propanol)",
                "Linalool",
                "Cortisol"
            ],
            "mismatches": [
                "2-Methyl-2-butanol",
                "3-Methyl-3-pentanol",
                "2-Phenyl-2-propanol",
                "Triphenylmethanol",
                "1-Adamantanol",
                "Terpinen-4-ol",
                "\u03b1-Terpineol",
                "Borneol",
                "Isoborneol",
                "Menthol",
                "Cholesterol",
                "Testosterone",
                "Estradiol",
                "Progesterone",
                "Vitamin A (Retinol)",
                "Vitamin E (\u03b1-Tocopherol)",
                "Lanosterol",
                "Ergosterol",
                "Cycloartenol",
                "Ambroxol",
                "Propofol"
            ],
            "true_referents": [
                "(+)-Cyclocitrinol",
                "(+)-cis-isohumulone",
                "(+)-isoafricanol",
                "(3S)-3-hydroxy-3-methylglutaryl-CoA",
                "(R)-linalool",
                "(S)-9,10-Cyclo-p-menth-1-en-4-ol",
                "(S)-linalool",
                "(S)-mevalonolactone",
                "1'-hydroxy-gamma-carotene",
                "17alpha-hydroxyprogesterone",
                "2,4-Dimethyl-4-nonanol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3-Amino-5,7-dimethyl-1-adamantanol",
                "3-Methyl-1-penten-3-ol",
                "3-hydroxy-3-methylglutaryl-CoA",
                "3-methyl-3-heptanol",
                "4-terpineol",
                "Cyclopericodiol",
                "anisotanol B",
                "beta-terpineol",
                "cafestol",
                "chloralodol",
                "chloroxanthin",
                "cortisol",
                "cortisol 21-acetate",
                "cyproterone",
                "ethylestrenol",
                "fucoxanthin",
                "haloperidol",
                "hydroxycitronellal",
                "linalool",
                "medroxyprogesterone",
                "megestrol",
                "naloxegol",
                "naloxone",
                "rebaudioside E",
                "sesterfisherol",
                "stanozolol",
                "tert-butanol",
                "tert-butyl ester",
                "tridihexethyl",
                "tris(4-chlorophenyl)methanol",
                "vepaol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Methylbutan-2-ol",
            "3-Methylpentan-3-ol",
            "2,3-Dimethylbutan-2-ol",
            "2,4-Dimethylpentan-3-ol",
            "3-Ethylpentan-3-ol",
            "2,2-Dimethylbutan-1-ol",
            "2,2,4-Trimethylpentan-3-ol",
            "3,3-Dimethylbutan-2-ol",
            "2,2,3-Trimethylbutan-1-ol",
            "3-Ethyl-3-methylpentan-2-ol",
            "2,2,3,3-Tetramethylbutan-1-ol",
            "2,2,3,4-Tetramethylpentan-3-ol",
            "3,3-Diethylpentan-2-ol",
            "2,2,4,4-Tetramethylhexan-3-ol",
            "3-Ethyl-2,2-dimethylbutan-1-ol",
            "3,3,4-Trimethylhexan-2-ol",
            "2,2,3,3,4-Pentamethylpentan-1-ol",
            "2,2,4,4,5-Pentamethylhexan-3-ol",
            "3,3-Diethyl-2,2-dimethylbutan-1-ol",
            "2,2,3,3,4,4-Hexamethylpentan-1-ol",
            "3-Ethyl-2,2,4,4-tetramethylpentan-3-ol",
            "2,2,3,3,4,4,5-Heptamethylhexan-3-ol",
            "3,3-Diethyl-2,2,4,4-tetramethylpentan-3-ol",
            "2,2,3,3,4,4,5,5-Octamethylhexan-3-ol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Methylbutan-2-ol"
            ],
            "mismatches": [
                "3-Methylpentan-3-ol",
                "2,3-Dimethylbutan-2-ol",
                "2,4-Dimethylpentan-3-ol",
                "3-Ethylpentan-3-ol",
                "2,2-Dimethylbutan-1-ol",
                "2,2,4-Trimethylpentan-3-ol",
                "3,3-Dimethylbutan-2-ol",
                "2,2,3-Trimethylbutan-1-ol",
                "3-Ethyl-3-methylpentan-2-ol",
                "2,2,3,3-Tetramethylbutan-1-ol",
                "2,2,3,4-Tetramethylpentan-3-ol",
                "3,3-Diethylpentan-2-ol",
                "2,2,4,4-Tetramethylhexan-3-ol",
                "3-Ethyl-2,2-dimethylbutan-1-ol",
                "3,3,4-Trimethylhexan-2-ol",
                "2,2,3,3,4-Pentamethylpentan-1-ol",
                "2,2,4,4,5-Pentamethylhexan-3-ol",
                "3,3-Diethyl-2,2-dimethylbutan-1-ol",
                "2,2,3,3,4,4-Hexamethylpentan-1-ol",
                "3-Ethyl-2,2,4,4-tetramethylpentan-3-ol",
                "2,2,3,3,4,4,5-Heptamethylhexan-3-ol",
                "3,3-Diethyl-2,2,4,4-tetramethylpentan-3-ol",
                "2,2,3,3,4,4,5,5-Octamethylhexan-3-ol"
            ],
            "true_referents": [
                "(2S,3R)-3-hydroxybutane-1,2,3-tricarboxylic acid",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-3,7-octadiene-2,6-diol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-[3-(2,2,3-trimethylcyclopent-3-enyl)cyclohex-3-enyl]propan-2-ol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-Dimethyl-1,5(E),7-octatrien-3-ol",
                "3,7-dimethyl-3-octanol",
                "3,7-dimethylocta-1,6-dien-3-yl acetate",
                "3-Methyl-1-penten-3-ol",
                "3-hydroxy-3-methylbut-1-ene",
                "3-methyl-3-heptanol",
                "4-Allyl-1,6-heptadiene-4-ol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "Bis[6-(3,4,7-trihydroxy-3, 7-dimethyloctenyl) ether",
                "tridihexethyl"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "2-Methyl-2-propanol (tert-butyl alcohol)",
            "2-Phenyl-2-propanol (cumyl alcohol)",
            "Triphenylmethanol (trityl alcohol)",
            "1,1-Dimethylcyclohexanol",
            "1,1-Dimethyl-1-phenylmethanol",
            "2,6,6-Trimethylbicyclo[3.1.1]heptan-3-ol (isoborneol)",
            "1,1-Dimethylcyclopentanol",
            "1,1-Dimethyl-1-(4-methylphenyl)methanol",
            "2,2-Dimethyl-3-butyn-2-ol",
            "2,2-Dimethylcyclopropanol",
            "2,2-Dimethyl-3-pentanol",
            "2,2-Dimethyl-3-hexanol",
            "2,2-Dimethyl-3-heptanol",
            "2,2-Dimethyl-3-octanol",
            "2,2-Dimethyl-3-nonanol",
            "2,2-Dimethyl-3-decanol",
            "2,2-Dimethyl-3-undecanol",
            "2,2-Dimethyl-3-dodecanol",
            "2,2-Dimethyl-3-tridecanol",
            "2,2-Dimethyl-3-tetradecanol",
            "2,2-Dimethyl-3-pentadecanol",
            "2,2-Dimethyl-3-hexadecanol",
            "2,2-Dimethyl-3-heptadecanol",
            "2,2-Dimethyl-3-octadecanol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-Methyl-2-propanol (tert-butyl alcohol)",
                "2-Phenyl-2-propanol (cumyl alcohol)"
            ],
            "mismatches": [
                "Triphenylmethanol (trityl alcohol)",
                "1,1-Dimethylcyclohexanol",
                "1,1-Dimethyl-1-phenylmethanol",
                "2,6,6-Trimethylbicyclo[3.1.1]heptan-3-ol (isoborneol)",
                "1,1-Dimethylcyclopentanol",
                "1,1-Dimethyl-1-(4-methylphenyl)methanol",
                "2,2-Dimethyl-3-butyn-2-ol",
                "2,2-Dimethylcyclopropanol",
                "2,2-Dimethyl-3-pentanol",
                "2,2-Dimethyl-3-hexanol",
                "2,2-Dimethyl-3-heptanol",
                "2,2-Dimethyl-3-octanol",
                "2,2-Dimethyl-3-nonanol",
                "2,2-Dimethyl-3-decanol",
                "2,2-Dimethyl-3-undecanol",
                "2,2-Dimethyl-3-dodecanol",
                "2,2-Dimethyl-3-tridecanol",
                "2,2-Dimethyl-3-tetradecanol",
                "2,2-Dimethyl-3-pentadecanol",
                "2,2-Dimethyl-3-hexadecanol",
                "2,2-Dimethyl-3-heptadecanol",
                "2,2-Dimethyl-3-octadecanol"
            ],
            "true_referents": [
                "(5E)-5-(4-chlorobenzylidene)-2,2-dimethyl-1-(1,2,4-triazol-1-ylmethyl)cyclopentanol",
                "1-Methylcyclohexanol",
                "2,2,6,7-Tetramethylbicyclo[4.3.0]nona-1(9),4-diene-7,8-diol",
                "2,4-Dimethyl-4-nonanol",
                "2,6-Dimethyl-3,7-octadiene-2,6-diol",
                "2,6-Dimethyl-7-octene-2,6-diol",
                "2-(4-methoxyphenyl)propan-2-ol",
                "2-[(dimethylamino)methyl]-1-(3-methoxyphenyl)cyclohexanol",
                "2-[3-(2,2,3-trimethylcyclopent-3-enyl)cyclohex-3-enyl]propan-2-ol",
                "2-[4-(2,2,3-trimethylcyclopent-3-enyl)cyclohex-3-enyl]propan-2-ol",
                "2-methyl-4-phenyl-2-butanol",
                "2-methylbutan-2-ol",
                "2-methylpropane-1,2-diol",
                "2-phenylpropan-2-ol",
                "3,7-dimethyl-3-octanol",
                "3,7-dimethylocta-1,6-dien-3-yl acetate",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3-methyl-3-heptanol",
                "5-Methyl-5-pentacosanol",
                "6-amino-2-methyl-2-heptanol",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "tert-butanol",
                "tris(4-chlorophenyl)methanol"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "Cholesterol (CHOL)",
            "Ergosterol (ERGO)",
            "Lanosterol (LANO)",
            "Squalene (SQUA)",
            "Campesterol (CAMP)",
            "Stigmasterol (STIG)",
            "\u03b2-Sitosterol (SITO)",
            "Desmosterol (DESM)",
            "Lathosterol (LATH)",
            "7-Dehydrocholesterol (7DHC)",
            "Dihydrolanosterol (DHLA)",
            "Cycloartenol (CYCL)",
            "Obtusifoliol (OBTU)",
            "Parkeol (PARK)",
            "Butyrospermol (BUTY)",
            "Tirucallol (TIRU)",
            "Euphol (EUPH)",
            "Germanicol (GERM)",
            "Dammarenediol-II (DAMM)",
            "Lupeol (LUPE)",
            "Taraxasterol (TARA)",
            "Bauerenol (BAUA)",
            "Multiflorenol (MULT)",
            "Betulin (BETU)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dammarenediol-II"
            ],
            "mismatches": [
                "Cholesterol (CHOL)",
                "Ergosterol (ERGO)",
                "Lanosterol (LANO)",
                "Squalene (SQUA)",
                "Campesterol (CAMP)",
                "Stigmasterol (STIG)",
                "\u03b2-Sitosterol (SITO)",
                "Desmosterol (DESM)",
                "Lathosterol (LATH)",
                "7-Dehydrocholesterol (7DHC)",
                "Dihydrolanosterol (DHLA)",
                "Cycloartenol (CYCL)",
                "Obtusifoliol (OBTU)",
                "Parkeol (PARK)",
                "Butyrospermol (BUTY)",
                "Tirucallol (TIRU)",
                "Euphol (EUPH)",
                "Germanicol (GERM)",
                "Lupeol (LUPE)",
                "Taraxasterol (TARA)",
                "Bauerenol (BAUA)",
                "Multiflorenol (MULT)",
                "Betulin (BETU)"
            ],
            "true_referents": [
                "(+)-Cyclocitrinol",
                "(+)-kolavelool",
                "(+)-pisatin",
                "(-)-Tau-muurolol",
                "(22E,24R)-3beta,5alpha-dihydroxyergosta-7,22-dien-6-one",
                "(3S)-3-hydroxy-3-methylglutaryl-CoA",
                "(6E)-nerolidol",
                "(R)-cyclopentolate",
                "(R)-hexaconazole",
                "(R)-linalool",
                "(R)-mevalonolactone",
                "(R)-nephthenol",
                "(R)-triarimol",
                "(S)-linalool",
                "(S)-mevalonolactone",
                "1(10),5-germacradien-4-ol",
                "17,21-dihydroxy-5beta-pregnane-3,11,20-trione",
                "2-methyl-4-phenyl-2-butanol",
                "20(R),22(xi),24(S)-dammar-25(26)-ene-3beta,6alpha,12beta,20,22,24-hexanol",
                "21-dehydrocortisol",
                "3-hydroxy-3-methylglutaryl-CoA",
                "5(1->10)-Abeo-1,12-patchoulanediol",
                "Alpha-acorenol",
                "Drim-68(12)-dien-9alpha,11-diol",
                "Palmaenone B",
                "Scopariol",
                "Sterostrein U",
                "anisotanol B",
                "betaenone A",
                "bullatantriol",
                "cafestol",
                "camptothecin",
                "cedrol",
                "chlorobutanol",
                "colleterpenol",
                "cyclooctat-9-en-7-ol",
                "dammarenediol-II",
                "epi-cedrol",
                "ethylestrenol",
                "germacra-1(10),5-dien-4alpha-ol",
                "germacra-1(10),5-dien-4beta-ol",
                "lupan-3beta,20-diol",
                "megestrol",
                "myrcenol",
                "nezukol",
                "ophiobolin F",
                "sesterfisherol",
                "stanozolol",
                "t-butyl hexadecanoate",
                "tert-butanol",
                "vitexilactone"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": "[\n\"1,3-Butanediol (1,3-BD)\" ,\n\"1-Propanol\" ,\n\"2-Acetyl-1-propanol\" ,\n\"2-Butanone\" ,\n\"2-Chloro-1-propanol\" ,\n\"2-Ethoxyethanol\" ,\n\"2-Methyl-1-butanol\" ,\n\"2-Methyl-1-propanol\" ,\n\"2-Methyl-2-butanol\" ,\n\"2-Methyl-2-pentanol\" ,\n\"2-Methyl-2-propanol\" ,\n\"3,7-Dimethyl-1,3,7-trioxacyclooctane\" ,\n\"3-Buten-2-ol\" ,\n\"3-Methyl-2-butanol\" ,\n\"4-Methyl-2-pentanol\" ,\n\"Aconitine\" ,\n\"Allyl alcohol\" ,\n\"Benzyl alcohol\" ,\n\"Catechol\" ,\n\"Citronellol\" ,\n\"Ethyl lactate\" ,\n\"Geraniol\" ,\n\"Isobutanol\" ,\n\"Isopulegol\" ,\n\"Menthol\" ,\n\"Octan-2-ol\" ,\n\"Phenylethanol\" ,\n\"Terpinen-4-ol\" ,\n\"Thymol\"",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": [
            "Cholesterol (Chol)",
            "1-Dodecanol",
            "Isoprenalin (INN)",
            "Adonitol (Adon)",
            "Vitamin D2 (Ergocalciferol)",
            "Vitamin D3 (Cholecalciferol)",
            "Fluoxetine (Prozac)",
            "Cholesterol sulfate",
            "1-Hexadecanol",
            "1-Tetradecanol",
            "1-Octadecanol",
            "1-Eicosanol",
            "1-Docosanol",
            "Tetracosanol",
            "Hexacosanol",
            "Octacosanol",
            "Triphenylmethanol",
            "2-Methyl-4-chlorophenoxy-tert-amyl alcohol",
            "2-(4-Morpholinyl)-4-chlorophenoxy-tert-amyl alcohol",
            "2-(4-Methylpiperazinyl)-4-chlorophenoxy-tert-amyl alcohol",
            "2-(Diethylamino)-4-chlorophenoxy-tert-amyl alcohol",
            "2-(Pyrrolidinyl)-4-chlorophenoxy-tert-amyl alcohol",
            "2-(Piperidinyl)-4-chlorophenoxy-tert-amyl alcohol",
            "2-(Hexamethyleneimino)-4-chlorophenoxy-tert-amyl alcohol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cholesterol (Chol)",
                "1-Dodecanol",
                "Isoprenalin (INN)",
                "Adonitol (Adon)",
                "Vitamin D2 (Ergocalciferol)",
                "Vitamin D3 (Cholecalciferol)",
                "Fluoxetine (Prozac)",
                "Cholesterol sulfate",
                "1-Hexadecanol",
                "1-Tetradecanol",
                "1-Octadecanol",
                "1-Eicosanol",
                "1-Docosanol",
                "Tetracosanol",
                "Hexacosanol",
                "Octacosanol",
                "Triphenylmethanol",
                "2-Methyl-4-chlorophenoxy-tert-amyl alcohol",
                "2-(4-Morpholinyl)-4-chlorophenoxy-tert-amyl alcohol",
                "2-(4-Methylpiperazinyl)-4-chlorophenoxy-tert-amyl alcohol",
                "2-(Diethylamino)-4-chlorophenoxy-tert-amyl alcohol",
                "2-(Pyrrolidinyl)-4-chlorophenoxy-tert-amyl alcohol",
                "2-(Piperidinyl)-4-chlorophenoxy-tert-amyl alcohol",
                "2-(Hexamethyleneimino)-4-chlorophenoxy-tert-amyl alcohol"
            ],
            "true_referents": [
                "(-)-(12E,2S,3S,4R,5R,6R,9S,11S,15R)-3-acetoxy-5,6-epoxylathyr-12-en-15-ol-14-one",
                "(-)-homalomenol D",
                "(2,4-dichlorophenyl)(phenyl)pyrimidin-5-ylmethanol",
                "(2-chlorophenyl)(4-chlorophenyl)pyrimidin-5-ylmethanol",
                "(2R,3R,4S,5S)-6-[(1E)-1-chloro-3-ethylpent-1-en-4-yn-3-yl]-3,4,5-trihydroxyoxane-2-carboxylic acid",
                "(3S)-3-hydroxy-3-methylglutaryl-CoA",
                "(5E)-5-(4-chlorobenzylidene)-2,2-dimethyl-1-(1,2,4-triazol-1-ylmethyl)cyclopentanol",
                "(E)-5-chloro-3-ethynylpent-4-ene-2,3-diol",
                "(S)-linalyl acetate",
                "(S)-mevalonolactone",
                "1-(4-chlorophenyl)-4,4-dimethyl-3-(1H-1,2,4-triazol-1-ylmethyl)pentan-3-ol",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "2,6-Dimethyl-3,7-octadiene-2,6-diol",
                "2-(2,4-dichlorophenyl)-1-(1H-1,2,4-triazol-1-yl)hexan-2-ol",
                "2-methylpropane-1,2-diol",
                "23(S),25-dihydroxy-24-oxovitamin D3",
                "3,7-dimethyl-3-octanol",
                "3-hydroxy-3-methylglutaryl-CoA",
                "3-hydroxybutane-1,2,3-tricarboxylic acid",
                "3beta-hydroxy-beta-acorenol",
                "4-Allyl-1,6-heptadiene-4-ol",
                "5(1->10)-Abeo-1,12-patchoulanediol",
                "5-Methyl-5-pentacosanol",
                "6alpha-acetoxyisoinuviscolide",
                "8,8-Diethoxy-2,6-dimethyl-2-octanol",
                "8,8-Dimethoxy-2,6-dimethyl-2-octanol",
                "Caryolane-1,7alpha-diol",
                "anisotanol B",
                "cafestol",
                "cortisol 21-sulfate",
                "cyclooctat-9-en-5,7-diol",
                "dihydroisopentenyldehydrorhodopin",
                "ethylestrenol",
                "haloperidol",
                "isopentenyldehydrorhodopin",
                "paxilline",
                "sesterfisherol",
                "t-butyl hexadecanoate",
                "tert-butanol",
                "tridihexethyl",
                "tris(4-chlorophenyl)methanol",
                "venlafaxine"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "tertiary alcohol",
        "domain": "chemistry",
        "response": "[\n  {\n    \"Canonical Name\": \"2-Butanol\" (2-BuOH)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"1-Butanol\" (1-BuOH)\n  },\n  {\n    \"Canonical Name\": \"2-Methyl-2-propanol\" (2-MP)\n  },\n  {\n    \"Canonical Name\": \"1-Phenylethanol\" (1-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Methyl-1-propanol\" (2-MP)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethyl alcohol\" (2-PEA)\n  },\n  {\n    \"Canonical Name\": \"2-Ethyl-1-hexanol\" (2-EH)\n  },\n  {\n    \"Canonical Name\": \"1-Methyl-1-propanol\" (1-MP)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethyl alcohol\" (2-PEA)\n  },\n  {\n    \"Canonical Name\": \"2-Methyl-1-butanol\" (2-MB)\n  },\n  {\n    \"Canonical Name\": \"2-Methyl-2-butanol\" (2-MB)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethyl alcohol\" (2-PEA)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethyl alcohol\" (2-PEA)\n  },\n  {\n    \"Canonical Name\": \"2-Methyl-1-propanol\" (2-MP)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Methyl-1-propanol\" (2-MP)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethyl alcohol\" (2-PEA)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  },\n  {\n    \"Canonical Name\": \"2-Phenylethanol\" (2-PE)\n  }\n]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]