[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Phenazine (Phe)",
            "Phenoxazine",
            "Phenothiazine",
            "Phthalazine",
            "Quinone",
            "Naphthoquinone",
            "Benzoquinone",
            "Anthraquinone",
            "Porphyrin",
            "Corrole",
            "Porphine",
            "Benzoporphyrin",
            "Corazine",
            "Perylenequinone",
            "Naphthacenequinone",
            "Acridine",
            "Quinizarin",
            "Xanthone",
            "Anthracenequinone",
            "Purpurin",
            "Alizarin",
            "Rubiadin",
            "Lawsone",
            "Benzoquinone diimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Naphthoquinone",
                "Benzoquinone",
                "Anthraquinone",
                "Quinizarin",
                "Purpurin",
                "Alizarin",
                "Rubiadin",
                "Lawsone"
            ],
            "mismatches": [
                "Phenazine (Phe)",
                "Phenoxazine",
                "Phenothiazine",
                "Phthalazine",
                "Quinone",
                "Porphyrin",
                "Corrole",
                "Porphine",
                "Benzoporphyrin",
                "Corazine",
                "Perylenequinone",
                "Naphthacenequinone",
                "Acridine",
                "Xanthone",
                "Anthracenequinone",
                "Benzoquinone diimine"
            ],
            "true_referents": [
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-benzoquinone",
                "1,4-benzoquinone imine",
                "2,3-dimethoxynaphthalene-1,4-dione",
                "2-(4-Methyl-3-pentenyl)anthraquinone",
                "4,5-dihydroxy-1-methyl-anthraquinone",
                "8-chloro-10H-phenothiazine-1,4-dione",
                "9,10-anthraquinone",
                "Acrimine B",
                "Alterporriol N",
                "Alterporriol P",
                "Cytosporanthraxanthone",
                "Diospyrin",
                "Nenesophanol",
                "Phaeosphenone",
                "Porfiromycine",
                "Purpurin 1-methyl ether",
                "Purpurogemutantidin",
                "Radinaphthalenone",
                "Rubellin A",
                "Rubroskyrin",
                "Sorrentanone",
                "Versicol",
                "alizarin",
                "alizarin blue",
                "alizarin complexone",
                "anthraquinone",
                "benzoquinone",
                "benzoquinones",
                "chrysazin",
                "chrysophanol",
                "dysidine",
                "lawsone",
                "m-quinone",
                "naphthazarin",
                "naphthoquinone",
                "p-quinones",
                "purpurin",
                "quinizarin",
                "rubiadin",
                "triaziquone",
                "ubiquinone-1"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Phenanthraquinone (C14H8O2)",
            "Anthraquinone (C14H8O2)",
            "Chrysazin (C12H8N2O2)",
            "Catechol 1,4-dione (C6H4O3)",
            "1,2-Naphthoquinone (C10H6O2)",
            "Benzanthrone (C13H8O2)",
            "1,8-Naphthalenedione (C10H6O2)",
            "Alizarin (C14H8O4)",
            "Purpurin (C14H8O4)",
            "Chrysophanic acid (C14H8O4)",
            "Rubia tinctorum (C14H8O4)",
            "Phloroglucinol trione (C6H3O3)",
            "9,10-Anthraquinone (C14H8O2)",
            "Emodin (C15H10O5)",
            "Rhein (C15H8O5)",
            "Aloe emodin (C15H10O5)",
            "Chrysophanol (C15H10O4)",
            "Physcion (C15H10O5)",
            "Morin (C15H10O6)",
            "Quercetin-3,3',4',5,7-pentakis (C15H10O7)",
            "Euxanthone (C14H8O4)",
            "Ruberythric acid (C14H8O6)",
            "Luteolin-7,4'-dione (C15H10O5)",
            "Fisetin-3,3',4',7-tetraone (C15H10O6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Anthraquinone (C14H8O2)",
                "1,2-Naphthoquinone (C10H6O2)",
                "Alizarin (C14H8O4)",
                "Purpurin (C14H8O4)",
                "9,10-Anthraquinone (C14H8O2)",
                "Emodin (C15H10O5)",
                "Rhein (C15H8O5)",
                "Aloe emodin (C15H10O5)",
                "Chrysophanol (C15H10O4)",
                "Physcion (C15H10O5)"
            ],
            "mismatches": [
                "Phenanthraquinone (C14H8O2)",
                "Chrysazin (C12H8N2O2)",
                "Catechol 1,4-dione (C6H4O3)",
                "Benzanthrone (C13H8O2)",
                "1,8-Naphthalenedione (C10H6O2)",
                "Chrysophanic acid (C14H8O4)",
                "Rubia tinctorum (C14H8O4)",
                "Phloroglucinol trione (C6H3O3)",
                "Morin (C15H10O6)",
                "Quercetin-3,3',4',5,7-pentakis (C15H10O7)",
                "Euxanthone (C14H8O4)",
                "Ruberythric acid (C14H8O6)",
                "Luteolin-7,4'-dione (C15H10O5)",
                "Fisetin-3,3',4',7-tetraone (C15H10O6)"
            ],
            "true_referents": [
                "(1'S,5'R)-5'-hydroxyaverantin",
                "(1'S,5'S)-5'-hydroxyaverantin",
                "(1S,3S)-austrocortirubin 8-O-beta-D-gentiobioside",
                "(R)-3,4-Dimethoxydalbergione",
                "(R)-4'-Hydroxy-3,4-dimethoxydalbergione",
                "(S)-2,5-dihydroxy-2-methyl-1,2,3,4-tetrahydroanthracene-9,10-dione",
                "1,2,5,6-tetrahydroxyanthraquinone",
                "1,2-naphthoquinone",
                "1,3,6,8-Tetrahydroxy-2-methoxyethylanthr",
                "1,3,6,8-tetrahydroxyanthraquinone",
                "1,4,5,8-tetrahydroxyanthraquinone",
                "1-O-methyl-6-O-(alpha-D-ribofuranosyl)emodin",
                "2,6,7-trihydroxy-3-methylnaphthalene-1,4-dione",
                "2-Polyprenyl-3-methyl-5-hydroxy-6-methoxy-1,4-benzoquinone",
                "2-ethyl-1,8-dihydroxy-3-methyl-anthraquinone",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-hydroxychrysophanol",
                "3,4,3',4'-Bisdehydroxanthomegnin",
                "4,6,11-trihydroxy-9-propyltetracene-5,12-dione",
                "4-hydroxy-3-methylnaphthalene-1,2-dione",
                "5,8-dihydroxy-2,7-dimethoxy-1,4-naphthoquinone",
                "7C-Aglycone",
                "8-Hydroxy-1-methoxy-3-methylanthraquinone",
                "8-O-methyltetrangulol",
                "8-chloro-10H-phenothiazine-1,4-dione",
                "9,10-anthraquinone",
                "A-80915G-8-acid",
                "Alizarin 2-methyl ether",
                "Aloe emodin",
                "Aloe emodin w-acetate",
                "Anhydroflavomannin-9,10-quinone 6,6',8'-tri-O-methyl ether",
                "Emodin 8-beta-D-glucoside",
                "Nidurufin-2'-(4-O-methyl)-beta-D-glucopyranose",
                "Physcion 8-glucoside",
                "Physcionin",
                "Purpurin 1-methyl ether",
                "Rhein",
                "Rubellin A",
                "alizarin",
                "alizarin complexone",
                "anthraquinone",
                "chrysazin",
                "chrysophanol",
                "chrysophanol 8-O-beta-D-glucoside",
                "dibenzo[1,4]dioxine-2,3-dione",
                "emodin",
                "flavopurpurin",
                "physcion",
                "purpurin"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Naphthoquinone (NQ)",
            "Benzoquinone (BQ)",
            "Anthraquinone (AQ)",
            "Phenanthrenequinone (PHEQ)",
            "1,4-Naphthoquinone",
            "1,2-Naphthoquinone",
            "1,4-Benzoquinone",
            "1,2-Benzoquinone",
            "1,4-Anthraquinone",
            "2,6-Anthraquinone",
            "9,10-Phenanthrenequinone",
            "1,4-Phenanthrenequinone",
            "2,3-Phenanthrenequinone",
            "2,7-Phenanthrenequinone",
            "1,2-Phenanthrenequinone",
            "1,4-Phenanthrenequinone",
            "1,4-Dibenzopyrenequinone",
            "1,4-Dibenzanthracenequinone",
            "1,4-Dibenzofuranquinone",
            "1,4-Dibenzothiophenequinone",
            "1,4-Dibenzoxepinequinone",
            "1,4-Dibenzocycloheptenequinone",
            "1,4-Dibenzocyclooctenequinone",
            "1,4-Dibenzocyclononenequinone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Naphthoquinone (NQ)",
                "Benzoquinone (BQ)",
                "Anthraquinone (AQ)",
                "1,4-Naphthoquinone",
                "1,2-Naphthoquinone",
                "1,4-Benzoquinone",
                "1,2-Benzoquinone"
            ],
            "mismatches": [
                "Phenanthrenequinone (PHEQ)",
                "1,4-Anthraquinone",
                "2,6-Anthraquinone",
                "9,10-Phenanthrenequinone",
                "1,4-Phenanthrenequinone",
                "2,3-Phenanthrenequinone",
                "2,7-Phenanthrenequinone",
                "1,2-Phenanthrenequinone",
                "1,4-Dibenzopyrenequinone",
                "1,4-Dibenzanthracenequinone",
                "1,4-Dibenzofuranquinone",
                "1,4-Dibenzothiophenequinone",
                "1,4-Dibenzoxepinequinone",
                "1,4-Dibenzocycloheptenequinone",
                "1,4-Dibenzocyclooctenequinone",
                "1,4-Dibenzocyclononenequinone"
            ],
            "true_referents": [
                "1,2,5,6-tetrahydroxyanthraquinone",
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,3,6,8-tetrahydroxyanthraquinone",
                "1,3-Dimethoxyanthraquinone",
                "1,4,5,8-tetrahydroxyanthraquinone",
                "1,4,5-trihydroxyanthraquinone",
                "1,4,6-trihydroxyanthraquinone",
                "1,4-benzoquinone",
                "1,4-naphthoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "2,6-Dimethoxybenzoquinone",
                "2,6-dichlorobenzoquinone",
                "2-(hydroxymethyl)anthraquinone",
                "4,5-dihydroxy-1-methyl-anthraquinone",
                "9,10-anthraquinone",
                "Fluoquinone",
                "Fumaquinone",
                "anthraquinone",
                "benzoquinone",
                "naphthoquinone"
            ],
            "TP": 7,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Naphthoquinone (NQ)",
            "1,4-Benzoquinone (BQ)",
            "2,3-Dichloro-1,4-benzoquinone (DCBQ)",
            "Anthraquinone (AQ)",
            "Tetracene-5,11-quinone (TCQ)",
            "Phenanthraquinone (PQ)",
            "Chrysazin (CHR)",
            "Lapachol (LAP)",
            "Plumbagin (PLU)",
            "Lawsone (LWS)",
            "Juglone (JUG)",
            "Alizarin (ALZ)",
            "Anthracyclinone A (ACA)",
            "Hypericin (HYP)",
            "Emodin (EMD)",
            "Aloe-emodin (AEM)",
            "Rhein (RHE)",
            "Frangula emodin (FRE)",
            "Naphthazarin (NZR)",
            "5,8-Dihydroxy-1,4-naphthoquinone (DHNQ)",
            "Menadione (VK2)",
            "Phthiocol (PTC)",
            "2,5-Dihydroxy-1,4-benzoquinone (DHBQ)",
            "2,3,5,6-Tetramethyl-1,4-benzoquinone (TMBQ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,4-Benzoquinone",
                "Anthraquinone",
                "Chrysazin",
                "Lapachol",
                "Plumbagin",
                "Lawsone",
                "Juglone",
                "Alizarin",
                "Emodin",
                "Aloe-emodin",
                "Rhein",
                "Naphthazarin",
                "Menadione",
                "Phthiocol"
            ],
            "mismatches": [
                "Naphthoquinone (NQ)",
                "2,3-Dichloro-1,4-benzoquinone (DCBQ)",
                "Tetracene-5,11-quinone (TCQ)",
                "Phenanthraquinone (PQ)",
                "Anthracyclinone A (ACA)",
                "Hypericin (HYP)",
                "Frangula emodin (FRE)",
                "5,8-Dihydroxy-1,4-naphthoquinone (DHNQ)",
                "2,5-Dihydroxy-1,4-benzoquinone (DHBQ)",
                "2,3,5,6-Tetramethyl-1,4-benzoquinone (TMBQ)"
            ],
            "true_referents": [
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-benzoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "2,3-dihydroxy-5-methyl-1,4-benzoquinone",
                "2,5-di-tert-Butyl-1,4-benzoquinone",
                "2,6-Di-tert-butylbenzoquinone",
                "2,6-dichlorobenzoquinone",
                "2,8-dihydroxy-1,4-naphthoquinone",
                "9,10-anthraquinone",
                "Adriamycinone",
                "Aloe emodin",
                "Aloe emodin w-acetate",
                "Chryso-obtusin",
                "Chrysophanein",
                "Emodin 8-beta-D-glucoside",
                "Emodin 8-glucoside",
                "Frangulin A",
                "Frangulin B",
                "Methylpedicinin",
                "Paramagnetoquinone A",
                "Phaeosphenone",
                "Phthiocol",
                "Rhein",
                "Rheochrysin",
                "Rhodoislandin B",
                "alizarin",
                "alizarin blue",
                "alizarin complexone",
                "anthraquinone",
                "chrysazin",
                "daunorubicin",
                "dithianon",
                "emodin",
                "juglone",
                "lapachol",
                "lawsone",
                "menadione",
                "naphthazarin",
                "naphthoquinone",
                "pentahydroxyanthraquinone",
                "plumbagin",
                "tetracene-1,4-dione",
                "tetracene-5,12-dione",
                "tetracenequinone",
                "tetrachloro-1,4-benzoquinone"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "1,4-Benzoquinone (BQ)",
            "1,2-Benzoquinone",
            "1,4-Naphthoquinone",
            "1,2-Naphthoquinone",
            "Anthraquinone",
            "Phenanthrenequinone",
            "1,4-Anthraquinone",
            "1,2-Anthraquinone",
            "9,10-Phenanthrenequinone",
            "1,4-Phenanthrenequinone",
            "1,4-Pyrenequinone",
            "1,2-Pyrenequinone",
            "9,10-Anthraquinone",
            "9,10-Diphenylanthraquinone",
            "1,4-Anthraquinone",
            "1,2-Anthraquinone",
            "1,4-Chrysenequinone",
            "1,2-Chrysenequinone",
            "1,4-Tetracenequinone",
            "1,2-Tetracenequinone",
            "9,10-Tetracenequinone",
            "1,4-Perylenequinone",
            "1,2-Perylenequinone",
            "9,10-Perylenequinone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,4-Benzoquinone (BQ)",
                "1,2-Benzoquinone",
                "1,4-Naphthoquinone",
                "1,2-Naphthoquinone",
                "Anthraquinone",
                "9,10-Anthraquinone",
                "1,4-Tetracenequinone"
            ],
            "mismatches": [
                "Phenanthrenequinone",
                "1,4-Anthraquinone",
                "1,2-Anthraquinone",
                "9,10-Phenanthrenequinone",
                "1,4-Phenanthrenequinone",
                "1,4-Pyrenequinone",
                "1,2-Pyrenequinone",
                "9,10-Diphenylanthraquinone",
                "1,4-Chrysenequinone",
                "1,2-Chrysenequinone",
                "1,2-Tetracenequinone",
                "9,10-Tetracenequinone",
                "1,4-Perylenequinone",
                "1,2-Perylenequinone",
                "9,10-Perylenequinone"
            ],
            "true_referents": [
                "1,2,5,6-tetrahydroxyanthraquinone",
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,3,6,8-tetrahydroxyanthraquinone",
                "1,4-benzoquinone",
                "1,4-naphthoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "1-hydroxyanthraquinone",
                "4,5-dihydroxy-1-methyl-anthraquinone",
                "9,10-anthraquinone",
                "anthraquinone",
                "benzo[a]pyrene-7,8-dione",
                "naphthoquinone",
                "plastoquinone-9",
                "tetracenequinone",
                "tetracenequinones"
            ],
            "TP": 7,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "1,3-Cyclohexanedione (1,3-CHD)",
            "1,4-Cyclohexanedione (1,4-CHD)",
            "1,2-Cyclohexanedione (1,2-CHD)",
            "1,3-Cyclopentanedione (1,3-CPD)",
            "1,4-Cyclopentanedione (1,4-CPD)",
            "1,2-Cyclopentanedione (1,2-CPD)",
            "Naphthalene-1,4-dione (Naphth-1,4-D)",
            "Naphthalene-1,2-dione (Naphth-1,2-D)",
            "Anthraquinone (AQ)",
            "Phenanthrene-9,10-dione (Phen-9,10-D)",
            "1,2-Benzenedione (1,2-BD)",
            "1,4-Benzenedione (1,4-BD)",
            "2,3-Dihydroxy-1,4-naphthoquinone (DHNQ)",
            "2-Hydroxy-1,4-naphthoquinone (2-Hydroxy-NQ)",
            "1,3-Benzenedione (1,3-BD)",
            "1,2,3,4-Tetrahydroquinone (THQ)",
            "4-Hydroxy-1,2-benzenedione (4-Hydroxy-BD)",
            "2-Methyl-1,4-benzenedione (2-Methyl-BD)",
            "1,2-Naphthoquinone (1,2-NQ)",
            "1,4-Naphthoquinone (1,4-NQ)",
            "4,5-Dimethyl-1,2-benzenedione (4,5-Dimethyl-BD)",
            "1,3,5-Cyclohexanedione (1,3,5-CHD)",
            "1,2,4-Cyclohexanedione (1,2,4-CHD)",
            "3,4-Dihydroxy-1,2-benzenedione (3,4-Dihydroxy-BD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Anthraquinone (AQ)",
                "1,2-Naphthoquinone (1,2-NQ)",
                "1,4-Naphthoquinone (1,4-NQ)"
            ],
            "mismatches": [
                "1,3-Cyclohexanedione (1,3-CHD)",
                "1,4-Cyclohexanedione (1,4-CHD)",
                "1,2-Cyclohexanedione (1,2-CHD)",
                "1,3-Cyclopentanedione (1,3-CPD)",
                "1,4-Cyclopentanedione (1,4-CPD)",
                "1,2-Cyclopentanedione (1,2-CPD)",
                "Naphthalene-1,4-dione (Naphth-1,4-D)",
                "Naphthalene-1,2-dione (Naphth-1,2-D)",
                "Phenanthrene-9,10-dione (Phen-9,10-D)",
                "1,2-Benzenedione (1,2-BD)",
                "1,4-Benzenedione (1,4-BD)",
                "2,3-Dihydroxy-1,4-naphthoquinone (DHNQ)",
                "2-Hydroxy-1,4-naphthoquinone (2-Hydroxy-NQ)",
                "1,3-Benzenedione (1,3-BD)",
                "1,2,3,4-Tetrahydroquinone (THQ)",
                "4-Hydroxy-1,2-benzenedione (4-Hydroxy-BD)",
                "2-Methyl-1,4-benzenedione (2-Methyl-BD)",
                "4,5-Dimethyl-1,2-benzenedione (4,5-Dimethyl-BD)",
                "1,3,5-Cyclohexanedione (1,3,5-CHD)",
                "1,2,4-Cyclohexanedione (1,2,4-CHD)",
                "3,4-Dihydroxy-1,2-benzenedione (3,4-Dihydroxy-BD)"
            ],
            "true_referents": [
                "(R)-3,4-Dimethoxydalbergione",
                "1,2-naphthoquinone",
                "1,3-Dimethoxyanthraquinone",
                "1,4-naphthoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "2,3-dimethoxynaphthalene-1,4-dione",
                "2,5-Dihydroxy-3-pentadecyl-1,4-benzoquinone",
                "2,8-dihydroxy-1,4-naphthoquinone",
                "2-(3-methylbut-2-enyl)-5-(2-methylbut-3-en-2-yl)cyclohexa-2,5-diene-1,4-dione",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "4-methoxy-3,6-diphenylcyclohexa-3,5-diene-1,2-dione",
                "9,10-anthraquinone",
                "S-3'-hydroxy-4,4'-dimethoxydalbergione",
                "anthraquinone",
                "benzo[a]pyrene-7,8-dione",
                "dibenzo[1,4]dioxine-2,3-dione",
                "hydroxy-1,2-naphthoquinone",
                "naphthoquinone",
                "tetracene-1,4-dione",
                "tetracene-5,12-dione",
                "tetrahydroxy-1,4-benzoquinone"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "1,4-Benzoquinone (BQ)",
            "1,2-Benzoquinone (o-BQ)",
            "1,4-Naphthoquinone (NQ)",
            "1,2-Naphthoquinone (o-NQ)",
            "1,4-Anthraquinone (AQ)",
            "1,2-Anthraquinone (o-AQ)",
            "1,4-Phenanthrenequinone (PQ)",
            "1,2-Phenanthrenequinone (o-PQ)",
            "1,4-Anthrachinon (AnQ)",
            "1,2-Anthrachinon (o-AnQ)",
            "1,4-Phenanthraquinone (PhQ)",
            "1,2-Phenanthraquinone (o-PhQ)",
            "1,4-Pyrenequinone (PyQ)",
            "1,2-Pyrenequinone (o-PyQ)",
            "1,4-Chrysenequinone (ChQ)",
            "1,2-Chrysenequinone (o-ChQ)",
            "1,4-Perylenequinone (PeQ)",
            "1,2-Perylenequinone (o-PeQ)",
            "1,4-Coronenequinone (CoQ)",
            "1,2-Coronenequinone (o-CoQ)",
            "1,4-Picenequinone (PiQ)",
            "1,2-Picenequinone (o-PiQ)",
            "1,4-Terrylenequinone (TeQ)",
            "1,2-Terrylenequinone (o-TeQ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,4-Benzoquinone",
                "1,2-Benzoquinone",
                "1,4-Naphthoquinone",
                "1,2-Naphthoquinone"
            ],
            "mismatches": [
                "1,4-Anthraquinone (AQ)",
                "1,2-Anthraquinone (o-AQ)",
                "1,4-Phenanthrenequinone (PQ)",
                "1,2-Phenanthrenequinone (o-PQ)",
                "1,4-Anthrachinon (AnQ)",
                "1,2-Anthrachinon (o-AnQ)",
                "1,4-Phenanthraquinone (PhQ)",
                "1,2-Phenanthraquinone (o-PhQ)",
                "1,4-Pyrenequinone (PyQ)",
                "1,2-Pyrenequinone (o-PyQ)",
                "1,4-Chrysenequinone (ChQ)",
                "1,2-Chrysenequinone (o-ChQ)",
                "1,4-Perylenequinone (PeQ)",
                "1,2-Perylenequinone (o-PeQ)",
                "1,4-Coronenequinone (CoQ)",
                "1,2-Coronenequinone (o-CoQ)",
                "1,4-Picenequinone (PiQ)",
                "1,2-Picenequinone (o-PiQ)",
                "1,4-Terrylenequinone (TeQ)",
                "1,2-Terrylenequinone (o-TeQ)"
            ],
            "true_referents": [
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-benzoquinone",
                "1,4-naphthoquinone",
                "2-(hydroxymethyl)anthraquinone",
                "2-Aminoanthraquinone",
                "9,10-anthraquinone",
                "Coenzyme Q4",
                "anthraquinone",
                "benzo[a]pyrene-7,8-dione",
                "naphthoquinone",
                "piceatannolquinone",
                "terrequinone A",
                "tetracenequinone"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Acetophenone (AP)",
            "Benzophenone (BP)",
            "Cyclopentadione (CPD)",
            "Cyclohexadione (CHD)",
            "Cycloheptadione (CHtD)",
            "Cyclooctadione (COD)",
            "Cyclononadione (CND)",
            "Cyclodecadione (CDD)",
            "Anthraquinone (AQ)",
            "Naphthoquinone (NQ)",
            "Phenanthrenequinone (PQ)",
            "Tetracenequinone (TQ)",
            "Perylenequinone (PQ)",
            "Naphthalenedione (ND)",
            "Indandione (ID)",
            "Indanedione (IND)",
            "Indenone (IN)",
            "Indenodione (IND)",
            "Indenodione (IND)",
            "Fluorenone (FN)",
            "Fluorenedione (FD)",
            "Fluorenedione (FD)",
            "Benzanthrone (BA)",
            "Benzanthraquinone (BQ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Anthraquinone (AQ)",
                "Naphthoquinone (NQ)",
                "Tetracenequinone (TQ)"
            ],
            "mismatches": [
                "Acetophenone (AP)",
                "Benzophenone (BP)",
                "Cyclopentadione (CPD)",
                "Cyclohexadione (CHD)",
                "Cycloheptadione (CHtD)",
                "Cyclooctadione (COD)",
                "Cyclononadione (CND)",
                "Cyclodecadione (CDD)",
                "Phenanthrenequinone (PQ)",
                "Perylenequinone (PQ)",
                "Naphthalenedione (ND)",
                "Indandione (ID)",
                "Indanedione (IND)",
                "Indenone (IN)",
                "Indenodione (IND)",
                "Fluorenone (FN)",
                "Fluorenedione (FD)",
                "Benzanthrone (BA)",
                "Benzanthraquinone (BQ)"
            ],
            "true_referents": [
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-benzoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "11-O-Demethylpradinone I",
                "2,6-Dimethoxybenzoquinone",
                "2-Hydroxy-4-imino-2,5-cyclohexadienone",
                "2-cyclopentylacetic acid [2-[(3-chloro-9,10-dioxo-2-anthracenyl)amino]-2-oxoethyl] ester",
                "2-hydroxy-3-(2-hydroxyethyl)naphthalene-1,4-dione",
                "2-hydroxy-6-pentadecylcyclohexa-2,5-diene-1,4-dione",
                "4-Bromo-3,5-cyclohexadiene-1,2-dione",
                "5'-deoxyneomacrophorin IV",
                "9,10-anthraquinone",
                "Adriamycinone",
                "Asperphenone A",
                "Daunomycinone",
                "Emodacidamide C",
                "Emodacidamide D",
                "Emodacidamide E",
                "Emodacidamide F",
                "Floricolin B",
                "Fluoquinone",
                "Halawanone A",
                "Halawanone C",
                "Halawanone D",
                "Homostealthin D",
                "Monacyclinone D",
                "Paramagnetoquinone A",
                "Pradinone I",
                "Streptoanthraquinone A",
                "Tetracenoquinocin A",
                "Ventinone A",
                "anthraquinone",
                "benzoisochromanequinone",
                "benzoquinone",
                "benzoquinones",
                "daunorubicin",
                "delta-Indomycinone",
                "docebenone",
                "flaviolin",
                "idebenone",
                "naphthoquinone",
                "pyrroloquinoline quinone",
                "tetracene-1,4-dione",
                "tetracenequinone",
                "tetracenequinones"
            ],
            "TP": 3,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "1,2-Benzoquinone (o-Benzoquinone)",
            "1,4-Benzoquinone (p-Benzoquinone)",
            "1,2-Naphthoquinone",
            "1,4-Naphthoquinone",
            "9,10-Anthraquinone",
            "1,4-Anthraquinone",
            "Plumbagin",
            "Juglone",
            "Lawsone",
            "Thymoquinone",
            "Menadione (Vitamin K3)",
            "Diphenoquinone",
            "2,3-Dimethyl-1,4-benzoquinone",
            "2,5-Dichloro-1,4-benzoquinone",
            "2,3,5,6-Tetramethyl-1,4-benzoquinone",
            "Rhein",
            "Emodin",
            "Alizarin",
            "Protocatechuic quinone",
            "Solavetivone",
            "Plastoquinone",
            "Vitamin K1 (Phytonadione)",
            "Vitamin K2 (Menaquinone)",
            "Vitamin K4 (Menadiol)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,2-Naphthoquinone",
                "1,4-Benzoquinone (p-Benzoquinone)",
                "1,4-Naphthoquinone",
                "9,10-Anthraquinone",
                "Plumbagin",
                "Juglone",
                "Lawsone",
                "Thymoquinone",
                "Rhein",
                "Emodin",
                "Alizarin",
                "Plastoquinone"
            ],
            "mismatches": [
                "1,2-Benzoquinone (o-Benzoquinone)",
                "1,4-Anthraquinone",
                "Menadione (Vitamin K3)",
                "Diphenoquinone",
                "2,3-Dimethyl-1,4-benzoquinone",
                "2,5-Dichloro-1,4-benzoquinone",
                "2,3,5,6-Tetramethyl-1,4-benzoquinone",
                "Protocatechuic quinone",
                "Solavetivone",
                "Vitamin K1 (Phytonadione)",
                "Vitamin K2 (Menaquinone)",
                "Vitamin K4 (Menadiol)"
            ],
            "true_referents": [
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-benzoquinone",
                "1,4-benzoquinones",
                "1,4-naphthoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "2,5-Dimethoxy-6-methyl-3-tridecyl-1,4-benzoquinone",
                "2-Hydroxy-vitamin K",
                "2-chloro-6-hydroxy-1,4-benzoquinone",
                "2-methoxy-5-methyl-1,4-benzoquinone",
                "4,5-dihydroxy-1-methyl-anthraquinone",
                "9,10-anthraquinone",
                "Diploquinone A",
                "Diploquinone B",
                "Emodin 8-beta-D-glucoside",
                "Emodin 8-glucoside",
                "Rhein",
                "Rheochrysin",
                "Rhodoislandin B",
                "alizarin",
                "alizarin blue",
                "alizarin complexone",
                "anthraquinone",
                "atovaquone",
                "caffeic acid quinone",
                "emodin",
                "juglone",
                "lawsone",
                "menadione",
                "menaquinone",
                "menaquinone-4",
                "naphthoquinone",
                "p-quinones",
                "plastoquinone",
                "plumbagin",
                "tetrachloro-1,4-benzoquinone",
                "thymoquinone",
                "tocoquinone",
                "vitamin K"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "1,4-Benzoquinone (BQ)",
            "1,4-Naphthoquinone (NQ)",
            "9,10-Anthraquinone (AQ)",
            "1,4-Anthracenedione",
            "5,12-Naphthacenedione",
            "6,13-Pentacenedione",
            "1,2-Benzoquinone",
            "1,2-Naphthoquinone",
            "9,10-Phenanthrenequinone",
            "Pyrene-4,5-dione",
            "Chrysene-5,6-dione",
            "Benz[a]anthracene-7,12-dione",
            "1,4-Chrysenequinone",
            "2,3-Dimethylanthraquinone",
            "2-Methylanthraquinone",
            "2-Ethylanthraquinone",
            "2,6-Dihydroxyanthraquinone (Anthraflavic acid)",
            "1,8-Dihydroxyanthraquinone (Dantron)",
            "1,2,4-Trihydroxyanthraquinone (Purpurin)",
            "1,2,5,8-Tetrahydroxyanthraquinone (Quinalizarin)",
            "Tetracene-5,12-dione",
            "Phenanthrene-9,10-dione",
            "Acenaphthylene-1,2-dione",
            "Fluorenone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,4-Benzoquinone (BQ)",
                "1,4-Naphthoquinone (NQ)",
                "9,10-Anthraquinone (AQ)",
                "1,2-Benzoquinone",
                "1,2-Naphthoquinone",
                "2-Methylanthraquinone",
                "Tetracene-5,12-dione"
            ],
            "mismatches": [
                "1,4-Anthracenedione",
                "5,12-Naphthacenedione",
                "6,13-Pentacenedione",
                "9,10-Phenanthrenequinone",
                "Pyrene-4,5-dione",
                "Chrysene-5,6-dione",
                "Benz[a]anthracene-7,12-dione",
                "1,4-Chrysenequinone",
                "2,3-Dimethylanthraquinone",
                "2-Ethylanthraquinone",
                "2,6-Dihydroxyanthraquinone (Anthraflavic acid)",
                "1,8-Dihydroxyanthraquinone (Dantron)",
                "1,2,4-Trihydroxyanthraquinone (Purpurin)",
                "1,2,5,8-Tetrahydroxyanthraquinone (Quinalizarin)",
                "Phenanthrene-9,10-dione",
                "Acenaphthylene-1,2-dione",
                "Fluorenone"
            ],
            "true_referents": [
                "(2R,3S)-7-ethyl-1,2,3,4-tetrahydro-2,3,8-trihydroxy-6-methoxy-3-methyl-9,10-anthracenedione",
                "(5R,6R)-3-ethyl-1,5,6-trihydroxy-8-methoxy-5,6-dihydrobenzo[a]anthracene-7,12-dione",
                "(S)-2,5-dihydroxy-2-methyl-1,2,3,4-tetrahydroanthracene-9,10-dione",
                "1,2,5,6-tetrahydroxyanthraquinone",
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,3,6,8-tetrahydroxyanthraquinone",
                "1,3-Dimethoxyanthraquinone",
                "1,4,5,8-tetrahydroxyanthraquinone",
                "1,4,5-trihydroxyanthraquinone",
                "1,4,6-trihydroxyanthraquinone",
                "1,4-benzoquinone",
                "1,4-bis[2-(4-hydroxyphenyl)ethylamino]anthracene-9,10-dione",
                "1,4-dihydroxy-2-methylanthraquinone",
                "1,4-naphthoquinone",
                "1-Amino-2-methylanthraquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "12-demethylmultiorthoquinone",
                "2,2'-bis-(7-methyl-1,4,5-trihydroxy-anthracene-9,10-dione)",
                "2,3-dimethoxynaphthalene-1,4-dione",
                "2-hydroxyanthraquinone",
                "2-methylanthraquinone",
                "4,5,7-trihydroxy-9,10-dioxo-2-anthracenecarboxylic acid",
                "9,10-anthraquinone",
                "Fluoquinone",
                "anthraquinone",
                "benzo[a]pyrene-7,8-dione",
                "dihydroxyanthraquinone",
                "flaviolin",
                "naphthoquinone",
                "tetracene-1,4-dione",
                "tetracene-5,12-dione",
                "tetracenequinone",
                "trihydroxyanthraquinone"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "1,4-Naphthoquinone",
            "Anthraquinone",
            "Benzoquinone",
            "Ubiquinone (Coenzyme Q10)",
            "Lawsone",
            "Juglone",
            "Plumbagin",
            "Menadione (Vitamin K3)",
            "Phylloquinone (Vitamin K1)",
            "Menaquinone (Vitamin K2)",
            "Emodin",
            "Aloe-emodin",
            "Rhein",
            "Chrysophanol",
            "Physcion",
            "Hypericin",
            "Atovaquone",
            "Mitomycin C",
            "Doxorubicin",
            "Daunorubicin",
            "Mitoxantrone",
            "Ametantrone",
            "Pyrroloquinoline quinone (PQQ)",
            "Shikonin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "1,4-Naphthoquinone",
                "Anthraquinone",
                "Benzoquinone",
                "Lawsone",
                "Juglone",
                "Plumbagin",
                "Menadione (Vitamin K3)",
                "Phylloquinone (Vitamin K1)",
                "Menaquinone (Vitamin K2)",
                "Emodin",
                "Rhein",
                "Chrysophanol",
                "Physcion",
                "Atovaquone",
                "Mitomycin C",
                "Doxorubicin",
                "Daunorubicin",
                "Mitoxantrone",
                "Pyrroloquinoline quinone (PQQ)",
                "Shikonin"
            ],
            "mismatches": [
                "Ubiquinone (Coenzyme Q10)",
                "Aloe-emodin",
                "Hypericin",
                "Ametantrone"
            ],
            "true_referents": [
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-naphthoquinone",
                "2-hydroxychrysophanol",
                "4,5-dihydroxy-1-methyl-anthraquinone",
                "9,10-anthraquinone",
                "Adriamycinone",
                "Aloe emodin",
                "Aloe emodin w-acetate",
                "Daunomycinone",
                "Emodin 8-beta-D-glucoside",
                "Emodin 8-glucoside",
                "L-dopaquinone",
                "Methylpedicinin",
                "Protetrone",
                "Rhein",
                "Rheochrysin",
                "Rhodoislandin B",
                "Shikonin",
                "anthraquinone",
                "atovaquone",
                "atromentin",
                "benzoquinone",
                "benzoquinones",
                "chrysophanol",
                "daunorubicin",
                "doxorubicin",
                "doxorubicinol",
                "emodin",
                "juglone",
                "lawsone",
                "menadione",
                "menaquinone",
                "mitomycin A",
                "mitomycin B",
                "mitomycin C",
                "mitoxantrone",
                "phylloquinone",
                "physcion",
                "plumbagin",
                "pyrroloquinoline quinone",
                "ubiquinone-1"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Quinone (Q)",
            "Anthraquinone (AQ)",
            "Naphthoquinone (NQ)",
            "Phenanthrenequinone (PQ)",
            "Benzoquinone (BQ)",
            "Toluquinone (TQ)",
            "Xanthone (X)",
            "Thioxanthone (TX)",
            "Acridone (AC)",
            "Phenazine (PZ)",
            "Phenoxazine (PX)",
            "Phenothiazine (PT)",
            "Anthrarobin (AR)",
            "Hypericin (HY)",
            "Plumbagin (PL)",
            "Lapachol (LP)",
            "Lawsone (LW)",
            "Juglone (JG)",
            "Vitamin K (VK)",
            "Ubiquinone (UQ)",
            "Plastoquinone (PQ)",
            "Menaquinone (MK)",
            "Rhodoquinone (RQ)",
            "Chlorobiumquinone (CQ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Anthraquinone (AQ)",
                "Naphthoquinone (NQ)",
                "Benzoquinone (BQ)",
                "Plumbagin (PL)",
                "Lapachol (LP)",
                "Lawsone (LW)",
                "Juglone (JG)",
                "Vitamin K (VK)",
                "Ubiquinone (UQ)",
                "Plastoquinone (PQ)",
                "Menaquinone (MK)",
                "Rhodoquinone (RQ)"
            ],
            "mismatches": [
                "Quinone (Q)",
                "Phenanthrenequinone (PQ)",
                "Toluquinone (TQ)",
                "Xanthone (X)",
                "Thioxanthone (TX)",
                "Acridone (AC)",
                "Phenazine (PZ)",
                "Phenoxazine (PX)",
                "Phenothiazine (PT)",
                "Anthrarobin (AR)",
                "Hypericin (HY)",
                "Chlorobiumquinone (CQ)"
            ],
            "true_referents": [
                "(1'S,5'R)-5'-hydroxyaverantin",
                "(1'S,5'S)-5'-hydroxyaverantin",
                "(2Z,10Z,26Z)-ubiquinone",
                "(7S,9R)-andicoquinone A",
                "(S)-5'-oxoaverantin",
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "2,6-Dimethoxybenzoquinone",
                "8-chloro-10H-phenothiazine-1,4-dione",
                "9,10-anthraquinone",
                "Acrimine B",
                "Bromochlorogentisylquinone A",
                "Bromochlorogentisylquinone B",
                "Cytosporanthraxanthone",
                "Methylpedicinin",
                "Nenesophanol",
                "Oxyskyrin",
                "Paramagnetoquinone A",
                "anthragallol",
                "anthraquinone",
                "anthrarufin",
                "benzoquinone",
                "chrysazin",
                "dithianon",
                "juglone",
                "lapachol",
                "lawsone",
                "m-quinone",
                "menaquinone",
                "naphthoquinone",
                "p-quinones",
                "plastoquinone",
                "plumbagin",
                "rhodoquinones",
                "tocoquinone-10",
                "triaziquone",
                "triptoquinone A",
                "triptoquinone B",
                "ubiquinone-1",
                "vitamin K",
                "vitamin K epoxide"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Benzoquinone (BQ)",
            "Naphthoquinone (NQ)",
            "Anthraquinone (AQ)",
            "Phenanthrenequinone (PQ)",
            "Chrysene-5,12-dione (CD)",
            "Benzo[a]anthracene-7,12-dione (BAD)",
            "Benzo[b]fluorenone (BF)",
            "Benzo[c]phenanthrene-1,4-dione (BPD)",
            "Dibenzo[a,c]anthracene-7,14-dione (DAD)",
            "Pyrene-4,5-dione (PD)",
            "Benzo[a]pyrene-1,6-dione (BPD1)",
            "Benzo[a]pyrene-3,6-dione (BPD3)",
            "Benzo[c]chrysene-1,2-dione (BCD)",
            "Dibenzo[a,h]anthracene-1,12-dione (DAD1)",
            "Dibenzo[a,l]pyrene-3,10-dione (DPD)",
            "Indeno[1,2,3-cd]pyrene-5,12-dione (IPD)",
            "Benzo[ghi]perylene-1,12-dione (BPD)",
            "Coronene-4,5,10,11-tetraone (CT)",
            "Emodin (EMD)",
            "Aloe-emodin (AE)",
            "Rhein (RHN)",
            "Chrysophanol (CP)",
            "Physcion (PC)",
            "Danthron (DAN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzoquinone (BQ)",
                "Naphthoquinone (NQ)",
                "Anthraquinone (AQ)",
                "Emodin (EMD)",
                "Aloe-emodin (AE)",
                "Rhein (RHN)",
                "Chrysophanol (CP)",
                "Physcion (PC)"
            ],
            "mismatches": [
                "Phenanthrenequinone (PQ)",
                "Chrysene-5,12-dione (CD)",
                "Benzo[a]anthracene-7,12-dione (BAD)",
                "Benzo[b]fluorenone (BF)",
                "Benzo[c]phenanthrene-1,4-dione (BPD)",
                "Dibenzo[a,c]anthracene-7,14-dione (DAD)",
                "Pyrene-4,5-dione (PD)",
                "Benzo[a]pyrene-1,6-dione (BPD1)",
                "Benzo[a]pyrene-3,6-dione (BPD3)",
                "Benzo[c]chrysene-1,2-dione (BCD)",
                "Dibenzo[a,h]anthracene-1,12-dione (DAD1)",
                "Dibenzo[a,l]pyrene-3,10-dione (DPD)",
                "Indeno[1,2,3-cd]pyrene-5,12-dione (IPD)",
                "Benzo[ghi]perylene-1,12-dione (BPD)",
                "Coronene-4,5,10,11-tetraone (CT)",
                "Danthron (DAN)"
            ],
            "true_referents": [
                "(-)-daeschol A",
                "(1'S,2'R,3'R,4'R,5'R)-decilorene B",
                "(5R,6R)-3-ethyl-1,5,6-trihydroxy-8-methoxy-5,6-dihydrobenzo[a]anthracene-7,12-dione",
                "(S)-2,5-dihydroxy-2-methyl-1,2,3,4-tetrahydroanthracene-9,10-dione",
                "1,2-benzoquinone",
                "1,2-naphthoquinone",
                "1,4-bis[2-(4-hydroxyphenyl)ethylamino]anthracene-9,10-dione",
                "1-hydroxy-2-methyl-9,10-anthraquinone",
                "2,2'-bis-(7-methyl-1,4,5-trihydroxy-anthracene-9,10-dione)",
                "2,3-dimethoxynaphthalene-1,4-dione",
                "2,6-Dimethoxybenzoquinone",
                "2-hydroxychrysophanol",
                "6,6'-oxybis(1,3,8-trihydroxy-2-((S)-1-hydroxyhexyl)anthracene-9,10-dione)",
                "6,6'-oxybis(1,3,8-trihydroxy-2-((S)-1-methoxyhexyl)anthracene-9,10-dione)",
                "9,10-anthraquinone",
                "Aloe emodin",
                "Aloe emodin w-acetate",
                "D-dopachrome",
                "Emodin 8-beta-D-glucoside",
                "Emodin 8-glucoside",
                "Floricolin B",
                "Homostealthin D",
                "Paramagnetoquinone A",
                "Rhein",
                "Rhodoislandin B",
                "anthraquinone",
                "benzo[a]pyrene-7,8-dione",
                "benzoquinone",
                "chrysophanol",
                "dibenzo[1,4]dioxine-2,3-dione",
                "dithianon",
                "emodin",
                "naphthoquinone",
                "physcion",
                "tetracene-1,4-dione",
                "tetracene-5,12-dione"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Benzil (C6H4(CO)2)",
            "Chalcone (C6H4(CH)=CH(CO)CH=CH(CO)C6H4)",
            "Flavone (C6H4(OCH)3)",
            "Isocoumarin (C6H4(CH)=CH(CO)CH=CH(CO)C6H4)",
            "Phenanthridine (C12H8N2)",
            "Quinoline (C9H7NO)",
            "Isoquinoline (C9H7NO)",
            "Indole (C8H7N)",
            "Carbazole (C12H9N)",
            "Acridine (C13H8N2)",
            "Phthalimide (C8H5NO2)",
            "Benzophenone (C13H10O)",
            "Flavanone (C15H10O2)",
            "Chalcone (C6H4(CH)=CH(CO)CH=CH(CO)C6H4)",
            "Coumarin (C9H6O2)",
            "Furocoumarin (C11H6O3)",
            "Benzoxazole (C7H5NO)",
            "Benzothiazole (C7H5NS)",
            "Quinazoline (C9H7N3)",
            "Phenanthrene (C14H10)",
            "Anthracene (C14H10)",
            "Tetracene (C18H12)",
            "Perylene (C20H12)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Benzil (C6H4(CO)2)",
                "Chalcone (C6H4(CH)=CH(CO)CH=CH(CO)C6H4)",
                "Flavone (C6H4(OCH)3)",
                "Isocoumarin (C6H4(CH)=CH(CO)CH=CH(CO)C6H4)",
                "Phenanthridine (C12H8N2)",
                "Quinoline (C9H7NO)",
                "Isoquinoline (C9H7NO)",
                "Indole (C8H7N)",
                "Carbazole (C12H9N)",
                "Acridine (C13H8N2)",
                "Phthalimide (C8H5NO2)",
                "Benzophenone (C13H10O)",
                "Flavanone (C15H10O2)",
                "Coumarin (C9H6O2)",
                "Furocoumarin (C11H6O3)",
                "Benzoxazole (C7H5NO)",
                "Benzothiazole (C7H5NS)",
                "Quinazoline (C9H7N3)",
                "Phenanthrene (C14H10)",
                "Anthracene (C14H10)",
                "Tetracene (C18H12)",
                "Perylene (C20H12)"
            ],
            "true_referents": [
                "(1S,3R)-austrocortirubin",
                "(2R,3S)-7-ethyl-1,2,3,4-tetrahydro-2,3,8-trihydroxy-6-methoxy-3-methyl-9,10-anthracenedione",
                "(2S)-versicolorone",
                "(3S,4aS,12bS)-3,4a,8,12b-tetrahydroxy-3-methyl-2,4,5,6-tetrahydrobenzo[a]anthracene-1,7,12-trione",
                "(S)-2,5-dihydroxy-2-methyl-1,2,3,4-tetrahydroanthracene-9,10-dione",
                "1,3,6,8-tetrahydroxyanthraquinone",
                "1,4,5,8-tetrahydroxy-3_ethylnaphthalene2,6-dione",
                "1,4,5,8-tetrahydroxyanthraquinone",
                "1,4-benzoquinone imine",
                "11-hydroxy-5-methyl-2-(2-methyl-3-prop-1-enyloxiran-2-yl)naphtho[2,3-h]chromene-4,7,12-trione",
                "2,2'-bis-(7-methyl-1,4,5-trihydroxy-anthracene-9,10-dione)",
                "2,3-bis(2-hydroxyethylthio)naphthalene-1,4-dione",
                "2,3-dimethoxynaphthalene-1,4-dione",
                "3,4,3',4'-Bisdehydroxanthomegnin",
                "3-demethylubiquinone-8(1-)",
                "3-hydroxy-1-methoxy-9,10-dioxo-2-anthracenecarboxaldehyde",
                "3-hydroxy-2-hydroxymethyl-9,10-anthraquinone",
                "3-methyl-6-methoxy-2-octaprenyl-1,4-benzoquinone",
                "5-hydroxy-2-(1'-hydroxyethyl)naphtho[2,3-b]furan-4,9-dione",
                "6,8-O-dimethylbipolarin",
                "6-anilino-5,8-quinolinedione",
                "7-O-geranyl-2-O,3-dimethylflaviolin",
                "7C-Aglycone",
                "8-hydroxy-2-(1'-hydroxyethyl)naphtho-[2,3-b]-furan-4,9-dione",
                "Anhydroflavomannin-9,10-quinone 6,6',8'-tri-O-methyl ether",
                "Carbamazepine-o-quinone",
                "Flaviogeranin",
                "N-[2-(2-methyl-1H-indol-3-yl)ethyl]-1-nitro-9,10-dioxo-2-anthracenecarboxamide",
                "N-acetyl-1,4-benzoquinone imine",
                "benzimidazole-4,7-quinone",
                "benzo[a]pyrene-7,8-dione",
                "benzoquinone",
                "chrysophanol",
                "dibenzo[1,4]dioxine-2,3-dione",
                "indole-5,6-quinone",
                "indole-5,6-quinone-2-carboxylic acid",
                "tetracene-1,4-dione",
                "tetracene-5,12-dione"
            ],
            "TP": 0,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            "Ellipticine (ELL)",
            "Homellipticine (HML)",
            "Olivacine (OLV)",
            "Camptothecin (CPT)",
            "10-Hydroxycamptothecin (HCPT)",
            "10-Hydroxymethylcamptothecin (HMCP)",
            "Dehydrocamptothecin (DHCP)",
            "Chlorocamptothecin (CCPT)",
            "Topotecan (TPT)",
            "Irinotecan (CPT11)",
            "Rubitecan (RBT)",
            "Gimatecan (GBT)",
            "Diflomotecan (DFM)",
            "9-Nitrocamptothecin (9NC)",
            "Belotecan (BLT)",
            "Chloroinsorciben A (CIA)",
            "Insorcen A (ISA)",
            "Insorcen B (ISB)",
            "Insorcen C (ISC)",
            "Insorcen D (ISD)",
            "Insorcen E (ISE)",
            "Pseudorubrocavernine (PRC)",
            "Rubrocavernine (RBC)",
            "Dehydroisojavanicin (DHI)",
            "Isojavanicin (IJV)",
            "Javanicin (JV)",
            "Dehydrojavanicin (DHJV)",
            "Javanicum (JVCM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Ellipticine (ELL)",
                "Homellipticine (HML)",
                "Olivacine (OLV)",
                "Camptothecin (CPT)",
                "10-Hydroxycamptothecin (HCPT)",
                "10-Hydroxymethylcamptothecin (HMCP)",
                "Dehydrocamptothecin (DHCP)",
                "Chlorocamptothecin (CCPT)",
                "Topotecan (TPT)",
                "Irinotecan (CPT11)",
                "Rubitecan (RBT)",
                "Gimatecan (GBT)",
                "Diflomotecan (DFM)",
                "9-Nitrocamptothecin (9NC)",
                "Belotecan (BLT)",
                "Chloroinsorciben A (CIA)",
                "Insorcen A (ISA)",
                "Insorcen B (ISB)",
                "Insorcen C (ISC)",
                "Insorcen D (ISD)",
                "Insorcen E (ISE)",
                "Pseudorubrocavernine (PRC)",
                "Rubrocavernine (RBC)",
                "Dehydroisojavanicin (DHI)",
                "Isojavanicin (IJV)",
                "Javanicin (JV)",
                "Dehydrojavanicin (DHJV)",
                "Javanicum (JVCM)"
            ],
            "true_referents": [
                "(-)-2'R-1-hydroxyisorhodoptilometrin",
                "(1'S)-1'-O-methyl-7-chloroaverantin",
                "(1'S)-6-O-methyl-7-chloroaverantin",
                "(1'S)-7-chloroaverantin",
                "(1S,3R)-austrocortirubin",
                "(S)-5'-oxoaverantin",
                "(S)-averantin",
                "1'-hydroxyisorhodoptilometrin",
                "11aR-stealthin D",
                "11aR-stealthin E",
                "13-dihydrodaunorubicin",
                "2-Methyl-1-nitroanthraquinone",
                "5'-deoxyneomacrophorin IV",
                "5-O-ethyl embelin",
                "6,1???-O,O-dimethylaverantin",
                "8-D-Olivosyl-landomycin",
                "Adriamycinone",
                "Alterporriol C",
                "Ansalactam A",
                "Anserinone A",
                "Anserinone B",
                "Bequinostatin B",
                "Betulinan C",
                "Daunomycinone",
                "Dihydroechinofuran",
                "Dihydromenaquinone-8",
                "Divergolide M",
                "Elloramycin E",
                "Emodacidamide F",
                "Ent-astropaquinone C",
                "Griseusin D",
                "Kirschsteinin C",
                "Myrothecol G",
                "Oxyjavanicin",
                "Rubellin A",
                "Rubellin B",
                "Rubellin E",
                "Rubiflavinone C-1",
                "Rubimycinone A",
                "TMC-66",
                "Termstrin B",
                "Termstrin C",
                "Termstrin D",
                "alterporriol E",
                "daunorubicin",
                "dihydroxyanthraquinone",
                "doxorubicin",
                "epsilon-rhodomycinone",
                "erythrostominone",
                "idebenone",
                "isotanshinone IIB",
                "mitoxantrone",
                "rubiadin",
                "strongylophorine-26"
            ],
            "TP": 0,
            "FP": 28,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "quinone",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "benzene",
                "Canonical name": "benzene"
            },
            {
                "Referent": "butadiene",
                "Canonical name": "butadiene"
            },
            {
                "Referent": "pyridine",
                "Canonical name": "pyridine"
            },
            {
                "Referent": "furan",
                "Canonical name": "furan"
            },
            {
                "Referent": "thiophene",
                "Canonical name": "thiophene"
            },
            {
                "Referent": "pyrrole",
                "Canonical name": "pyrrole"
            },
            {
                "Referent": "pyran",
                "Canonical name": "pyran"
            },
            {
                "Referent": "benzopyran",
                "Canonical name": "benzopyran"
            },
            {
                "Referent": "chromene",
                "Canonical name": "chromene"
            },
            {
                "Referent": "isochromene",
                "Canonical name": "isochromene"
            },
            {
                "Referent": "stilbene",
                "Canonical name": "stilbene"
            },
            {
                "Referent": "indene",
                "Canonical name": "indene"
            },
            {
                "Referent": "anthracene",
                "Canonical name": "anthracene"
            },
            {
                "Referent": "tetracene",
                "Canonical name": "tetracene"
            },
            {
                "Referent": "pentacene",
                "Canonical name": "pentacene"
            },
            {
                "Referent": "hexacene",
                "Canonical name": "hexacene"
            },
            {
                "Referent": "heptacene",
                "Canonical name": "heptacene"
            },
            {
                "Referent": "octacene",
                "Canonical name": "octacene"
            },
            {
                "Referent": "nonacene",
                "Canonical name": "nonacene"
            },
            {
                "Referent": "decacene",
                "Canonical name": "decacene"
            },
            {
                "Referent": "undecacene",
                "Canonical name": "undecacene"
            },
            {
                "Referent": "dodecacene",
                "Canonical name": "dodecacene"
            },
            {
                "Referent": "tridecacene",
                "Canonical name": "tridecacene"
            },
            {
                "Referent": "tetradecacene",
                "Canonical name": "tetradecacene"
            },
            {
                "Referent": "pentadecacene",
                "Canonical name": "pentadecacene"
            },
            {
                "Referent": "hexadecacene",
                "Canonical name": "hexadecacene"
            },
            {
                "Referent": "heptadecacene",
                "Canonical name": "heptadecacene"
            },
            {
                "Referent": "octadecacene",
                "Canonical name": "octadecacene"
            },
            {
                "Referent": "nonadecacene",
                "Canonical name": "nonadecacene"
            },
            {
                "Referent": "icosacene",
                "Canonical name": "icosacene"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "tetracene"
            ],
            "mismatches": [
                "benzene",
                "butadiene",
                "pyridine",
                "furan",
                "thiophene",
                "pyrrole",
                "pyran",
                "benzopyran",
                "chromene",
                "isochromene",
                "stilbene",
                "indene",
                "anthracene",
                "pentacene",
                "hexacene",
                "heptacene",
                "octacene",
                "nonacene",
                "decacene",
                "undecacene",
                "dodecacene",
                "tridecacene",
                "tetradecacene",
                "pentadecacene",
                "hexadecacene",
                "heptadecacene",
                "octadecacene",
                "nonadecacene",
                "icosacene"
            ],
            "true_referents": [
                "(+)-formylanserinone B",
                "(1'S,2'R,3'R,4'R,5'R)-decilorene B",
                "(2S)-versicolorone",
                "(2S,9S,10S,3'S,4'S,6'S)-griseusin E",
                "11-hydroxy-5-methyl-2-(2-methyl-3-prop-1-enyloxiran-2-yl)naphtho[2,3-h]chromene-4,7,12-trione",
                "2,3-bis(2-hydroxyethylthio)naphthalene-1,4-dione",
                "3,4,3',4'-Bisdehydroxanthomegnin",
                "6,6'-oxybis(1,3,8-trihydroxy-2-((S)-1-hydroxyhexyl)anthracene-9,10-dione)",
                "7C-Aglycone",
                "M-4",
                "Mycenon",
                "benzo[a]pyrene-7,8-dione",
                "dysidine",
                "lignin cw compound-275",
                "lignin cw compound-276",
                "tetracene-1,4-dione",
                "tetracene-5,12-dione",
                "torososide B"
            ],
            "TP": 1,
            "FP": 29,
            "FN": 0
        }
    }
]