[
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "(E)-trans-miyabenol C",
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(E)-trans-miyabenol C",
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "(2R,3R)-cis-delta-viniferin",
            "(2R,3S)-trans-epsilon-viniferin",
            "(-)-cis-epsilon-viniferin",
            "(2R,3S)-cis-epsilon-viniferin",
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(2R,3R)-cis-delta-viniferin",
                "(2R,3S)-trans-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3S)-cis-epsilon-viniferin",
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
            "(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [
                "(+)-gallocatechin"
            ],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "(2R,3R)-cis-delta-viniferin",
            "(2R,3S)-trans-epsilon-viniferin",
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(E)-trans-miyabenol C",
            "(-)-cis-epsilon-viniferin",
            "cis-resveratrol",
            "(2R,3S)-cis-epsilon-viniferin",
            "(+)-gallocatechin gallate",
            "cyanin betaine",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(2R,3R)-cis-delta-viniferin",
                "(2R,3S)-trans-epsilon-viniferin",
                "(E)-trans-miyabenol C",
                "(-)-cis-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin"
            ],
            "mismatches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "cyanin betaine",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 6,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "8-amino-8-demethylriboflavin 5'-phosphate",
            "dihydroriboflavins"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "8-amino-8-demethylriboflavin 5'-phosphate",
                "dihydroriboflavins"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "(2R,3R)-cis-delta-viniferin",
            "(2R,3S)-trans-epsilon-viniferin",
            "(E)-trans-miyabenol C",
            "(-)-cis-epsilon-viniferin",
            "cis-resveratrol",
            "(2R,3S)-cis-epsilon-viniferin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(2R,3R)-cis-delta-viniferin",
                "(2R,3S)-trans-epsilon-viniferin",
                "(E)-trans-miyabenol C",
                "(-)-cis-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "(2R,3R)-cis-delta-viniferin",
            "(2R,3S)-trans-epsilon-viniferin",
            "(-)-cis-epsilon-viniferin",
            "(2R,3S)-cis-epsilon-viniferin",
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(2R,3R)-cis-delta-viniferin",
                "(2R,3S)-trans-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3S)-cis-epsilon-viniferin",
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "dihydroriboflavins",
            "8-amino-8-demethylriboflavin",
            "8-amino-8-demethylriboflavin 5'-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "dihydroriboflavins",
                "8-amino-8-demethylriboflavin",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "8-amino-8-demethylriboflavin 5'-phosphate",
            "dihydroriboflavins"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "8-amino-8-demethylriboflavin 5'-phosphate",
                "dihydroriboflavins"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-gallocatechin gallate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin gallate"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 1
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "8-amino-8-demethylriboflavin 5'-phosphate",
            "dihydroriboflavins"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "8-amino-8-demethylriboflavin 5'-phosphate",
                "dihydroriboflavins"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(2R,3S)-trans-epsilon-viniferin",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin gallate",
            "(+)-gallocatechin-(4beta->8)-(+)-catechin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin gallate"
            ],
            "mismatches": [
                "(2R,3S)-trans-epsilon-viniferin"
            ],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 4,
            "FP": 1,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cyanidin cation",
        "domain": "chemistry",
        "response": [
            "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
            "cyanidin 3,7-di-O-beta-D-glucoside",
            "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
            "cyanidin 3-O-beta-D-galactoside betaine",
            "cyanidin 3-O-beta-D-galactoside",
            "cyanin betaine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanin betaine"
            ],
            "mismatches": [],
            "true_referents": [
                "cyanidin 3,7-di-O-beta-D-glucoside",
                "cyanin betaine",
                "cyanidin 3-O-beta-D-galactoside betaine",
                "cyanidin 3-O-beta-D-galactoside",
                "cyanidin 3-O-(6-O-glucosyl-2-O-xylosylgalactoside)",
                "cyanidin 3-O-(6-O-malonyl-beta-D-glucoside)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "resveratrol",
        "domain": "chemistry",
        "response": [
            "cis-resveratrol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cis-resveratrol"
            ],
            "mismatches": [],
            "true_referents": [
                "(E)-trans-miyabenol C",
                "(2R,3S)-trans-epsilon-viniferin",
                "cis-resveratrol",
                "(2R,3S)-cis-epsilon-viniferin",
                "(-)-cis-epsilon-viniferin",
                "(2R,3R)-cis-delta-viniferin"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "riboflavin",
        "domain": "chemistry",
        "response": [
            "8-amino-8-demethylriboflavin",
            "8-amino-8-demethylriboflavin 5'-phosphate",
            "dihydroriboflavins"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "8-amino-8-demethylriboflavin",
                "8-amino-8-demethylriboflavin 5'-phosphate",
                "dihydroriboflavins"
            ],
            "mismatches": [],
            "true_referents": [
                "dihydroriboflavins",
                "coenzyme alpha-F420-3",
                "1,5-dihydrocoenzyme F420-6",
                "8-amino-8-demethylriboflavin",
                "1,5-dihydrocoenzyme F420",
                "8-amino-8-demethylriboflavin 5'-phosphate"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "(+)-gallocatechin",
        "domain": "chemistry",
        "response": [
            "(+)-gallocatechin-(4beta->8)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
            "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
            "(+)-gallocatechin gallate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin gallate"
            ],
            "mismatches": [],
            "true_referents": [
                "(+)-catechin-(4alpha->6)-(+)-gallocatechin",
                "(+)-gallocatechin gallate",
                "(+)-gallocatechin-(4alpha->6)-(+)-catechin",
                "(+)-gallocatechin-(4alpha->8)-(+)-catechin",
                "(+)-gallocatechin-(4beta->8)-(+)-catechin",
                "(-)-epicatechin-(4beta->8)-(+)-gallocatechin"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 2
        }
    }
]