[
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "mismatches": [
                "N-acetyl-1,4-benzoquinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 2,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 0,
            "FP": 4,
            "FN": 8
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N(6)-(pyridoxal phosphate)-L-lysine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "phi-v4",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [],
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "mismatches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 5,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "4-iminobutane-1,2,3-triol",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2-imino-3-(indol-3-yl)propanoic acid",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid"
            ],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "4-iminobutane-1,2,3-triol",
                "methanimine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 3,
            "FP": 5,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "Hemsleyin imine A",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "methanimine"
            ],
            "mismatches": [
                "Hemsleyin imine A"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 1,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "gemma-3",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "Hemsleyin imine A",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "4-iminobutane-1,2,3-triol",
            "beta-aminoorceimine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "methanimine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "6-iminohexane-1,2,3,4,5-pentol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemsleyin imine A",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "beta-aminoorceimine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid"
            ],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "4-iminobutane-1,2,3-triol",
                "methanimine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine",
                "6-iminohexane-1,2,3,4,5-pentol"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 5,
            "FP": 8,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "methanimine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "Hemsleyin imine A",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "6-iminohexane-1,2,3,4,5-pentol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol"
            ],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "6-iminohexane-1,2,3,4,5-pentol"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 2,
            "FP": 4,
            "FN": 6
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "5-iminohexane-1,2,3,4,6-pentol",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "4-iminobutane-1,2,3-triol",
            "beta-aminoorceimine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "4-iminobutane-1,2,3-triol"
            ],
            "mismatches": [
                "5-iminohexane-1,2,3,4,6-pentol",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "beta-aminoorceimine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 4,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4o-mini",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [],
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "methanimine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-4-32k",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [],
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [
                "salicylaldehyde imine"
            ],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 2,
            "FP": 1,
            "FN": 6
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "Hemsleyin imine A",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "4-iminobutane-1,2,3-triol",
            "para-Benzoquinone dioxime",
            "beta-aminoorceimine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "MP-A08",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "methanimine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "6-iminohexane-1,2,3,4,5-pentol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine",
                "4-iminobutane-1,2,3-triol",
                "MP-A08",
                "methanimine",
                "6-iminohexane-1,2,3,4,5-pentol"
            ],
            "mismatches": [
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "Hemsleyin imine A",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "para-Benzoquinone dioxime",
                "beta-aminoorceimine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 8,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": "",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine",
                "methanimine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "o1-mini",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "para-Benzoquinone dioxime",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid"
            ],
            "mismatches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "N(6)-(pyridoxal phosphate)-L-lysine",
                "para-Benzoquinone dioxime",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 3,
            "FP": 5,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine",
                "methanimine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 3
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 0,
            "FP": 4,
            "FN": 8
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "methanimine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "para-Benzoquinone dioxime",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "5-Imino-2-methyl-1-cyclopenten-1-ol"
            ],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "para-Benzoquinone dioxime",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 1,
            "FP": 7,
            "FN": 7
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N(6)-(pyridoxal phosphate)-L-lysine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "mismatches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 4,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 0,
            "FP": 5,
            "FN": 8
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "2,6-dichloroindophenol",
            "N-acetyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "2,6-dichloroindophenol",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-iminohexane-1,2,3,4,6-pentol",
            "Hemsleyin imine A",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "4-iminobutane-1,2,3-triol",
            "para-Benzoquinone dioxime",
            "beta-aminoorceimine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "methanimine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "6-iminohexane-1,2,3,4,5-pentol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "4-iminobutane-1,2,3-triol",
                "methanimine",
                "6-iminohexane-1,2,3,4,5-pentol"
            ],
            "mismatches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-iminohexane-1,2,3,4,6-pentol",
                "Hemsleyin imine A",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "para-Benzoquinone dioxime",
                "beta-aminoorceimine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 6,
            "FP": 10,
            "FN": 2
        }
    },
    {
        "test": "decide-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "Hemsleyin imine A",
            "2-imino-3-(indol-3-yl)propanoic acid",
            "para-Benzoquinone dioxime",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
            "methanimine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemsleyin imine A",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid"
            ],
            "mismatches": [
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "para-Benzoquinone dioxime",
                "methanimine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 4,
            "FP": 6,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-acetyl-1,4-benzoquinone imine",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-acetyl-1,4-benzoquinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "Hemsleyin imine A",
            "beta-aminoorceimine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines"
            ],
            "mismatches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "Hemsleyin imine A",
                "beta-aminoorceimine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 2,
            "FP": 6,
            "FN": 6
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "Hemsleyin imine A",
            "para-Benzoquinone dioxime",
            "beta-aminoorceimine",
            "5-Imino-2-methyl-1-cyclopenten-1-ol",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemsleyin imine A",
                "beta-aminoorceimine",
                "5-Imino-2-methyl-1-cyclopenten-1-ol"
            ],
            "mismatches": [
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "para-Benzoquinone dioxime",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 3,
            "FP": 5,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "quinone imine",
        "domain": "chemistry",
        "response": [
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine",
            "N-acetyl-1,4-benzoquinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-acetyl-1,4-benzoquinone imine"
            ],
            "mismatches": [],
            "true_referents": [
                "para-Benzoquinone dioxime",
                "Sarubicin A",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "2,6-dichloroindophenol"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 5
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "aldimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imine",
            "salicylaldehyde imines",
            "salicylaldehyde N-tosylimines",
            "methanimine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "salicylaldehyde imine",
                "salicylaldehyde imines",
                "salicylaldehyde N-tosylimines",
                "methanimine"
            ],
            "mismatches": [],
            "true_referents": [
                "MP-A08",
                "salicylaldehyde imine",
                "6-iminohexane-1,2,3,4,5-pentol",
                "methanimine",
                "salicylaldehyde imines",
                "4-iminobutane-1,2,3-triol",
                "salicylaldehyde N-tosylimines",
                "N(6)-(pyridoxal phosphate)-L-lysine"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 4
        }
    },
    {
        "test": "decide-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "ketimine",
        "domain": "chemistry",
        "response": [
            "salicylaldehyde imines",
            "salicylaldehyde imine",
            "salicylaldehyde N-tosylimines",
            "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
            "N-acetyl-1,4-benzoquinone imine",
            "5-hydroxydiclofenac quinone imine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "salicylaldehyde imines",
                "salicylaldehyde imine",
                "salicylaldehyde N-tosylimines",
                "N-3,5-dichloro-4-hydroxyphenyl-1,4-benzoquinone imine",
                "N-acetyl-1,4-benzoquinone imine",
                "5-hydroxydiclofenac quinone imine"
            ],
            "true_referents": [
                "2,5-diimino-3,4-bis(indol-3-yl)hexanedioic acid",
                "beta-aminoorceimine",
                "porphyra-334",
                "2-imino-3-(indol-3-yl)propanoic acid",
                "Hemsleyin imine A",
                "5-Imino-2-methyl-1-cyclopenten-1-ol",
                "(4S,5R)-4,5,6-trihydroxy-2-iminohexanoic acid",
                "5-iminohexane-1,2,3,4,6-pentol"
            ],
            "TP": 0,
            "FP": 6,
            "FN": 8
        }
    }
]