[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Adenosine 3',5'-cyclic monophosphate (cAMP)",
            "Guanosine 3',5'-cyclic monophosphate (cGMP)",
            "Cyclic adenosine diphosphate ribose (cADPR)",
            "Cyclic guanosine diphosphate ribose (cGDPR)",
            "Cyclic di-AMP",
            "Cyclic di-GMP",
            "Cyclic di-ADP-ribose",
            "Cyclic AMP-GMP",
            "Cyclic AMP-phosphate",
            "Cyclic GMP-phosphate",
            "Cyclic GMP-AMP",
            "Cyclic AMP-GMP-AMP",
            "Cyclic AMP-GMP-phosphate",
            "Cyclic GMP-AMP-phosphate",
            "Cyclic AMP-GMP-di-AMP",
            "Cyclic GMP-di-AMP",
            "Cyclic AMP-di-AMP",
            "Cyclic AMP-GMP-di-GMP",
            "Cyclic GMP-di-GMP",
            "Cyclic AMP-di-GMP",
            "Cyclic AMP-GMP-di-ADP-ribose",
            "Cyclic GMP-di-ADP-ribose",
            "Cyclic AMP-di-ADP-ribose",
            "Cyclic AMP-GMP-cADPR"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclic di-AMP",
                "Cyclic di-GMP",
                "Cyclic GMP-AMP"
            ],
            "mismatches": [
                "Adenosine 3',5'-cyclic monophosphate (cAMP)",
                "Guanosine 3',5'-cyclic monophosphate (cGMP)",
                "Cyclic adenosine diphosphate ribose (cADPR)",
                "Cyclic guanosine diphosphate ribose (cGDPR)",
                "Cyclic di-ADP-ribose",
                "Cyclic AMP-GMP",
                "Cyclic AMP-phosphate",
                "Cyclic GMP-phosphate",
                "Cyclic AMP-GMP-AMP",
                "Cyclic AMP-GMP-phosphate",
                "Cyclic GMP-AMP-phosphate",
                "Cyclic AMP-GMP-di-AMP",
                "Cyclic GMP-di-AMP",
                "Cyclic AMP-di-AMP",
                "Cyclic AMP-GMP-di-GMP",
                "Cyclic GMP-di-GMP",
                "Cyclic AMP-di-GMP",
                "Cyclic AMP-GMP-di-ADP-ribose",
                "Cyclic GMP-di-ADP-ribose",
                "Cyclic AMP-di-ADP-ribose",
                "Cyclic AMP-GMP-cADPR"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic GMP",
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic GMP",
                "3',5'-cyclic dGMP",
                "Adenosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "c-di-GMP",
                "cyclic ADP-beta-D-ribose",
                "cyclic di-AMP",
                "cyclic purine dinucleotide",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Cyclic adenosine diphosphate ribose (cADPR)",
            "Cyclic guanosine diphosphate ribose (cGDPR)",
            "Cyclic adenosine diphosphate (cADP)",
            "Cyclic guanosine diphosphate (cGDP)",
            "Cyclic nucleotide-gated (CNG) channels",
            "Protein kinase A (PKA)",
            "Protein kinase G (PKG)",
            "Phosphodiesterases (PDEs)",
            "Exchange proteins activated by cAMP (EPACs)",
            "Cyclic AMP-dependent transcription factors",
            "Cyclic GMP-dependent protein kinase (PKG)",
            "Cyclic nucleotide phosphodiesterase 5 (PDE5)",
            "Cyclic nucleotide phosphodiesterase 6 (PDE6)",
            "Cyclic nucleotide phosphodiesterase 9 (PDE9)",
            "Cyclic nucleotide phosphodiesterase 10 (PDE10)",
            "Cyclic nucleotide phosphodiesterase 11 (PDE11)",
            "Cyclic nucleotide phosphodiesterase 12 (PDE12)",
            "Cyclic nucleotide phosphodiesterase 13 (PDE13)",
            "Cyclic nucleotide phosphodiesterase 4 (PDE4)",
            "Cyclic nucleotide phosphodiesterase 3 (PDE3)",
            "Cyclic nucleotide phosphodiesterase 7 (PDE7)",
            "Cyclic nucleotide phosphodiesterase 8 (PDE8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclic adenosine monophosphate (cAMP)",
                "Cyclic guanosine monophosphate (cGMP)",
                "Cyclic adenosine diphosphate ribose (cADPR)",
                "Cyclic guanosine diphosphate ribose (cGDPR)",
                "Cyclic adenosine diphosphate (cADP)",
                "Cyclic guanosine diphosphate (cGDP)",
                "Cyclic nucleotide-gated (CNG) channels",
                "Protein kinase A (PKA)",
                "Protein kinase G (PKG)",
                "Phosphodiesterases (PDEs)",
                "Exchange proteins activated by cAMP (EPACs)",
                "Cyclic AMP-dependent transcription factors",
                "Cyclic GMP-dependent protein kinase (PKG)",
                "Cyclic nucleotide phosphodiesterase 5 (PDE5)",
                "Cyclic nucleotide phosphodiesterase 6 (PDE6)",
                "Cyclic nucleotide phosphodiesterase 9 (PDE9)",
                "Cyclic nucleotide phosphodiesterase 10 (PDE10)",
                "Cyclic nucleotide phosphodiesterase 11 (PDE11)",
                "Cyclic nucleotide phosphodiesterase 12 (PDE12)",
                "Cyclic nucleotide phosphodiesterase 13 (PDE13)",
                "Cyclic nucleotide phosphodiesterase 4 (PDE4)",
                "Cyclic nucleotide phosphodiesterase 3 (PDE3)",
                "Cyclic nucleotide phosphodiesterase 7 (PDE7)",
                "Cyclic nucleotide phosphodiesterase 8 (PDE8)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic nucleotide",
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic AMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "8-nitroguanosine 3',5'-cyclic monophosphate",
                "Adenosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cyclic ADP-beta-D-ribose",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic Adenosine Monophosphate (cAMP)",
            "Cyclic Guanosine Monophosphate (cGMP)",
            "Cyclic Inosine Monophosphate (cIMP)",
            "Cyclic Cytidine Monophosphate (cCMP)",
            "Cyclic Uridine Monophosphate (cUMP)",
            "Cyclic Thymidine Monophosphate (cTMP)",
            "Cyclic Dideoxyadenosine Monophosphate",
            "Cyclic Dideoxyguanosine Monophosphate",
            "Cyclic Dideoxyinosine Monophosphate",
            "Cyclic Dideoxycytidine Monophosphate",
            "Cyclic Dideoxyuridine Monophosphate",
            "Cyclic Dideoxythymidine Monophosphate",
            "Cyclic 3',5'-Adenosine Monophosphate",
            "Cyclic 2',3'-Adenosine Monophosphate",
            "Cyclic 3',5'-Guanosine Monophosphate",
            "Cyclic 2',3'-Guanosine Monophosphate",
            "Cyclic 3',5'-Inosine Monophosphate",
            "Cyclic 2',3'-Inosine Monophosphate",
            "Cyclic 3',5'-Cytidine Monophosphate",
            "Cyclic 2',3'-Cytidine Monophosphate",
            "Cyclic 3',5'-Uridine Monophosphate",
            "Cyclic 2',3'-Uridine Monophosphate",
            "Cyclic 3',5'-Thymidine Monophosphate",
            "Cyclic 2',3'-Thymidine Monophosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclic 2',3'-Adenosine Monophosphate",
                "Cyclic 2',3'-Cytidine Monophosphate"
            ],
            "mismatches": [
                "Cyclic Adenosine Monophosphate (cAMP)",
                "Cyclic Guanosine Monophosphate (cGMP)",
                "Cyclic Inosine Monophosphate (cIMP)",
                "Cyclic Cytidine Monophosphate (cCMP)",
                "Cyclic Uridine Monophosphate (cUMP)",
                "Cyclic Thymidine Monophosphate (cTMP)",
                "Cyclic Dideoxyadenosine Monophosphate",
                "Cyclic Dideoxyguanosine Monophosphate",
                "Cyclic Dideoxyinosine Monophosphate",
                "Cyclic Dideoxycytidine Monophosphate",
                "Cyclic Dideoxyuridine Monophosphate",
                "Cyclic Dideoxythymidine Monophosphate",
                "Cyclic 3',5'-Adenosine Monophosphate",
                "Cyclic 3',5'-Guanosine Monophosphate",
                "Cyclic 3',5'-Inosine Monophosphate",
                "Cyclic 2',3'-Inosine Monophosphate",
                "Cyclic 3',5'-Cytidine Monophosphate",
                "Cyclic 3',5'-Uridine Monophosphate",
                "Cyclic 2',3'-Uridine Monophosphate",
                "Cyclic 3',5'-Thymidine Monophosphate",
                "Cyclic 2',3'-Thymidine Monophosphate"
            ],
            "true_referents": [
                "2',3'-cyclic purine nucleotide",
                "2',3'-cyclic pyrimidine nucleotide",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "3',5'-cyclic pyrimidine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 2,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Cyclic uridine monophosphate (cUMP)",
            "Cyclic cytidine monophosphate (cCMP)",
            "Cyclic inosine monophosphate (cIMP)",
            "Cyclic thymidine monophosphate (cTMP)",
            "Cyclic deoxyadenosine monophosphate (dcAMP)",
            "Cyclic deoxyguanosine monophosphate (dcGMP)",
            "Cyclic deoxyuridine monophosphate (dcUMP)",
            "Cyclic deoxycytidine monophosphate (dcCMP)",
            "Cyclic deoxyinosine monophosphate (dcIMP)",
            "Cyclic deoxythymidine monophosphate (dcTMP)",
            "Cyclic adenosine diphosphate (cADP)",
            "Cyclic guanosine diphosphate (cGDP)",
            "Cyclic uridine diphosphate (cUDP)",
            "Cyclic cytidine diphosphate (cCDP)",
            "Cyclic inosine diphosphate (cIDP)",
            "Cyclic thymidine diphosphate (cTDP)",
            "3',5'-Cyclic adenosine monophosphate (3',5'-cAMP)",
            "3',5'-Cyclic guanosine monophosphate (3',5'-cGMP)",
            "2',3'-Cyclic adenosine monophosphate (2',3'-cAMP)",
            "2',3'-Cyclic guanosine monophosphate (2',3'-cGMP)",
            "Cyclic GMP-PMP (cGMP-PMP)",
            "Cyclic GMP-PCP (cGMP-PCP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "3',5'-Cyclic adenosine monophosphate (3',5'-cAMP)",
                "3',5'-Cyclic guanosine monophosphate (3',5'-cGMP)",
                "2',3'-Cyclic adenosine monophosphate (2',3'-cAMP)"
            ],
            "mismatches": [
                "Cyclic adenosine monophosphate (cAMP)",
                "Cyclic guanosine monophosphate (cGMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic cytidine monophosphate (cCMP)",
                "Cyclic inosine monophosphate (cIMP)",
                "Cyclic thymidine monophosphate (cTMP)",
                "Cyclic deoxyadenosine monophosphate (dcAMP)",
                "Cyclic deoxyguanosine monophosphate (dcGMP)",
                "Cyclic deoxyuridine monophosphate (dcUMP)",
                "Cyclic deoxycytidine monophosphate (dcCMP)",
                "Cyclic deoxyinosine monophosphate (dcIMP)",
                "Cyclic deoxythymidine monophosphate (dcTMP)",
                "Cyclic adenosine diphosphate (cADP)",
                "Cyclic guanosine diphosphate (cGDP)",
                "Cyclic uridine diphosphate (cUDP)",
                "Cyclic cytidine diphosphate (cCDP)",
                "Cyclic inosine diphosphate (cIDP)",
                "Cyclic thymidine diphosphate (cTDP)",
                "2',3'-Cyclic guanosine monophosphate (2',3'-cGMP)",
                "Cyclic GMP-PMP (cGMP-PMP)",
                "Cyclic GMP-PCP (cGMP-PCP)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic nucleotide",
                "3',5'-cyclic AMP",
                "3',5'-cyclic GMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "N(1)-methyl-cGMP",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic Adenosine Monophosphate (cAMP)",
            "Cyclic Guanosine Monophosphate (cGMP)",
            "Cyclic Cytidine Monophosphate (cCMP)",
            "Cyclic Uridine Monophosphate (cUMP)",
            "Cyclic Inosine Monophosphate (cIMP)",
            "Cyclic Xanthosine Monophosphate (cXMP)",
            "Cyclic Thymidine Monophosphate (cTMP)",
            "Cyclic Deoxyadenosine Monophosphate (c-dAMP)",
            "Cyclic Deoxyguanosine Monophosphate (c-dGMP)",
            "Cyclic Deoxycytidine Monophosphate (c-dCMP)",
            "Cyclic Deoxyuridine Monophosphate (c-dUMP)",
            "Cyclic Deoxyinosine Monophosphate (c-dIMP)",
            "Cyclic Deoxyxanthosine Monophosphate (c-dXMP)",
            "Cyclic Deoxythymidine Monophosphate (c-dTMP)",
            "Cyclic 2',3'-Adenosine Monophosphate (c2,3-AMP)",
            "Cyclic 2',3'-Guanosine Monophosphate (c2,3-GMP)",
            "Cyclic 2',3'-Cytidine Monophosphate (c2,3-CMP)",
            "Cyclic 2',3'-Uridine Monophosphate (c2,3-UMP)",
            "Cyclic 2',3'-Inosine Monophosphate (c2,3-IMP)",
            "Cyclic 2',3'-Xanthosine Monophosphate (c2,3-XMP)",
            "Cyclic 2',3'-Thymidine Monophosphate (c2,3-TMP)",
            "Cyclic 3',5'-Adenosine Monophosphate (c3,5-AMP)",
            "Cyclic 3',5'-Guanosine Monophosphate (c3,5-GMP)",
            "Cyclic 3',5'-Cytidine Monophosphate (c3,5-CMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclic Adenosine Monophosphate (cAMP)",
                "Cyclic Guanosine Monophosphate (cGMP)",
                "Cyclic Cytidine Monophosphate (cCMP)",
                "Cyclic Uridine Monophosphate (cUMP)",
                "Cyclic Inosine Monophosphate (cIMP)",
                "Cyclic Xanthosine Monophosphate (cXMP)",
                "Cyclic Thymidine Monophosphate (cTMP)",
                "Cyclic Deoxyadenosine Monophosphate (c-dAMP)",
                "Cyclic Deoxyguanosine Monophosphate (c-dGMP)",
                "Cyclic Deoxycytidine Monophosphate (c-dCMP)",
                "Cyclic Deoxyuridine Monophosphate (c-dUMP)",
                "Cyclic Deoxyinosine Monophosphate (c-dIMP)",
                "Cyclic Deoxyxanthosine Monophosphate (c-dXMP)",
                "Cyclic Deoxythymidine Monophosphate (c-dTMP)",
                "Cyclic 2',3'-Adenosine Monophosphate (c2,3-AMP)",
                "Cyclic 2',3'-Guanosine Monophosphate (c2,3-GMP)",
                "Cyclic 2',3'-Cytidine Monophosphate (c2,3-CMP)",
                "Cyclic 2',3'-Uridine Monophosphate (c2,3-UMP)",
                "Cyclic 2',3'-Inosine Monophosphate (c2,3-IMP)",
                "Cyclic 2',3'-Xanthosine Monophosphate (c2,3-XMP)",
                "Cyclic 2',3'-Thymidine Monophosphate (c2,3-TMP)",
                "Cyclic 3',5'-Adenosine Monophosphate (c3,5-AMP)",
                "Cyclic 3',5'-Guanosine Monophosphate (c3,5-GMP)",
                "Cyclic 3',5'-Cytidine Monophosphate (c3,5-CMP)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic GMP",
                "2',3'-cyclic purine nucleotide",
                "2',3'-cyclic pyrimidine nucleotide",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "8-nitroguanosine 3',5'-cyclic monophosphate",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Adenosine monophosphate (AMP)",
            "Adenosine diphosphate (ADP)",
            "Adenosine triphosphate (ATP)",
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Guanosine monophosphate (GMP)",
            "Guanosine diphosphate (GDP)",
            "Guanosine triphosphate (GTP)",
            "Cyclic guanosine diphosphate (cGDP)",
            "Cyclic adenosine diphosphate (cADP)",
            "Cyclic inosine monophosphate (cIMP)",
            "Cyclic cytidine monophosphate (cCMP)",
            "Cyclic uridine monophosphate (cUMP)",
            "Cyclic adenosine-5'-monophosphate (cAMP)",
            "Cyclic guanosine-5'-monophosphate (cGMP)",
            "Cyclic adenosine-5'-diphosphate (cADP)",
            "Cyclic guanosine-5'-diphosphate (cGDP)",
            "Cyclic inosine-5'-monophosphate (cIMP)",
            "Cyclic cytidine-5'-monophosphate (cCMP)",
            "Cyclic uridine-5'-monophosphate (cUMP)",
            "Adenosine-5'-monophosphate (AMP)",
            "Guanosine-5'-monophosphate (GMP)",
            "Cyclic 3',5'-adenosine monophosphate (cAMP)",
            "Cyclic 3',5'-guanosine monophosphate (cGMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclic 3',5'-guanosine monophosphate (cGMP)"
            ],
            "mismatches": [
                "Adenosine monophosphate (AMP)",
                "Adenosine diphosphate (ADP)",
                "Adenosine triphosphate (ATP)",
                "Cyclic adenosine monophosphate (cAMP)",
                "Guanosine monophosphate (GMP)",
                "Guanosine diphosphate (GDP)",
                "Guanosine triphosphate (GTP)",
                "Cyclic guanosine diphosphate (cGDP)",
                "Cyclic adenosine diphosphate (cADP)",
                "Cyclic inosine monophosphate (cIMP)",
                "Cyclic cytidine monophosphate (cCMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic adenosine-5'-monophosphate (cAMP)",
                "Cyclic guanosine-5'-monophosphate (cGMP)",
                "Cyclic adenosine-5'-diphosphate (cADP)",
                "Cyclic guanosine-5'-diphosphate (cGDP)",
                "Cyclic inosine-5'-monophosphate (cIMP)",
                "Cyclic cytidine-5'-monophosphate (cCMP)",
                "Cyclic uridine-5'-monophosphate (cUMP)",
                "Adenosine-5'-monophosphate (AMP)",
                "Guanosine-5'-monophosphate (GMP)",
                "Cyclic 3',5'-adenosine monophosphate (cAMP)"
            ],
            "true_referents": [
                "3',5'-cyclic GMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 1,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Adenosine Monophosphate (AMP)",
            "Cyclic Adenosine Monophosphate (cAMP)",
            "Guanosine Monophosphate (GMP)",
            "Cyclic Guanosine Monophosphate (cGMP)",
            "Uridine Monophosphate (UMP)",
            "Cyclic Uridine Monophosphate (cUMP)",
            "Cytidine Monophosphate (CMP)",
            "Cyclic Cytidine Monophosphate (cCMP)",
            "Thymidine Monophosphate (TMP)",
            "Cyclic Thymidine Monophosphate (cTMP)",
            "Inosine Monophosphate (IMP)",
            "Cyclic Inosine Monophosphate (cIMP)",
            "Xanthosine Monophosphate (XMP)",
            "Cyclic Xanthosine Monophosphate (cXMP)",
            "Deoxyadenosine Monophosphate (dAMP)",
            "Cyclic Deoxyadenosine Monophosphate (cdAMP)",
            "Deoxyguanosine Monophosphate (dGMP)",
            "Cyclic Deoxyguanosine Monophosphate (cdGMP)",
            "Deoxyuridine Monophosphate (dUMP)",
            "Cyclic Deoxyuridine Monophosphate (cdUMP)",
            "Deoxycytidine Monophosphate (dCMP)",
            "Cyclic Deoxycytidine Monophosphate (cdCMP)",
            "Deoxythymidine Monophosphate (dTMP)",
            "Cyclic Deoxythymidine Monophosphate (cdTMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "3',5'-cyclic GMP",
                "3',5'-cyclic UMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic dTMP"
            ],
            "mismatches": [
                "Adenosine Monophosphate (AMP)",
                "Cyclic Adenosine Monophosphate (cAMP)",
                "Guanosine Monophosphate (GMP)",
                "Uridine Monophosphate (UMP)",
                "Cytidine Monophosphate (CMP)",
                "Cyclic Cytidine Monophosphate (cCMP)",
                "Thymidine Monophosphate (TMP)",
                "Cyclic Thymidine Monophosphate (cTMP)",
                "Inosine Monophosphate (IMP)",
                "Cyclic Inosine Monophosphate (cIMP)",
                "Xanthosine Monophosphate (XMP)",
                "Cyclic Xanthosine Monophosphate (cXMP)",
                "Deoxyadenosine Monophosphate (dAMP)",
                "Cyclic Deoxyadenosine Monophosphate (cdAMP)",
                "Deoxyguanosine Monophosphate (dGMP)",
                "Deoxyuridine Monophosphate (dUMP)",
                "Cyclic Deoxyuridine Monophosphate (cdUMP)",
                "Deoxycytidine Monophosphate (dCMP)",
                "Cyclic Deoxycytidine Monophosphate (cdCMP)",
                "Deoxythymidine Monophosphate (dTMP)"
            ],
            "true_referents": [
                "2',3'-cyclic CMP",
                "2',3'-cyclic UMP",
                "3',5'-cyclic GMP",
                "3',5'-cyclic UMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic dTMP",
                "3',5'-cyclic purine nucleotide",
                "3',5'-cyclic pyrimidine nucleotide",
                "8-nitroguanosine 3',5'-cyclic monophosphate",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Cyclic cytidine monophosphate (cCMP)",
            "Cyclic uridine monophosphate (cUMP)",
            "Cyclic thymidine monophosphate (cTMP)",
            "Cyclic inosine monophosphate (cIMP)",
            "Cyclic xanthosine monophosphate (cXMP)",
            "Cyclic hypoxanthine monophosphate (cHMP)",
            "Cyclic deoxyadenosine monophosphate (cdAMP)",
            "Cyclic deoxyguanosine monophosphate (cdGMP)",
            "Cyclic deoxycytidine monophosphate (cdCMP)",
            "Cyclic deoxythymidine monophosphate (cdTMP)",
            "Cyclic deoxyinosine monophosphate (cdIMP)",
            "Cyclic deoxyxanthosine monophosphate (cdXMP)",
            "Cyclic deoxyhypoxanthine monophosphate (cdHMP)",
            "Cyclic adenosine diphosphate ribose (cADPR)",
            "Cyclic guanosine diphosphate ribose (cGDPR)",
            "Cyclic inosine diphosphate ribose (cIDPR)",
            "Cyclic uridine diphosphate ribose (cUDPR)",
            "Cyclic cytidine diphosphate ribose (cCDPR)",
            "Cyclic thymidine diphosphate ribose (cTDPR)",
            "Cyclic adenosine diphosphate ribulose (cADPRulose)",
            "Cyclic guanosine diphosphate ribulose (cGDPRulose)",
            "Cyclic inosine diphosphate ribulose (cIDPRulose)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclic adenosine monophosphate (cAMP)",
                "Cyclic guanosine monophosphate (cGMP)",
                "Cyclic cytidine monophosphate (cCMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic thymidine monophosphate (cTMP)",
                "Cyclic inosine monophosphate (cIMP)",
                "Cyclic xanthosine monophosphate (cXMP)",
                "Cyclic hypoxanthine monophosphate (cHMP)",
                "Cyclic deoxyadenosine monophosphate (cdAMP)",
                "Cyclic deoxyguanosine monophosphate (cdGMP)",
                "Cyclic deoxycytidine monophosphate (cdCMP)",
                "Cyclic deoxythymidine monophosphate (cdTMP)",
                "Cyclic deoxyinosine monophosphate (cdIMP)",
                "Cyclic deoxyxanthosine monophosphate (cdXMP)",
                "Cyclic deoxyhypoxanthine monophosphate (cdHMP)",
                "Cyclic adenosine diphosphate ribose (cADPR)",
                "Cyclic guanosine diphosphate ribose (cGDPR)",
                "Cyclic inosine diphosphate ribose (cIDPR)",
                "Cyclic uridine diphosphate ribose (cUDPR)",
                "Cyclic cytidine diphosphate ribose (cCDPR)",
                "Cyclic thymidine diphosphate ribose (cTDPR)",
                "Cyclic adenosine diphosphate ribulose (cADPRulose)",
                "Cyclic guanosine diphosphate ribulose (cGDPRulose)",
                "Cyclic inosine diphosphate ribulose (cIDPRulose)"
            ],
            "true_referents": [
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cyclic ADP-beta-D-ribose",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Cyclic cytidine monophosphate (cCMP)",
            "Cyclic uridine monophosphate (cUMP)",
            "Cyclic inosine monophosphate (cIMP)",
            "Cyclic thymidine monophosphate (cTMP)",
            "Cyclic di-adenosine monophosphate (c-di-AMP)",
            "Cyclic di-guanosine monophosphate (c-di-GMP)",
            "Cyclic GMP-AMP (cGAMP)",
            "3',3'-cGAMP",
            "2',3'-cGAMP",
            "Cyclic adenosine diphosphate-ribose (cADPR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclic di-guanosine monophosphate (c-di-GMP)",
                "2',3'-cGAMP"
            ],
            "mismatches": [
                "Cyclic adenosine monophosphate (cAMP)",
                "Cyclic guanosine monophosphate (cGMP)",
                "Cyclic cytidine monophosphate (cCMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic inosine monophosphate (cIMP)",
                "Cyclic thymidine monophosphate (cTMP)",
                "Cyclic di-adenosine monophosphate (c-di-AMP)",
                "Cyclic GMP-AMP (cGAMP)",
                "3',3'-cGAMP",
                "Cyclic adenosine diphosphate-ribose (cADPR)"
            ],
            "true_referents": [
                "2',3'-cyclic CMP",
                "2'-3'-cGAMP",
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic IMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "c-di-GMP",
                "cyclic ADP-beta-D-ribose",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 2,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Cyclic cytidine monophosphate (cCMP)",
            "Cyclic uridine monophosphate (cUMP)",
            "Cyclic inosine monophosphate (cIMP)",
            "3',5'-Cyclic AMP",
            "2',3'-Cyclic AMP",
            "3',5'-Cyclic GMP",
            "2',3'-Cyclic GMP",
            "Cyclic diguanylate (c-di-GMP)",
            "Cyclic di-AMP (c-di-AMP)",
            "Cyclic GMP-AMP (cGAMP)",
            "2',3'-cGAMP",
            "3',3'-cGAMP",
            "Cyclic AMP-GMP (cAGMP)",
            "Cyclic di-UMP (c-di-UMP)",
            "Cyclic di-CMP (c-di-CMP)",
            "Cyclic tri-AMP (cAAA)",
            "Cyclic tri-GMP (cGGG)",
            "Cyclic AMP-AMP-GMP (cAAG)",
            "Cyclic GMP-GMP-AMP (cGGA)",
            "8-Bromo-cAMP",
            "8-Chloro-cAMP",
            "Dibutyryl-cAMP (db-cAMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "3',5'-Cyclic AMP",
                "2',3'-Cyclic AMP",
                "3',5'-Cyclic GMP",
                "2',3'-Cyclic GMP",
                "Cyclic diguanylate (c-di-GMP)",
                "Cyclic di-AMP (c-di-AMP)",
                "2',3'-cGAMP",
                "8-Bromo-cAMP"
            ],
            "mismatches": [
                "Cyclic adenosine monophosphate (cAMP)",
                "Cyclic guanosine monophosphate (cGMP)",
                "Cyclic cytidine monophosphate (cCMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic inosine monophosphate (cIMP)",
                "3',3'-cGAMP",
                "Cyclic GMP-AMP (cGAMP)",
                "Cyclic AMP-GMP (cAGMP)",
                "Cyclic di-UMP (c-di-UMP)",
                "Cyclic di-CMP (c-di-CMP)",
                "Cyclic tri-AMP (cAAA)",
                "Cyclic tri-GMP (cGGG)",
                "Cyclic AMP-AMP-GMP (cAAG)",
                "Cyclic GMP-GMP-AMP (cGGA)",
                "8-Chloro-cAMP",
                "Dibutyryl-cAMP (db-cAMP)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic CMP",
                "2',3'-cyclic GMP",
                "2',3'-cyclic UMP",
                "2'-3'-cGAMP",
                "2-(dimethylamino)-cAMP",
                "3',5'-cyclic AMP",
                "3',5'-cyclic CMP",
                "3',5'-cyclic GMP",
                "3',5'-cyclic IMP",
                "3',5'-cyclic UMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "7-deaza-8-chloro-cAMP",
                "8-(4-chlorophenylthio)-cAMP",
                "8-Br-cAMP",
                "8-aza-cAMP",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "N(6)-butyryl-cAMP",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "c-di-GMP",
                "cyclic di-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic adenosine monophosphate (cAMP)",
            "Cyclic guanosine monophosphate (cGMP)",
            "Cyclic inosine monophosphate (cIMP)",
            "Cyclic cytidine monophosphate (cCMP)",
            "Cyclic uridine monophosphate (cUMP)",
            "Cyclic xanthosine monophosphate (cXMP)",
            "Cyclic 7-deazaadenosine monophosphate (c7-deaza-AMP)",
            "Cyclic 7-deazaguanosine monophosphate (c7-deaza-GMP)",
            "Cyclic 7-deazainosine monophosphate (c7-deaza-IMP)",
            "Cyclic 2'-O-methyladenosine monophosphate (c2'-O-Me-AMP)",
            "Cyclic 2'-O-methylguanosine monophosphate (c2'-O-Me-GMP)",
            "Cyclic N6-methyladenosine monophosphate (cN6-Me-AMP)",
            "Cyclic 8-bromoadenosine monophosphate (c8-Br-AMP)",
            "Cyclic 8-bromoguanosine monophosphate (c8-Br-GMP)",
            "Cyclic diadensosine monophosphate (c-di-AMP)",
            "Cyclic diguanosine monophosphate (c-di-GMP)",
            "Cyclic adenosine diphosphate ribose (cADPR)",
            "Cyclic guanosine diphosphate ribose (cGDPR)",
            "Cyclic inosine diphosphate ribose (cIDPR)",
            "Cyclic cytidine diphosphate ribose (cCDPR)",
            "Cyclic uridine diphosphate ribose (cUDPR)",
            "Cyclic xanthosine diphosphate ribose (cXDPR)",
            "Cyclic adenosine triphosphate (cATP)",
            "Cyclic guanosine triphosphate (cGTP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "7-deaza-cGMP",
                "8-bromo-3',5'-cyclic GMP",
                "cyclic di-AMP"
            ],
            "mismatches": [
                "Cyclic adenosine monophosphate (cAMP)",
                "Cyclic guanosine monophosphate (cGMP)",
                "Cyclic inosine monophosphate (cIMP)",
                "Cyclic cytidine monophosphate (cCMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic xanthosine monophosphate (cXMP)",
                "Cyclic 7-deazaadenosine monophosphate (c7-deaza-AMP)",
                "Cyclic 7-deazainosine monophosphate (c7-deaza-IMP)",
                "Cyclic 2'-O-methyladenosine monophosphate (c2'-O-Me-AMP)",
                "Cyclic 2'-O-methylguanosine monophosphate (c2'-O-Me-GMP)",
                "Cyclic N6-methyladenosine monophosphate (cN6-Me-AMP)",
                "Cyclic 8-bromoadenosine monophosphate (c8-Br-AMP)",
                "Cyclic diguanosine monophosphate (c-di-GMP)",
                "Cyclic adenosine diphosphate ribose (cADPR)",
                "Cyclic guanosine diphosphate ribose (cGDPR)",
                "Cyclic inosine diphosphate ribose (cIDPR)",
                "Cyclic cytidine diphosphate ribose (cCDPR)",
                "Cyclic uridine diphosphate ribose (cUDPR)",
                "Cyclic xanthosine diphosphate ribose (cXDPR)",
                "Cyclic adenosine triphosphate (cATP)",
                "Cyclic guanosine triphosphate (cGTP)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic purine nucleotide",
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic AMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "7-deaza-cGMP",
                "8-bromo-3',5'-cyclic GMP",
                "8-nitroguanosine 3',5'-cyclic monophosphate",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "N(1)-methyl-cGMP",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "cyclic ADP-beta-D-ribose",
                "cyclic di-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic Adenosine Monophosphate (cAMP)",
            "Cyclic Guanosine Monophosphate (cGMP)",
            "Cyclic Cytidine Monophosphate (cCMP)",
            "Cyclic Uridine Monophosphate (cUMP)",
            "Cyclic Inosine Monophosphate (cIMP)",
            "Cyclic Xanthosine Monophosphate (cXMP)",
            "Cyclic Deoxyadenosine Monophosphate (cDamp)",
            "Cyclic Deoxyguanosine Monophosphate (cDgmp)",
            "Cyclic Deoxycytidine Monophosphate (cDcmp)",
            "Cyclic Deoxyuridine Monophosphate (cDump)",
            "Cyclic Deoxyinosine Monophosphate (cDimp)",
            "Cyclic Deoxyxanthosine Monophosphate (cDxmp)",
            "Cyclic Adenosine Diphosphate Ribose (cADPR)",
            "Cyclic Guanosine Diphosphate Ribose (cGDPR)",
            "Cyclic Cytidine Diphosphate Ribose (cCDPR)",
            "Cyclic Uridine Diphosphate Ribose (cUDPR)",
            "Cyclic Inosine Diphosphate Ribose (cIDPR)",
            "Cyclic Xanthosine Diphosphate Ribose (cXDPR)",
            "Cyclic Deoxyadenosine Diphosphate Ribose (cDaDPR)",
            "Cyclic Deoxyguanosine Diphosphate Ribose (cDgDPR)",
            "Cyclic Deoxycytidine Diphosphate Ribose (cDcDPR)",
            "Cyclic Deoxyuridine Diphosphate Ribose (cDuDPR)",
            "Cyclic Deoxyinosine Diphosphate Ribose (cDiDPR)",
            "Cyclic Deoxyxanthosine Diphosphate Ribose (cDxDPR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclic Adenosine Monophosphate (cAMP)",
                "Cyclic Guanosine Monophosphate (cGMP)",
                "Cyclic Cytidine Monophosphate (cCMP)",
                "Cyclic Uridine Monophosphate (cUMP)",
                "Cyclic Inosine Monophosphate (cIMP)",
                "Cyclic Xanthosine Monophosphate (cXMP)",
                "Cyclic Deoxyadenosine Monophosphate (cDamp)",
                "Cyclic Deoxyguanosine Monophosphate (cDgmp)",
                "Cyclic Deoxycytidine Monophosphate (cDcmp)",
                "Cyclic Deoxyuridine Monophosphate (cDump)",
                "Cyclic Deoxyinosine Monophosphate (cDimp)",
                "Cyclic Deoxyxanthosine Monophosphate (cDxmp)",
                "Cyclic Adenosine Diphosphate Ribose (cADPR)",
                "Cyclic Guanosine Diphosphate Ribose (cGDPR)",
                "Cyclic Cytidine Diphosphate Ribose (cCDPR)",
                "Cyclic Uridine Diphosphate Ribose (cUDPR)",
                "Cyclic Inosine Diphosphate Ribose (cIDPR)",
                "Cyclic Xanthosine Diphosphate Ribose (cXDPR)",
                "Cyclic Deoxyadenosine Diphosphate Ribose (cDaDPR)",
                "Cyclic Deoxyguanosine Diphosphate Ribose (cDgDPR)",
                "Cyclic Deoxycytidine Diphosphate Ribose (cDcDPR)",
                "Cyclic Deoxyuridine Diphosphate Ribose (cDuDPR)",
                "Cyclic Deoxyinosine Diphosphate Ribose (cDiDPR)",
                "Cyclic Deoxyxanthosine Diphosphate Ribose (cDxDPR)"
            ],
            "true_referents": [
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cyclic ADP-beta-D-ribose",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Adenosine 3',5'-cyclic monophosphate (cAMP)",
            "Guanosine 3',5'-cyclic monophosphate (cGMP)",
            "Inosine 3',5'-cyclic monophosphate (cIMP)",
            "Cytidine 3',5'-cyclic monophosphate (cCMP)",
            "Uridine 3',5'-cyclic monophosphate (cUMP)",
            "Thymidine 3',5'-cyclic monophosphate (cTMP)",
            "Cyclic adenosine diphosphate ribose (cADPR)",
            "Nicotinic acid adenine dinucleotide phosphate (NAADP)",
            "Cyclic pyridine nucleotide (cPyN)",
            "Cyclic purine nucleotide (cPuN)",
            "Cyclic dinucleotide (c-di-NMP)",
            "Cyclic guanylate (c-di-GMP)",
            "Cyclic AMP-GMP (cAMP-GMP)",
            "Cyclic ADP-ribose (cADPR)",
            "Cyclic IDP-ribose (cIDPR)",
            "Cyclic GDP-ribose (cGDPR)",
            "Cyclic UDP-ribose (cUDPR)",
            "Cyclic TDP-ribose (cTDPR)",
            "Cyclic CDP-ribose (cCDPR)",
            "Cyclic dinucleotide phosphate-AMP (c-di-AMP)",
            "Cyclic dinucleotide phosphate-GMP (c-di-GMP)",
            "Cyclic dinucleotide phosphate-IMP (c-di-IMP)",
            "Cyclic dinucleotide phosphate-CMP (c-di-CMP)",
            "Cyclic dinucleotide phosphate-UMP (c-di-UMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclic purine nucleotide (cPuN)",
                "Cyclic guanylate (c-di-GMP)",
                "Cyclic dinucleotide phosphate-AMP (c-di-AMP)",
                "Cyclic dinucleotide phosphate-GMP (c-di-GMP)"
            ],
            "mismatches": [
                "Adenosine 3',5'-cyclic monophosphate (cAMP)",
                "Guanosine 3',5'-cyclic monophosphate (cGMP)",
                "Inosine 3',5'-cyclic monophosphate (cIMP)",
                "Cytidine 3',5'-cyclic monophosphate (cCMP)",
                "Uridine 3',5'-cyclic monophosphate (cUMP)",
                "Thymidine 3',5'-cyclic monophosphate (cTMP)",
                "Cyclic adenosine diphosphate ribose (cADPR)",
                "Nicotinic acid adenine dinucleotide phosphate (NAADP)",
                "Cyclic pyridine nucleotide (cPyN)",
                "Cyclic dinucleotide (c-di-NMP)",
                "Cyclic AMP-GMP (cAMP-GMP)",
                "Cyclic ADP-ribose (cADPR)",
                "Cyclic IDP-ribose (cIDPR)",
                "Cyclic GDP-ribose (cGDPR)",
                "Cyclic UDP-ribose (cUDPR)",
                "Cyclic TDP-ribose (cTDPR)",
                "Cyclic CDP-ribose (cCDPR)",
                "Cyclic dinucleotide phosphate-IMP (c-di-IMP)",
                "Cyclic dinucleotide phosphate-CMP (c-di-CMP)",
                "Cyclic dinucleotide phosphate-UMP (c-di-UMP)"
            ],
            "true_referents": [
                "2',3'-cyclic CMP",
                "2'-phospho-cyclic ADP-ribose",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "N(2),N(2)-dimethyl-cGMP",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "c-GMP-AMP",
                "c-di-GMP",
                "cyclic ADP-beta-D-ribose",
                "cyclic di-AMP",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cyclic pyrimidine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate",
                "nucleoside 3',5'-cyclic phosphate"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "Cyclic Adenosine Monophosphate (cAMP)",
            "Cyclic Guanosine Monophosphate (cGMP)",
            "Cyclic Uridine Monophosphate (cUMP)",
            "Cyclic Inosine Monophosphate (cIMP)",
            "Cyclic Adenosine Diphosphate (cADP)",
            "Cyclic Guanosine Diphosphate (cGDP)",
            "Cyclic Adenosine Triphosphate (cATP)",
            "Cyclic Guanosine Triphosphate (cGTP)",
            "Cyclic Nucleotide Phosphodiesterase (PDE)",
            "Cyclic Nucleotide-Gated Ion Channel",
            "Cyclic Nucleotide-Dependent Protein Kinase (PKA)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase (PP2C)",
            "Cyclic Nucleotide-Dependent Protein Ser/Thr Kinase (CK1)",
            "Cyclic Nucleotide-Dependent Protein Tyr Kinase (CK2)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 1 (PP1)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 2A (PP2A)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 2B (PP2B)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 3 (PP3)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 4 (PP4)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 5 (PP5)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 6 (PP6)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 7 (PP7)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 8 (PP8)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 9 (PP9)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 10 (PP10)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 11 (PP11)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 12 (PP12)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 13 (PP13)",
            "Cyclic Nucleotide-Dependent Protein Phosphatase 14 (PP14)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Cyclic Adenosine Monophosphate (cAMP)",
                "Cyclic Guanosine Monophosphate (cGMP)",
                "Cyclic Uridine Monophosphate (cUMP)",
                "Cyclic Inosine Monophosphate (cIMP)",
                "Cyclic Adenosine Diphosphate (cADP)",
                "Cyclic Guanosine Diphosphate (cGDP)",
                "Cyclic Adenosine Triphosphate (cATP)",
                "Cyclic Guanosine Triphosphate (cGTP)",
                "Cyclic Nucleotide Phosphodiesterase (PDE)",
                "Cyclic Nucleotide-Gated Ion Channel",
                "Cyclic Nucleotide-Dependent Protein Kinase (PKA)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase (PP2C)",
                "Cyclic Nucleotide-Dependent Protein Ser/Thr Kinase (CK1)",
                "Cyclic Nucleotide-Dependent Protein Tyr Kinase (CK2)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 1 (PP1)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 2A (PP2A)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 2B (PP2B)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 3 (PP3)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 4 (PP4)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 5 (PP5)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 6 (PP6)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 7 (PP7)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 8 (PP8)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 9 (PP9)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 10 (PP10)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 11 (PP11)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 12 (PP12)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 13 (PP13)",
                "Cyclic Nucleotide-Dependent Protein Phosphatase 14 (PP14)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic nucleotide",
                "3',5'-cyclic AMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "8-nitroguanosine 3',5'-cyclic monophosphate",
                "Adenosine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 0,
            "FP": 29,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            "cyclic adenosine monophosphate (cAMP)",
            "cyclic guanosine monophosphate (cGMP)",
            "cyclic inosine monophosphate (cIMP)",
            "cyclic xanthosine monophosphate (cXMP)",
            "cyclic thymidine monophosphate (cTMP)",
            "cyclic uridine monophosphate (cUMP)",
            "cyclic cytidine monophosphate (cCMP)",
            "cyclic guanosine 3',5'-monophosphate (cGMP)",
            "adenosine 3',5'-cyclic monophosphate (cAMP)",
            "guanosine 3',5'-cyclic monophosphate (cGMP)",
            "inosine 3',5'-cyclic monophosphate (cIMP)",
            "xanthosine 3',5'-cyclic monophosphate (cXMP)",
            "thymidine 3',5'-cyclic monophosphate (cTMP)",
            "uridine 3',5'-cyclic monophosphate (cUMP)",
            "cytidine 3',5'-cyclic monophosphate (cCMP)",
            "2',3'-cyclic AMP (2',3'-cAMP)",
            "3',5'-cyclic AMP (3',5'-cAMP)",
            "2',3'-cyclic GMP (2',3'-cGMP)",
            "3',5'-cyclic GMP (3',5'-cGMP)",
            "2',3'-cyclic IMP (2',3'-cIMP)",
            "3',5'-cyclic IMP (3',5'-cIMP)",
            "2',3'-cyclic XMP (2',3'-cXMP)",
            "3',5'-cyclic XMP (3',5'-cXMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic GMP",
                "3',5'-cyclic AMP",
                "3',5'-cyclic GMP",
                "3',5'-cyclic IMP"
            ],
            "mismatches": [
                "cyclic adenosine monophosphate (cAMP)",
                "cyclic guanosine monophosphate (cGMP)",
                "cyclic inosine monophosphate (cIMP)",
                "cyclic xanthosine monophosphate (cXMP)",
                "cyclic thymidine monophosphate (cTMP)",
                "cyclic uridine monophosphate (cUMP)",
                "cyclic cytidine monophosphate (cCMP)",
                "cyclic guanosine 3',5'-monophosphate (cGMP)",
                "adenosine 3',5'-cyclic monophosphate (cAMP)",
                "guanosine 3',5'-cyclic monophosphate (cGMP)",
                "inosine 3',5'-cyclic monophosphate (cIMP)",
                "xanthosine 3',5'-cyclic monophosphate (cXMP)",
                "thymidine 3',5'-cyclic monophosphate (cTMP)",
                "uridine 3',5'-cyclic monophosphate (cUMP)",
                "cytidine 3',5'-cyclic monophosphate (cCMP)",
                "2',3'-cyclic IMP (2',3'-cIMP)",
                "2',3'-cyclic XMP (2',3'-cXMP)",
                "3',5'-cyclic XMP (3',5'-cXMP)"
            ],
            "true_referents": [
                "2',3'-cyclic AMP",
                "2',3'-cyclic CMP",
                "2',3'-cyclic GMP",
                "3',5'-cyclic AMP",
                "3',5'-cyclic CMP",
                "3',5'-cyclic GMP",
                "3',5'-cyclic IMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic dTMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic monophosphoric acid",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cyclic purine dinucleotide",
                "cyclic purine nucleotide",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate",
                "guanosine-5'-phosphate-2',3'-cyclic phosphate"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "cyclic nucleotide",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Adenosine monophosphate (AMP)",
                "Canonical name": "(AMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic guanosine monophosphate (cGMP)",
                "Canonical name": "(cGMP)"
            },
            {
                "Referent": "Cyclic inosine monophosphate (cIMP)",
                "Canonical name": "(cIMP)"
            },
            {
                "Referent": "Cyclic thymidine monophosphate (cTMP)",
                "Canonical name": "(cTMP)"
            },
            {
                "Referent": "Cyclic uridine monophosphate (cUMP)",
                "Canonical name": "(cUMP)"
            },
            {
                "Referent": "Cyclic cytidine monophosphate (cCMP)",
                "Canonical name": "(cCMP)"
            },
            {
                "Referent": "Cyclic diguanosine monophosphate (cGMP)",
                "Canonical name": "(cGMP)"
            },
            {
                "Referent": "Cyclic guanosine monophosphate (cGMP)",
                "Canonical name": "(cGMP)"
            },
            {
                "Referent": "Cyclic guanosine monophosphate (cGMP)",
                "Canonical name": "(cGMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            },
            {
                "Referent": "Cyclic adenosine monophosphate (cAMP)",
                "Canonical name": "(cAMP)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "3',5'-cyclic AMP",
                "3',5'-cyclic dGMP"
            ],
            "mismatches": [
                "Adenosine monophosphate (AMP)",
                "Cyclic inosine monophosphate (cIMP)",
                "Cyclic thymidine monophosphate (cTMP)",
                "Cyclic uridine monophosphate (cUMP)",
                "Cyclic cytidine monophosphate (cCMP)"
            ],
            "true_referents": [
                "3',5'-cyclic AMP",
                "3',5'-cyclic dGMP",
                "3',5'-cyclic purine nucleotide",
                "Adenosine 2',3'-cyclic phosphate",
                "Cytidine 2',3'-cyclic phosphate",
                "Inosine 2',3'-cyclic phosphate",
                "N(1)-methyl-cGMP",
                "N(2),N(2)-dimethyl-cGMP",
                "adenosine-5'-phosphate-2',3'-cyclic phosphate",
                "cytidine 5'-phosphate 2',3'-cyclic phosphate"
            ],
            "TP": 2,
            "FP": 5,
            "FN": 0
        }
    }
]