[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "APOE (APOE)",
            "EGFR (EGFR)",
            "MYC (MYC)",
            "BRAF (BRAF)",
            "VEGFA (VEGFA)",
            "PDGFRA (PDGFRA)",
            "HER2 (ERBB2)",
            "PTEN (PTEN)",
            "JAK2 (JAK2)",
            "FLT3 (FLT3)",
            "KIT (KIT)",
            "BCL2 (BCL2)",
            "CDH1 (CDH1)",
            "CFTR (CFTR)",
            "GJB2 (GJB2)",
            "SCN5A (SCN5A)",
            "LRP5 (LRP5)",
            "IGF1 (IGF1)",
            "KCNJ11 (KCNJ11)",
            "PSEN1 (PSEN1)",
            "PSEN2 (PSEN2)",
            "SMAD4 (SMAD4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "APOE",
                "EGFR",
                "MYC",
                "BRAF",
                "VEGFA",
                "PDGFRA",
                "PTEN",
                "JAK2",
                "FLT3",
                "KIT",
                "CDH1",
                "CFTR",
                "SCN5A",
                "LRP5",
                "IGF1",
                "KCNJ11",
                "PSEN1",
                "PSEN2",
                "SMAD4"
            ],
            "mismatches": [
                "BRCA1",
                "BCL2",
                "GJB2",
                "HER2"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BCL2 like 10 (BCL2L10 aka BCL-B, Boo, Diva, bcl2-L-10)",
                "BCL2 like 11 (BCL2L11 aka BAM, BIM, BOD)",
                "BCL2 like 12 (BCL2L12)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FLT3 interacting zinc finger 1 (FIZ1 aka ZNF798)",
                "Janus kinase 1 (JAK1 aka AIIDEA, JAK1B, JTK3, JAK1)",
                "Janus kinase 2 (JAK2 aka JTK10)",
                "Janus kinase 3 (JAK3 aka JAK-3_HUMAN, JAKL, L-JAK, LJAK, JAK3)",
                "KIT proto-oncogene, receptor tyrosine kinase (KIT aka C-Kit, CD117, MASTC, PBT, SCFR)",
                "LDL receptor related protein 3 (LRP3)",
                "LDL receptor related protein 5 (LRP5 aka BMND1, EVR1, EVR4, HBM, LR3, LRP-5, LRP-7, LRP7, OPPG, OPS, OPTA1, PCLD4, VBCH2)",
                "LRP2 binding protein (LRP2BP)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "SMAD family member 1 (SMAD1 aka BSP-1, BSP1, JV4-1, JV41, MADH1, MADR1)",
                "SMAD family member 4 (SMAD4 aka DPC4, JIP, MADH4, MYHRS)",
                "SMAD family member 6 (SMAD6 aka AOVD2, HsT17432, MADH6, MADH7)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "cadherin 1 (CDH1 aka Arc-1, BCDS1, CD324, CDHE, ECAD, LCAM, UVO)",
                "cadherin 7 (CDH7 aka CDH7L1)",
                "cadherin 9 (CDH9)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "fms related receptor tyrosine kinase 3 (FLT3 aka CD135, FLK-2, FLK2, STK1)",
                "fms related receptor tyrosine kinase 3 ligand (FLT3LG aka FL, FLG3L, FLT3L, IMD125)",
                "gap junction protein beta 1 (GJB1 aka CMTX, CMTX1, CX32)",
                "gap junction protein beta 5 (GJB5 aka CX31.1)",
                "glutathione S-transferase alpha 2 (GSTA2 aka GST2-2, GTA2, GTH2, GSTA2)",
                "heat shock protein family A (Hsp70) member 2 (HSPA2 aka HSP70-2, HSP70-3)",
                "insulin like growth factor 1 (IGF1 aka IGF, IGF-I, IGFI, MGF)",
                "insulin like growth factor 1 receptor (IGF1R aka CD221, IGFIR, IGFR, JTK13)",
                "insulin like growth factor binding protein 1 (IGFBP1 aka AFBP, IBP1, IGF-BP25, PP12, hIGFBP-1)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "mesogenin 1 (MSGN1 aka MSOG, pMsgn1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "netrin 5 (NTN5)",
                "paired box 4 (PAX4 aka KPD, MODY9)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "platelet derived growth factor receptor alpha (PDGFRA aka CD140A, PDGFR-2, PDGFR2)",
                "platelet derived growth factor receptor like (PDGFRL aka PDGRL, PRLTS)",
                "platelet derived growth factor subunit A (PDGFA aka PDGF-A, PDGF1)",
                "potassium inwardly rectifying channel subfamily J member 1 (KCNJ1 aka KIR1.1, ROMK, ROMK1)",
                "potassium inwardly rectifying channel subfamily J member 10 (KCNJ10 aka BIRK-10, KCNJ13-PEN, KIR1.2, KIR4.1, SESAME)",
                "potassium inwardly rectifying channel subfamily J member 11 (KCNJ11 aka BIR, HHF2, IKATP, KIR6.2, MODY13, PHHI, PNDM2, TNDM3)",
                "presenilin 1 (PSEN1 aka ACNINV3, AD3, CMD1U, FAD, PS-1, PS1, PSNL1, S182)",
                "presenilin 2 (PSEN2 aka AD3L, AD4, CMD1V, PS2, STM2)",
                "presenilin enhancer, gamma-secretase subunit (PSENEN aka ACNINV2, MDS033, MSTP064, PEN-2, PEN2)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "schlafen family member 5 (SLFN5)",
                "sodium voltage-gated channel alpha subunit 5 (SCN5A aka CDCD2, CMD1E, CMPD2, HB1, HB2, HBBD, HH1, ICCD, IVF, LQT3, Nav1.5, PFHB1, SSS1, VF1)",
                "tektin 4 (TEKT4)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "ubiquitin conjugating enzyme E2 J2 (UBE2J2 aka NCUBE-2, NCUBE2, PRO2121, UBC6)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor D (VEGFD aka FIGF, VEGF-D)"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (Breast Cancer 1, early onset)",
            "TP53 (Tumor protein p53)",
            "EGFR (Epidermal growth factor receptor)",
            "MYC (MYC proto-oncogene, bHLH transcription factor)",
            "AKT1 (AKT serine/threonine kinase 1)",
            "BRAF (B-Raf proto-oncogene, serine/threonine kinase)",
            "PTEN (Phosphatase and tensin homolog)",
            "KRAS (Kirsten rat sarcoma viral oncogene homolog)",
            "MAP2K1 (Mitogen-activated protein kinase kinase 1)",
            "CDKN2A (Cyclin-dependent kinase inhibitor 2A)",
            "APOE (Apolipoprotein E)",
            "APOB (Apolipoprotein B)",
            "INS (Insulin)",
            "IGF1 (Insulin-like growth factor 1)",
            "VEGFA (Vascular endothelial growth factor A)",
            "TNF (Tumor necrosis factor)",
            "IL6 (Interleukin 6)",
            "HBB (Hemoglobin subunit beta)",
            "HBA1 (Hemoglobin subunit alpha 1)",
            "CFTR (Cystic fibrosis transmembrane conductance regulator)",
            "FMR1 (Fragile X mental retardation 1)",
            "DMD (Dystrophin)",
            "HFE (Hemochromatosis protein)",
            "APP (Amyloid beta A4 precursor protein)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1",
                "TP53",
                "EGFR",
                "MYC",
                "AKT1",
                "BRAF",
                "PTEN",
                "KRAS",
                "MAP2K1",
                "CDKN2A",
                "APOE",
                "APOB",
                "INS",
                "IGF1",
                "VEGFA",
                "TNF",
                "IL6",
                "HBB",
                "HBA1",
                "CFTR",
                "FMR1",
                "DMD",
                "HFE",
                "APP"
            ],
            "mismatches": [],
            "true_referents": [
                "A-Raf proto-oncogene, serine/threonine kinase (ARAF aka A-RAF1, PKS2, RAFA1, ARAF)",
                "AKT serine/threonine kinase 1 (AKT1 aka AKT, PKB, PKB-ALPHA, PRKBA, RAC, RAC-ALPHA)",
                "AKT serine/threonine kinase 2 (AKT2 aka HIHGHH, PKBB, PKBBETA, PRKBB, RAC-BETA)",
                "AKT serine/threonine kinase 3 (AKT3 aka MPPH, MPPH2, PKB-GAMMA, PKBG, PRKBG, RAC-PK-gamma, RAC-gamma, STK-2)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FMR1 autosomal homolog 1 (FXR1 aka CMYO9A, CMYO9B, CMYP9A, CMYP9BP, MYOPMIL, MYORIBF, FXR1)",
                "FMR1 autosomal homolog 2 (FXR2 aka FMR1L2P, FXR2)",
                "HRas proto-oncogene, GTPase (HRAS aka C-BAS/HAS, C-H-RAS, C-HA-RAS1, CTLO, H-RASIDX, HAMSV1, RASH1, p21ras, HRAS)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MAPK activated protein kinase 2 (MAPKAPK2 aka MAPKAP-K2, MK-2, MK2)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYCL proto-oncogene, bHLH transcription factor (MYCL aka L-Myc, LMYC1, bHLHe38, MYCL)",
                "MYCN proto-oncogene, bHLH transcription factor (MYCN aka FGLDS1, MODED, MPAPAsORF, MYCNsPEP, N-myc, NMYC, ODED, bHLHe37, MYCN)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "amyloid beta precursor like protein 1 (APLP1 aka APLP)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein B (APOB aka FCHL2, FLDB, LDLCQ4, apoB-100, apoB-48)",
                "apolipoprotein B receptor (APOBR aka APOB100R, APOB48R)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "cyclin dependent kinase inhibitor 2A (CDKN2A aka ARF, CAI2, CDK4I, CDKN2, CMM2, INK4, INK4A, MLM, MTS-1, MTS1, P14, P14ARF, P16, P16-INK4A, P16INK4, P16INK4A, P19, P19ARF, TP16)",
                "cyclin dependent kinase inhibitor 2D (CDKN2D aka INK4D, p19, p19-INK4D)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "fragile X messenger ribonucleoprotein 1 (FMR1 aka FMRP, FRAXA, POF, POF1)",
                "hemoglobin subunit alpha 1 (HBA1 aka ECYT7, HBA-T3, HBH, METHBA)",
                "hemoglobin subunit alpha 2 (HBA2 aka ECYT7, HBA-T2, HBH)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "hepcidin antimicrobial peptide (HAMP aka HEPC, HFE2B, LEAP1, PLTR)",
                "homeostatic iron regulator (HFE aka HFE1, HH, HLA-H, MVCD7, TFQTL2)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin like growth factor 1 (IGF1 aka IGF, IGF-I, IGFI, MGF)",
                "insulin like growth factor 1 receptor (IGF1R aka CD221, IGFIR, IGFR, JTK13)",
                "insulin like growth factor 2 (IGF2 aka C11orf43, GRDF, IGF-II, PP9974, SRS3)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 5 (IL5 aka EDF, IL-5, TRF)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "iron responsive element binding protein 2 (IREB2 aka ACO3, IRE-BP 2, IRE-BP2, IRP2, IRP2AD, NDCAMA)",
                "mitogen-activated protein kinase kinase 1 (MAP2K1 aka CFC3, MAPKK1, MEK1, MEL, MKK1, PRKMK1)",
                "mitogen-activated protein kinase kinase 2 (MAP2K2 aka CFC4, MAPKK2, MEK2, MKK2, PRKMK2)",
                "muscle RAS oncogene homolog (MRAS aka M-RAs, NS11, R-RAS3, RRAS3)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "transmembrane phosphatase with tensin homology (TPTE aka CT44, PTEN21, TPTE)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "EGFR (EGFR)",
            "BRCA2 (BRCA2)",
            "CFTR (CFTR)",
            "HBB (HBB)",
            "HBA1 (HBA1)",
            "HBA2 (HBA2)",
            "APOE (APOE)",
            "CFH (CFH)",
            "SLC2A1 (SLC2A1)",
            "HBB (HBB)",
            "HBA1 (HBA1)",
            "HBA2 (HBA2)",
            "HER2 (ERBB2)",
            "MYC (MYC)",
            "KIT (KIT)",
            "RET (RET)",
            "RB1 (RB1)",
            "NF1 (NF1)",
            "VHL (VHL)",
            "PTEN (PTEN)",
            "APC (APC)",
            "BMPR2 (BMPR2)",
            "FGFR3 (FGFR3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "BRCA2",
                "CFTR",
                "HBB",
                "HBA1",
                "HBA2",
                "APOE",
                "HER2",
                "MYC",
                "KIT",
                "RET",
                "RB1",
                "PTEN",
                "BMPR2"
            ],
            "mismatches": [
                "BRCA1",
                "CFH",
                "SLC2A1",
                "VHL",
                "NF1",
                "APC",
                "FGFR3"
            ],
            "true_referents": [
                "APC down-regulated 1 like (APCDD1L)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BMP2 inducible kinase (BMP2K aka BIKE, HRIHFB2017)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "KIT proto-oncogene, receptor tyrosine kinase (KIT aka C-Kit, CD117, MASTC, PBT, SCFR)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "NBPF member 1 (NBPF1 aka AB13, AB14, AB23, AD2, NBG, NBPF)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RB transcriptional corepressor 1 (RB1 aka OSRC, PPP1R130, RB, p105-Rb, p110-RB1, pRb, pp110)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "RELT like 1 (RELL1)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "VHL binding protein 1 (VBP1 aka HIBBJ46, PFD3, PFDN3, VBP-1)",
                "VHL like (VHLL aka VHLP, VLP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "anaphase promoting complex subunit 2 (ANAPC2 aka APC2)",
                "anaphase promoting complex subunit 5 (ANAPC5 aka APC5)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "bone morphogenetic protein receptor type 1A (BMPR1A aka 10q23del, ACVRLK3, ALK-3, ALK3, BMPR-1A, CD292, SKR5)",
                "bone morphogenetic protein receptor type 2 (BMPR2 aka BMPR-II, BMPR3, BMR2, BRK-3, POVD1, PPH1, T-ALK)",
                "complement factor H related 2 (CFHR2 aka CFHL2, FHR2, HFL3)",
                "complement factor H related 4 (CFHR4 aka CFHL4, FHR-4, FHR4)",
                "complement factor H related 5 (CFHR5 aka CFHL5D, FHR-5, FHR5, CFHR5)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "hemoglobin subunit alpha 1 (HBA1 aka ECYT7, HBA-T3, HBH, METHBA)",
                "hemoglobin subunit alpha 2 (HBA2 aka ECYT7, HBA-T2, HBH)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "high density lipoprotein binding protein (HDLBP aka HBP, PRO2900, VGL)",
                "inhibin subunit beta B (INHBB)",
                "jade family PHD finger 1 (JADE1 aka PHF17)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "neurofibromin 1 (NF1 aka NFNS, VRNF, WSS)",
                "paired box 4 (PAX4 aka KPD, MODY9)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "repetin (RPTN)",
                "ret proto-oncogene (RET aka CDHF12, CDHR16, HSCR1, MEN2A, MEN2B, MTC1, PTC-ELE1, RET)",
                "solute carrier family 2 member 11 (SLC2A11 aka GLUT10, GLUT11)",
                "solute carrier family 2 member 12 (SLC2A12 aka GLUT12, GLUT8)",
                "solute carrier family 2 member 2 (SLC2A2 aka GLUT2)",
                "tektin 4 (TEKT4)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "ubiquitin B (UBB aka HEL-S-50)"
            ],
            "TP": 15,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Hemoglobin subunit beta (HBB)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Insulin (INS)",
            "Growth Hormone (GH)",
            "Tumor Protein p53 (TP53)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Actin, beta (ACTB)",
            "Tubulin, alpha (TUBA)",
            "Myoglobin (MYOG)",
            "Collagen, type I alpha 1 (COL1A1)",
            "Dystrophin (DMD)",
            "Factor VIII (F8)",
            "Albumin (ALB)",
            "Immunoglobulin G heavy chain (IGHG1)",
            "Major Histocompatibility Complex, Class I, A (HLA-A)",
            "Sodium/Potassium ATPase subunit alpha 1 (ATP1A1)",
            "Acetylcholinesterase (ACHE)",
            "Dopamine Receptor D2 (DRD2)",
            "Serotonin Receptor 5-HT1A (HTR1A)",
            "Glutamate Receptor, Ionotropic, AMPA 1 (GRIA1)",
            "Programmed cell death protein 1 (PDCD1)",
            "Cytotoxic T-lymphocyte-associated protein 4 (CTLA4)",
            "Interleukin-2 (IL2)",
            "Transforming growth factor beta 1 (TGFB1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemoglobin subunit beta (HBB)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Insulin (INS)",
                "Tumor Protein p53 (TP53)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "Actin, beta (ACTB)",
                "Myoglobin (MB)",
                "Collagen, type I alpha 1 (COL1A1)",
                "Dystrophin (DMD)",
                "Albumin (ALB)",
                "Immunoglobulin G heavy chain (IGHG1)",
                "Major Histocompatibility Complex, Class I, A (HLA-A)",
                "Sodium/Potassium ATPase subunit alpha 1 (ATP1A1)",
                "Acetylcholinesterase (ACHE)",
                "Dopamine Receptor D2 (DRD2)",
                "Serotonin Receptor 5-HT1A (HTR1A)",
                "Glutamate Receptor, Ionotropic, AMPA 1 (GRIA1)",
                "Programmed cell death protein 1 (PDCD1)",
                "Cytotoxic T-lymphocyte-associated protein 4 (CTLA4)",
                "Interleukin-2 (IL2)"
            ],
            "mismatches": [
                "Growth Hormone (GH)",
                "Tubulin, alpha (TUBA)",
                "Factor VIII (F8)",
                "Transforming growth factor beta 1 (TGFB1)",
                "Myoglobin (MYOG)"
            ],
            "true_referents": [
                "5-hydroxytryptamine receptor 1A (HTR1A aka 5-HT-1A, 5-HT1A, 5HT1a, ADRB2RL1, ADRBRL1, G-21, PFMCD)",
                "5-hydroxytryptamine receptor 1E (HTR1E aka 5-HT1E)",
                "5-hydroxytryptamine receptor 5A (HTR5A aka 5-HT5A)",
                "ATPase H+/K+ transporting subunit alpha (ATP4A aka ATP6A)",
                "ATPase Na+/K+ transporting subunit alpha 1 (ATP1A1 aka CMT2DD, HOMGSMR2)",
                "ATPase Na+/K+ transporting subunit alpha 4 (ATP1A4 aka ATP1A1, ATP1AL2)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "acetylcholinesterase (Yt blood group) (ACHE aka ACEE, ARACHE, N-ACHE, YT)",
                "actin beta (ACTB aka BKRNS, BNS, BRWS1, CSMH, DDS1, PS1TP5BP1, THC8)",
                "actin beta like 2 (ACTBL2 aka ACT)",
                "afamin (AFM aka ALB2, ALBA, ALF)",
                "albumin (ALB aka FDAHT, HSA, PRO0883, PRO0903, PRO1341)",
                "butyrylcholinesterase (BCHE aka BCHED, CHE1, CHE2, E1)",
                "capping actin protein of muscle Z-line subunit beta (CAPZB aka CAPB, CAPPB, CAPZ)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor VIII (F8 aka AHF, DXS1253EB, F8C, FVIII, HEMA, THPH13, F8)",
                "coagulation factor VIII associated 1 (F8A1 aka DXS522E, F8A, HAP40)",
                "coagulation factor VIII associated 2 (F8A2 aka HAP40)",
                "collagen like tail subunit of asymmetric acetylcholinesterase (COLQ aka CMS5, EAD)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type II alpha 1 chain (COL2A1 aka ANFH, AOM, COL11A3, SEDC, STL1)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cytoglobin (CYGB aka HGB, NOD, STAP)",
                "cytotoxic T-lymphocyte associated protein 4 (CTLA4 aka ALPS5, CD, CD152, CELIAC3, CTLA-4, GRD4, GSE, IDDM12)",
                "dopamine receptor D2 (DRD2 aka D2DR, D2R)",
                "dopamine receptor D4 (DRD4 aka D4DR)",
                "dopamine receptor D5 (DRD5 aka DBDR, DRD1B, DRD1L2)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "glutamate ionotropic receptor AMPA type subunit 1 (GRIA1 aka GLUH1, GLUR1, GLURA, GluA1, HBGR1, MRD67, MRT76)",
                "glutamate ionotropic receptor AMPA type subunit 2 (GRIA2 aka GLUR2, GLURB, GluA2, GluR-K2, HBGR2, NEDLIB, gluR-2, gluR-B)",
                "glutamate ionotropic receptor AMPA type subunit 3 (GRIA3 aka GLUR-C, GLUR-K3, GLUR3, GLURC, GluA3, MRX94, MRXSW, iGluR3)",
                "growth hormone 1 (GH1 aka GH, GH-N, GHB5, GHN, IGHD1A, IGHD1B, IGHD2, hGH-N)",
                "growth hormone 2 (GH2 aka GH-V, GHB2, GHL, GHV, hGH-V)",
                "growth hormone receptor (GHR aka GHBP, GHIP)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "immunoglobulin heavy constant alpha 1 (IGHA1 aka IgA1)",
                "immunoglobulin heavy constant gamma 1 (G1m marker) (IGHG1)",
                "immunoglobulin heavy constant gamma P (non-functional) (IGHGP aka IGHGP1)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 2 (IL2 aka IL-2, TCGF, lymphokine)",
                "interleukin 25 (IL25 aka IL17E)",
                "interleukin 5 (IL5 aka EDF, IL-5, TRF)",
                "major histocompatibility complex, class I, A (HLA-A aka HLAA)",
                "major histocompatibility complex, class I, G (HLA-G aka MHC-G)",
                "major histocompatibility complex, class II, DR alpha (HLA-DRA aka HLA-DRA1)",
                "major histocompatibility complex, class II, DR beta 4 (HLA-DRB4 aka DR4, DRB4, HLA-DR4B, HLA-DRB*, HLA-DRB4)",
                "myoglobin (MB aka MYOSB, PVALB)",
                "myosin X (MYO10 aka MyoX)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "parvalbumin (PVALB aka D22S749)",
                "programmed cell death 1 (PDCD1 aka AIMTBS, CD279, PD-1, PD1, SLEB2, hPD-1, hPD-l, hSLE1)",
                "programmed cell death 4 (PDCD4 aka H731)",
                "programmed cell death 7 (PDCD7 aka 59K, ES18, HES18)",
                "transforming growth factor alpha (TGFA aka TFGA)",
                "transforming growth factor beta 2 (TGFB2 aka G-TSF, LDS4, TGF-beta2)",
                "transforming growth factor beta 3 (TGFB3 aka ARVD, ARVD1, LDS5, RNHF, TGF-beta3)",
                "tubulin alpha 1c (TUBA1C aka TUBA6, bcm948)",
                "tubulin alpha 3c (TUBA3C aka TUBA2, bA408E5.3)",
                "tubulin alpha 3d (TUBA3D aka H2-ALPHA, KTCN9, TUBA2)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)"
            ],
            "TP": 20,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Hemoglobin subunit beta (HBB)",
            "Cystic fibrosis transmembrane conductance regulator (CFTR)",
            "Dystrophin (DMD)",
            "Breast cancer type 1 susceptibility protein (BRCA1)",
            "Breast cancer type 2 susceptibility protein (BRCA2)",
            "Insulin (INS)",
            "Tumor protein p53 (TP53)",
            "Myelin basic protein (MBP)",
            "Huntingtin (HTT)",
            "Apolipoprotein E (APOE)",
            "Collagen type I alpha 1 chain (COL1A1)",
            "Rhodopsin (RHO)",
            "Factor VIII (F8)",
            "Phenylalanine hydroxylase (PAH)",
            "Glucokinase (GCK)",
            "Keratin 1 (KRT1)",
            "Neurofibromin 1 (NF1)",
            "Androgen receptor (AR)",
            "Vascular endothelial growth factor A (VEGFA)",
            "Epidermal growth factor receptor (EGFR)",
            "Alpha-1-antitrypsin (SERPINA1)",
            "C-reactive protein (CRP)",
            "Cytochrome P450 2D6 (CYP2D6)",
            "Glycogen synthase kinase 3 beta (GSK3B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemoglobin subunit beta (HBB)",
                "Cystic fibrosis transmembrane conductance regulator (CFTR)",
                "Dystrophin (DMD)",
                "Insulin (INS)",
                "Tumor protein p53 (TP53)",
                "Myelin basic protein (MBP)",
                "Huntingtin (HTT)",
                "Apolipoprotein E (APOE)",
                "Collagen type I alpha 1 chain (COL1A1)",
                "Rhodopsin (RHO)",
                "Phenylalanine hydroxylase (PAH)",
                "Glucokinase (GCK)",
                "Keratin 1 (KRT1)",
                "Neurofibromin 1 (NF1)",
                "Androgen receptor (AR)",
                "Vascular endothelial growth factor A (VEGFA)",
                "Epidermal growth factor receptor (EGFR)",
                "C-reactive protein (CRP)",
                "Cytochrome P450 2D6 (CYP2D6)",
                "Glycogen synthase kinase 3 beta (GSK3B)"
            ],
            "mismatches": [
                "Breast cancer type 1 susceptibility protein (BRCA1)",
                "Breast cancer type 2 susceptibility protein (BRCA2)",
                "Factor VIII (F8)",
                "Alpha-1-antitrypsin (SERPINA1)"
            ],
            "true_referents": [
                "ADP dependent glucokinase (ADPGK aka 2610017G09Rik, ADP-GK)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "C-reactive protein (CRP aka PTX1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "androgen receptor (AR aka AIS8, DHTR, HUMARA, HYSP1, KD, NR3C4, SBMA, SMAX1, TFM, AR)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor VIII (F8 aka AHF, DXS1253EB, F8C, FVIII, HEMA, THPH13, F8)",
                "coagulation factor VIII associated 1 (F8A1 aka DXS522E, F8A, HAP40)",
                "coagulation factor VIII associated 2 (F8A2 aka HAP40)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type I alpha 2 chain (COL1A2 aka EDSARTH2, EDSCV, OI4)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cysteine rich protein 1 (CRIP1 aka CRHP, CRIP, CRP-1, CRP1)",
                "cysteine rich protein 3 (CRIP3 aka CRP-3, TLP, TLP-A, h6LIMo)",
                "cytochrome P450 2D6 (LOC107987479 aka CYP2D6)",
                "cytochrome P450 family 2 subfamily A member 6 (CYP2A6 aka CPA6, CYP2A, CYP2A3, CYPIIA6, P450C2A, P450PB)",
                "cytochrome P450 family 2 subfamily R member 1 (CYP2R1)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "glucokinase (GCK aka FGQTL3, GK, GLK, HHF3, HK4, HKIV, HXKP, LGLK, MODY2, PNDM1)",
                "glucokinase regulator (GCKR aka FGQTL5, GKRP)",
                "glycerol kinase 3 (GK3 aka GK3P, GKP3, GKTB)",
                "glycogen synthase kinase 3 alpha (GSK3A)",
                "glycogen synthase kinase 3 beta (GSK3B)",
                "gonadotropin releasing hormone receptor (GNRHR aka GNRHR1, GRHR, HH7, LHRHR, LRHR)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "keratin 1 (KRT1 aka AEI2, CK1, EHK, EHK1, EPPK, K1A, NEPPK, KRT1)",
                "keratin 76 (KRT76 aka HUMCYT2A, KRT2B, KRT2P)",
                "keratin 77 (KRT77 aka K1B, KRT1B)",
                "myelin associated oligodendrocyte basic protein (MOBP)",
                "myelin basic protein (MBP)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "neurofibromin 1 (NF1 aka NFNS, VRNF, WSS)",
                "neurofilament light chain (NEFL aka CMT1F, CMT2E, CMTDIG, NF-L, NF68, NFL, PPP1R110)",
                "neurofilament medium chain (NEFM aka NEF3, NF-M, NFM)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "peripheral myelin protein 2 (PMP2 aka CMT1G, FABP8, M-FABP, MP2, P2)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "retinal G protein coupled receptor (RGR aka RP44)",
                "retinal pigment epithelium-derived rhodopsin homolog (RRH)",
                "rhodopsin (RHO aka CSNBAD1, OPN2, RP4)",
                "serpin family A member 1 (SERPINA1 aka A1A, A1AT, AAT, PI, PI1, PRO2275, alpha1AT, nNIF)",
                "serpin family A member 11 (SERPINA11)",
                "serpin family A member 3 (SERPINA3 aka AACT, ACT, GIG24, GIG25)",
                "steroid 5 alpha-reductase 1 (SRD5A1 aka S5AR 1)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "TP53 (TP53)",
            "BRCA1 (BRCA1)",
            "BRCA2 (BRCA2)",
            "EGFR (EGFR)",
            "APOE (APOE)",
            "KRAS (KRAS)",
            "MYC (MYC)",
            "PTEN (PTEN)",
            "VEGFA (VEGFA)",
            "TNF (TNF)",
            "IL6 (IL6)",
            "CDKN2A (CDKN2A)",
            "TP63 (TP63)",
            "MAPK1 (MAPK1)",
            "CASP3 (CASP3)",
            "GAPDH (GAPDH)",
            "SOD1 (SOD1)",
            "FTO (FTO)",
            "HLA-A (HLA-A)",
            "HBB (HBB)",
            "CFTR (CFTR)",
            "ACE (ACE)",
            "CCND1 (CCND1)",
            "MTHFR (MTHFR)",
            "P53 (P53)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "BRCA2",
                "EGFR",
                "APOE",
                "KRAS",
                "MYC",
                "PTEN",
                "VEGFA",
                "TNF",
                "IL6",
                "TP63",
                "MAPK1",
                "CASP3",
                "GAPDH",
                "SOD1",
                "FTO",
                "HLA-A",
                "HBB",
                "CFTR",
                "ACE",
                "MTHFR"
            ],
            "mismatches": [
                "BRCA1",
                "CDKN2A",
                "CCND1",
                "P53"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CD63 molecule (CD63 aka AD1, HOP-26, ME491, MLA1, OMA81H, Pltgp40, TSPAN30)",
                "CDKN2A interacting protein (CDKN2AIP)",
                "CDKN2A interacting protein N-terminal like (CDKN2AIPNL aka C2AIL)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FOS like 2, AP-1 transcription factor subunit (FOSL2 aka ACED, FRA2)",
                "FTO alpha-ketoglutarate dependent dioxygenase (FTO aka ALKBH9, BMIQ14, GDFD, IFEX9)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "TCF3 fusion partner (TFPT aka FB1, INO80F, amida)",
                "TNF superfamily member 10 (TNFSF10 aka APO2L, Apo-2L, CD253, TANCR, TL2, TNLG6A, TRAIL)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "aldehyde dehydrogenase 5 family member A1 (ALDH5A1 aka SSADH, SSDH)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "angiotensin I converting enzyme (ACE aka ACE1, CD143, DCP, DCP1)",
                "angiotensin converting enzyme 2 (ACE2 aka ACEH)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "caspase 3 (CASP3 aka CPP32, CPP32B, SCA-1)",
                "caspase 5 (CASP5 aka ICE(rel)III, ICEREL-III, ICH-3)",
                "caspase 6 (CASP6 aka CSP-6, MCH2, caspase-6)",
                "claudin domain containing 2 (CLDND2)",
                "copine 1 (CPNE1 aka COPN1, CPN1)",
                "cortexin domain containing 1 (CTXND1 aka LINC01314)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "folate receptor alpha (FOLR1 aka FBP, FOLR, FRalpha, NCFTD)",
                "glyceraldehyde-3-phosphate dehydrogenase (GAPDH aka G3PD, GAPD, HEL-S-162eP)",
                "glyceraldehyde-3-phosphate dehydrogenase, spermatogenic (GAPDHS aka GAPD2, GAPDH-2, GAPDS, HEL-S-278, HSD-35)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "inhibin subunit beta B (INHBB)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "major histocompatibility complex, class I, A (HLA-A aka HLAA)",
                "major histocompatibility complex, class I, G (HLA-G aka MHC-G)",
                "major histocompatibility complex, class II, DR alpha (HLA-DRA aka HLA-DRA1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "mitogen-activated protein kinase 1 (MAPK1 aka ERK, ERK-2, ERK2, ERT1, MAPK2, NS13, P42MAPK, PRKM1, PRKM2, p38, p40, p41, p41mapk, p42-MAPK)",
                "mitogen-activated protein kinase kinase 1 (MAP2K1 aka CFC3, MAPKK1, MEK1, MEL, MKK1, PRKMK1)",
                "mitogen-activated protein kinase kinase kinase 1 (MAP3K1 aka MAPKKK1, MEKK, MEKK 1, MEKK1, SRXY6)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p63 (TP63 aka AIS, B(p51A), B(p51B), EEC3, KET, LMS, NBP, OFC8, RHS, SHFM4, TP53CP, TP53L, TP73L, p40, p51, p53CP, p63, p73H, p73L)",
                "tumor protein p63 regulated 1 like (TPRG1L aka FAM79A, SVAP30, TPRGL, h-mover, mover)",
                "ubiquitin B (UBB aka HEL-S-50)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor D (VEGFD aka FIGF, VEGF-D)"
            ],
            "TP": 21,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "BRCA1, DNA repair associated (BRCA1)",
            "BRCA2, DNA repair associated (BRCA2)",
            "TP53, tumor protein p53 (TP53)",
            "CFTR, cystic fibrosis transmembrane conductance regulator (CFTR)",
            "EGFR, epidermal growth factor receptor (EGFR)",
            "VEGFA, vascular endothelial growth factor A (VEGFA)",
            "TNF, tumor necrosis factor (TNF)",
            "IL6, interleukin 6 (IL6)",
            "MYC, MYC proto-oncogene, bHLH transcription factor (MYC)",
            "AKT1, AKT serine/threonine kinase 1 (AKT1)",
            "ERBB2, erb-b2 receptor tyrosine kinase 2 (ERBB2)",
            "APC, APC regulator of WNT signaling pathway (APC)",
            "PTEN, phosphatase and tensin homolog (PTEN)",
            "RAS, rat sarcoma viral oncogene homolog (RAS)",
            "CDKN1A, cyclin dependent kinase inhibitor 1A (CDKN1A)",
            "FOXO1, forkhead box O1 (FOXO1)",
            "MDM2, MDM2 proto-oncogene (MDM2)",
            "ATM, ATM serine/threonine kinase (ATM)",
            "HIF1A, hypoxia inducible factor 1 subunit alpha (HIF1A)",
            "MMP9, matrix metallopeptidase 9 (MMP9)",
            "STAT3, signal transducer and activator of transcription 3 (STAT3)",
            "SMAD4, SMAD family member 4 (SMAD4)",
            "DNMT1, DNA methyltransferase 1 (DNMT1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "BRCA1, DNA repair associated (BRCA1)",
                "BRCA2, DNA repair associated (BRCA2)",
                "TP53, tumor protein p53 (TP53)",
                "CFTR, cystic fibrosis transmembrane conductance regulator (CFTR)",
                "EGFR, epidermal growth factor receptor (EGFR)",
                "VEGFA, vascular endothelial growth factor A (VEGFA)",
                "TNF, tumor necrosis factor (TNF)",
                "IL6, interleukin 6 (IL6)",
                "MYC, MYC proto-oncogene, bHLH transcription factor (MYC)",
                "AKT1, AKT serine/threonine kinase 1 (AKT1)",
                "ERBB2, erb-b2 receptor tyrosine kinase 2 (ERBB2)",
                "APC, APC regulator of WNT signaling pathway (APC)",
                "PTEN, phosphatase and tensin homolog (PTEN)",
                "CDKN1A, cyclin dependent kinase inhibitor 1A (CDKN1A)",
                "FOXO1, forkhead box O1 (FOXO1)",
                "MDM2, MDM2 proto-oncogene (MDM2)",
                "ATM, ATM serine/threonine kinase (ATM)",
                "HIF1A, hypoxia inducible factor 1 subunit alpha (HIF1A)",
                "MMP9, matrix metallopeptidase 9 (MMP9)",
                "STAT3, signal transducer and activator of transcription 3 (STAT3)",
                "SMAD4, SMAD family member 4 (SMAD4)",
                "DNMT1, DNA methyltransferase 1 (DNMT1)"
            ],
            "mismatches": [
                "RAS, rat sarcoma viral oncogene homolog (RAS)"
            ],
            "true_referents": [
                "AKT serine/threonine kinase 1 (AKT1 aka AKT, PKB, PKB-ALPHA, PRKBA, RAC, RAC-ALPHA)",
                "AKT serine/threonine kinase 2 (AKT2 aka HIHGHH, PKBB, PKBBETA, PRKBB, RAC-BETA)",
                "AKT serine/threonine kinase 3 (AKT3 aka MPPH, MPPH2, PKB-GAMMA, PKBG, PRKBG, RAC-PK-gamma, RAC-gamma, STK-2)",
                "APC down-regulated 1 (APCDD1 aka B7323, DRAPC1, FP7019, HHS, HTS, HYPT1)",
                "APC regulator of WNT signaling pathway (APC aka BTPS2, DESMD, DP2, DP2.5, DP3, GS, PPP1R46)",
                "APC regulator of WNT signaling pathway 2 (APC2 aka APCL, MRT74)",
                "ATM serine/threonine kinase (ATM aka AT1, ATA, ATC, ATD, ATDC, ATE, TEL1, TELO1)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated ATM activator 1 (BRAT1 aka BAAT1, C7orf27, NEDCAS, RMFSL)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "DNA methyltransferase 1 (DNMT1 aka ADCADN, AIM, CXXC9, DNMT, HSN1E, MCMT, m.HsaI)",
                "DNA methyltransferase 1 associated protein 1 (DMAP1 aka DNMAP1, DNMTAP1, EAF2, MEAF2, SWC4)",
                "DNA methyltransferase 3 beta (DNMT3B aka FSHD4, ICF, ICF1, M.HsaIIIB)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MDM2 binding protein (MTBP aka MDM2BP)",
                "MDM2 proto-oncogene (MDM2 aka ACTFS, HDMX, LSKB, hdm2)",
                "MDM4 regulator of p53 (MDM4 aka BMFS6, HDMX, MDMX, MRP1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYCL proto-oncogene, bHLH transcription factor (MYCL aka L-Myc, LMYC1, bHLHe38, MYCL)",
                "MYCN proto-oncogene, bHLH transcription factor (MYCN aka FGLDS1, MODED, MPAPAsORF, MYCNsPEP, N-myc, NMYC, ODED, bHLHe37, MYCN)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS like proto-oncogene A (RALA aka HINCONS, RAL)",
                "SMAD family member 1 (SMAD1 aka BSP-1, BSP1, JV4-1, JV41, MADH1, MADR1)",
                "SMAD family member 4 (SMAD4 aka DPC4, JIP, MADH4, MYHRS)",
                "SMAD family member 9 (SMAD9 aka MADH6, MADH9, PPH2, SMAD8, SMAD8/9, SMAD8A, SMAD8B)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cyclin dependent kinase 1 (CDK1 aka CDC2, CDC28A, P34CDC2)",
                "cyclin dependent kinase inhibitor 1A (CDKN1A aka CAP20, CDKN1, CIP1, MDA-6, P21, SDI1, WAF1, p21CIP1)",
                "cyclin dependent kinase inhibitor 1B (CDKN1B aka CDKN4, KIP1, MEN1B, MEN4, P27KIP1)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "forkhead box O1 (FOXO1 aka FKH1, FKHRA, FOXO1)",
                "forkhead box O3 (FOXO3 aka AF6q21, FKHRL1, FKHRL1P2, FOXO2A, FOXO3)",
                "forkhead box O6 (FOXO6)",
                "hypoxia inducible factor 1 subunit alpha (HIF1A aka HIF-1-alpha, HIF-1A, HIF-1alpha, HIF1, HIF1-ALPHA, MOP1, PASD8, bHLHe78)",
                "hypoxia inducible factor 1 subunit alpha inhibitor (HIF1AN aka FIH1)",
                "hypoxia inducible factor 3 subunit alpha (HIF3A aka HIF-3A, HIF3-alpha-1, IPAS, MOP7, PASD7, bHLHe17)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 2 (IL2 aka IL-2, TCGF, lymphokine)",
                "interleukin 5 (IL5 aka EDF, IL-5, TRF)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "matrix metallopeptidase 24 (MMP24 aka MMP-24, MMP25, MT-MMP 5, MT-MMP5, MT5-MMP, MT5MMP, MTMMP5)",
                "matrix metallopeptidase 26 (MMP26)",
                "matrix metallopeptidase 9 (MMP9 aka CLG4B, GELB, MANDP2, MMP-9)",
                "muscle RAS oncogene homolog (MRAS aka M-RAs, NS11, R-RAS3, RRAS3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "signal transducer and activator of transcription 1 (STAT1 aka CANDF7, IMD31A, IMD31B, IMD31C, ISGF-3, STAT91)",
                "signal transducer and activator of transcription 3 (STAT3 aka ADMIO, ADMIO1, APRF, HIES)",
                "signal transducer and activator of transcription 6 (STAT6 aka D12S1644, HIES6, IL-4-STATB, STAT6C, STAT6)",
                "transmembrane phosphatase with tensin homology (TPTE aka CT44, PTEN21, TPTE)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (HGNC:1100)",
            "TP53 (HGNC:11998)",
            "EGFR (HGNC:3236)",
            "PTEN (HGNC:9588)",
            "KRAS (HGNC:6407)",
            "BRAF (HGNC:1097)",
            "HER2 (HGNC:11998)",
            "VEGFA (HGNC:12680)",
            "AKT1 (HGNC:391)",
            "MTOR (HGNC:3942)",
            "EGF (HGNC:3236)",
            "IL6 (HGNC:6018)",
            "TNF (HGNC:11892)",
            "INS (HGNC:6093)",
            "GAPDH (HGNC:4141)",
            "ACTB (HGNC:333)",
            "MYC (HGNC:7553)",
            "CDKN1A (HGNC:1787)",
            "PTGS2 (HGNC:9608)",
            "ESR1 (HGNC:3467)",
            "FOXP2 (HGNC:3803)",
            "HBB (HGNC:4827)",
            "CFTR (HGNC:1884)",
            "COL1A1 (HGNC:2197)",
            "FMR1 (HGNC:3775)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "PTEN",
                "KRAS",
                "BRAF",
                "VEGFA",
                "AKT1",
                "IL6",
                "TNF",
                "INS",
                "GAPDH",
                "MYC",
                "CDKN1A",
                "PTGS2",
                "ESR1",
                "FOXP2",
                "HBB",
                "CFTR",
                "COL1A1"
            ],
            "mismatches": [
                "BRCA1",
                "HER2",
                "MTOR",
                "EGF",
                "ACTB",
                "FMR1"
            ],
            "true_referents": [
                "AKT serine/threonine kinase 1 (AKT1 aka AKT, PKB, PKB-ALPHA, PRKBA, RAC, RAC-ALPHA)",
                "AKT serine/threonine kinase 2 (AKT2 aka HIHGHH, PKBB, PKBBETA, PRKBB, RAC-BETA)",
                "AKT serine/threonine kinase 3 (AKT3 aka MPPH, MPPH2, PKB-GAMMA, PKBG, PRKBG, RAC-PK-gamma, RAC-gamma, STK-2)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "CDKN1A interacting zinc finger protein 1 (CIZ1 aka LSFR1, NP94, ZNF356)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "D-2-hydroxyglutarate dehydrogenase (D2HGDH aka D2HGD)",
                "EGF like domain multiple 6 (EGFL6 aka MAEG, W80)",
                "ESX homeobox 1 (ESX1 aka ESX1L, ESXR1)",
                "G protein subunit beta 1 (GNB1 aka HG2A, MDS, MRD42)",
                "G protein subunit beta 3 (GNB3 aka CSNB1H, HG2D)",
                "GINS complex subunit 2 (GINS2 aka HSPC037, PSF2, Pfs2)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MTOR associated protein, eak-7 homolog (MEAK7 aka EAK7, KIAA1609, TLDC1, mEAK-7)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "MYCN proto-oncogene, bHLH transcription factor (MYCN aka FGLDS1, MODED, MPAPAsORF, MYCNsPEP, N-myc, NMYC, ODED, bHLHe37, MYCN)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RPTOR independent companion of MTOR complex 2 (RICTOR aka AVO3, PIA, hAVO3)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "TNF superfamily member 18 (TNFSF18 aka AITRL, GITRL, TL6, TNLG2A, hGITRL)",
                "TNF superfamily member 9 (TNFSF9 aka 4-1BB-L, CD137L, TNLG5A)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 1 (TP53TG1 aka LINC00096, NCRNA00096, P53TG1, P53TG1-D, TP53AP1, TP53LC12)",
                "actin beta like 2 (ACTBL2 aka ACT)",
                "actin gamma 1 (ACTG1 aka ACT, ACTG, DFNA20, DFNA26, HEL-176)",
                "actin like 6B (ACTL6B aka ACTL6, BAF53B, DEE76, EIEE76, IDDSSAD, SMARCN2, arpNalpha)",
                "codanin 1 (CDAN1 aka CDA1, CDAIA, DLT, PRO1295, CDAN1)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type XX alpha 1 chain (COL20A1)",
                "collagen type XXI alpha 1 chain (COL21A1 aka COLA1L, FP633)",
                "cryptic, EGF-CFC family member 1 (CFC1 aka CFC1B, CRYPTIC, DTGA2, HTX2)",
                "cyclin dependent kinase inhibitor 1A (CDKN1A aka CAP20, CDKN1, CIP1, MDA-6, P21, SDI1, WAF1, p21CIP1)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "estrogen receptor 1 (ESR1 aka ER, ESR, ESRA, ESTRR, Era, NR3A1)",
                "estrogen related receptor alpha (ESRRA aka ERR1, ERRa, ERRalpha, ESRL1, NR3B1)",
                "forkhead box P1 (FOXP1 aka 12CC4, HSPC215, MFH, QRF1, hFKH1B)",
                "forkhead box P2 (FOXP2 aka CAGH44, SPCH1, TNRC10)",
                "forkhead box P3 (FOXP3 aka AIID, DIETER, IPEX, JM2, PIDX, XPID)",
                "glyceraldehyde-3-phosphate dehydrogenase (GAPDH aka G3PD, GAPD, HEL-S-162eP)",
                "glyceraldehyde-3-phosphate dehydrogenase, spermatogenic (GAPDHS aka GAPD2, GAPDH-2, GAPDS, HEL-S-278, HSD-35)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin induced gene 1 (INSIG1 aka CL6)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 6 receptor (IL6R aka CD126, HIES5, IL-1Ra, IL-6R, IL-6R-1, IL-6RA, IL6Q, IL6QTLA, IL6RQ, gp80, IL6R)",
                "ninein (NIN aka SCKL7)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "prostaglandin-endoperoxide synthase 2 (PTGS2 aka COX-2, COX2, GRIPGHS, PGG/HS, PGHS-2, PHS-2, hCox-2)",
                "protein tyrosine phosphatase non-receptor type 4 (PTPN4 aka MEG, PTPMEG, PTPMEG1)",
                "regulator of G protein signaling 2 (RGS2 aka G0S8)",
                "regulatory associated protein of MTOR complex 1 (RPTOR aka KOG1, Mip1)",
                "solute carrier family 25 member 52 (SLC25A52 aka MCART2)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 19,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Tumor Protein P53 (TP53)",
            "Breast Cancer Type 1 Susceptibility Protein (BRCA1)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "MYC Proto-Oncogene (MYC)",
            "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
            "Beta Actin (ACTB)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Hemoglobin Subunit Beta (HBB)",
            "Apolipoprotein E (APOE)",
            "Insulin (INS)",
            "Neurofibromin 1 (NF1)",
            "Vascular Endothelial Growth Factor A (VEGFA)",
            "KRAS Proto-Oncogene (KRAS)",
            "Estrogen Receptor 1 (ESR1)",
            "Methylenetetrahydrofolate Reductase (MTHFR)",
            "Apolipoprotein B (APOB)",
            "Catechol-O-Methyltransferase (COMT)",
            "Interleukin 6 (IL6)",
            "Fat Mass and Obesity-Associated Protein (FTO)",
            "Cyclin-Dependent Kinase 2 (CDK2)",
            "B-Raf Proto-Oncogene (BRAF)",
            "Circadian Locomotor Output Cycles Kaput (CLOCK)",
            "Superoxide Dismutase 1 (SOD1)",
            "Dystrophin (DMD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tumor Protein P53 (TP53)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "MYC Proto-Oncogene (MYC)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Beta Actin (ACTB)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Hemoglobin Subunit Beta (HBB)",
                "Apolipoprotein E (APOE)",
                "Insulin (INS)",
                "Neurofibromin 1 (NF1)",
                "Vascular Endothelial Growth Factor A (VEGFA)",
                "KRAS Proto-Oncogene (KRAS)",
                "Estrogen Receptor 1 (ESR1)",
                "Methylenetetrahydrofolate Reductase (MTHFR)",
                "Apolipoprotein B (APOB)",
                "Catechol-O-Methyltransferase (COMT)",
                "Interleukin 6 (IL6)",
                "Cyclin-Dependent Kinase 2 (CDK2)",
                "B-Raf Proto-Oncogene (BRAF)",
                "Circadian Locomotor Output Cycles Kaput (CLOCK)",
                "Superoxide Dismutase 1 (SOD1)",
                "Dystrophin (DMD)"
            ],
            "mismatches": [
                "Breast Cancer Type 1 Susceptibility Protein (BRCA1)",
                "Fat Mass and Obesity-Associated Protein (FTO)"
            ],
            "true_referents": [
                "A-Raf proto-oncogene, serine/threonine kinase (ARAF aka A-RAF1, PKS2, RAFA1, ARAF)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "MYCN proto-oncogene, bHLH transcription factor (MYCN aka FGLDS1, MODED, MPAPAsORF, MYCNsPEP, N-myc, NMYC, ODED, bHLHe37, MYCN)",
                "NRAS proto-oncogene, GTPase (NRAS aka ALPS4, CMNS, KRAS, N-ras, NCMS1, NS6, NRAS)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "actin beta (ACTB aka BKRNS, BNS, BRWS1, CSMH, DDS1, PS1TP5BP1, THC8)",
                "actin beta like 2 (ACTBL2 aka ACT)",
                "adipogenin (ADIG aka SMAF1)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein B (APOB aka FCHL2, FLDB, LDLCQ4, apoB-100, apoB-48)",
                "apolipoprotein B receptor (APOBR aka APOB100R, APOB48R)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "capping actin protein of muscle Z-line subunit beta (CAPZB aka CAPB, CAPPB, CAPZ)",
                "catechol-O-methyltransferase (COMT aka HEL-S-98n)",
                "catechol-O-methyltransferase domain containing 1 (COMTD1)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "circadian associated repressor of transcription (CIART aka C1orf51, CHRONO, GM129)",
                "clock circadian regulator (CLOCK aka KAT13D, bHLHe8)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cryptochrome circadian regulator 1 (CRY1 aka DSPD, PHLL1)",
                "cyclin dependent kinase 1 (CDK1 aka CDC2, CDC28A, P34CDC2)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "cyclin dependent kinase 3 (CDK3)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "estrogen receptor 1 (ESR1 aka ER, ESR, ESRA, ESTRR, Era, NR3A1)",
                "estrogen related receptor alpha (ESRRA aka ERR1, ERRa, ERRalpha, ESRL1, NR3B1)",
                "estrogen related receptor beta (ESRRB aka DFNB35, ERR beta-2, ERR2, ERRb, ERRbeta2, ESRL2, NR3B2)",
                "fat storage inducing transmembrane protein 1 (FITM1 aka FIT1)",
                "fatty acid binding protein 2 (FABP2 aka FABPI, I-FABP)",
                "glyceraldehyde-3-phosphate dehydrogenase (GAPDH aka G3PD, GAPD, HEL-S-162eP)",
                "glyceraldehyde-3-phosphate dehydrogenase, spermatogenic (GAPDHS aka GAPD2, GAPDH-2, GAPDS, HEL-S-278, HSD-35)",
                "glycerol-3-phosphate dehydrogenase 1 (GPD1 aka GPD-C, GPDH-C, HTGTI)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "neurofibromin 1 (NF1 aka NFNS, VRNF, WSS)",
                "neurofilament light chain (NEFL aka CMT1F, CMT2E, CMTDIG, NF-L, NF68, NFL, PPP1R110)",
                "neurofilament medium chain (NEFM aka NEF3, NF-M, NFM)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "transmembrane O-methyltransferase (TOMT aka COMT2)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Hemoglobin Subunit Beta (HBB)",
            "Tumor Protein p53 (TP53)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Insulin (INS)",
            "Breast Cancer 1 (BRCA1)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Apolipoprotein E (APOE)",
            "Dystrophin (DMD)",
            "Huntingtin (HTT)",
            "Myosin Heavy Chain 7 (MYH7)",
            "Collagen Type I Alpha 1 Chain (COL1A1)",
            "Glucocerebrosidase (GBA)",
            "Androgen Receptor (AR)",
            "Amyloid Beta Precursor Protein (APP)",
            "Estrogen Receptor 1 (ESR1)",
            "Fibroblast Growth Factor Receptor 3 (FGFR3)",
            "Paired Box 6 (PAX6)",
            "Sonic Hedgehog (SHH)",
            "Vascular Endothelial Growth Factor A (VEGFA)",
            "Tumor Necrosis Factor (TNF)",
            "Interleukin 6 (IL6)",
            "Kirsten Rat Sarcoma Viral Oncogene Homolog (KRAS)",
            "Microtubule Associated Protein Tau (MAPT)",
            "Retinoblastoma 1 (RB1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemoglobin Subunit Beta (HBB)",
                "Tumor Protein p53 (TP53)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "Insulin (INS)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Apolipoprotein E (APOE)",
                "Dystrophin (DMD)",
                "Huntingtin (HTT)",
                "Myosin Heavy Chain 7 (MYH7)",
                "Collagen Type I Alpha 1 Chain (COL1A1)",
                "Androgen Receptor (AR)",
                "Amyloid Beta Precursor Protein (APP)",
                "Estrogen Receptor 1 (ESR1)",
                "Fibroblast Growth Factor Receptor 3 (FGFR3)",
                "Vascular Endothelial Growth Factor A (VEGFA)",
                "Tumor Necrosis Factor (TNF)",
                "Interleukin 6 (IL6)",
                "Kirsten Rat Sarcoma Viral Oncogene Homolog (KRAS)",
                "Microtubule Associated Protein Tau (MAPT)"
            ],
            "mismatches": [
                "Breast Cancer 1 (BRCA1)",
                "Glucocerebrosidase (GBA)",
                "Paired Box 6 (PAX6)",
                "Sonic Hedgehog (SHH)",
                "Retinoblastoma 1 (RB1)"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "Indian hedgehog signaling molecule (IHH aka BDA1, HHG2)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "SUFU negative regulator of hedgehog signaling (SUFU aka BCNS2, JBTS32, PRO1280H, SUFUXL, SUFU)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "alpha glucosidase (GAA aka LYAG)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "amyloid beta precursor protein binding protein 2 (APPBP2 aka APP-BP2, HS.84084, PAT1)",
                "androgen receptor (AR aka AIS8, DHTR, HUMARA, HYSP1, KD, NR3C4, SBMA, SMAX1, TFM, AR)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type I alpha 2 chain (COL1A2 aka EDSARTH2, EDSCV, OI4)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "estrogen receptor 1 (ESR1 aka ER, ESR, ESRA, ESTRR, Era, NR3A1)",
                "estrogen related receptor alpha (ESRRA aka ERR1, ERRa, ERRalpha, ESRL1, NR3B1)",
                "estrogen related receptor beta (ESRRB aka DFNB35, ERR beta-2, ERR2, ERRb, ERRbeta2, ESRL2, NR3B2)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 3 (FGFR3 aka ACH, CD333, CEK2, HSFGFR3EX, JTK4)",
                "fibroblast growth factor receptor like 1 (FGFRL1 aka FGFR-5, FGFR5, FHFR)",
                "glucosylceramidase beta 1 (GBA1 aka GBA, GCB, GLUC)",
                "glucosylceramidase beta 2 (GBA2 aka AD035, NLGase, SPG46)",
                "gonadotropin releasing hormone receptor (GNRHR aka GNRHR1, GRHR, HH7, LHRHR, LRHR)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 5 (IL5 aka EDF, IL-5, TRF)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "kinase suppressor of ras 1 (KSR1 aka KSR, RSU2)",
                "microtubule associated protein 2 (MAP2 aka MAP-2A, MAP2B, MAP2C, MAP2)",
                "microtubule associated protein 4 (MAP4)",
                "microtubule associated protein tau (MAPT aka DDPAC, FTD1, FTDP-17L, MSTD, MTBT1, MTBT2, PPND, PPP1R103, TAU, Tau-PHF6, tau-40, MAPT)",
                "muscle RAS oncogene homolog (MRAS aka M-RAs, NS11, R-RAS3, RRAS3)",
                "myosin heavy chain 1 (MYH1 aka HEL71, MYHSA1, MYHa, MyHC-2X/D, MyHC-2x)",
                "myosin heavy chain 7 (MYH7 aka CMD1S, CMH1, CMYO7A, CMYO7B, CMYP7A, CMYP7B, MPD1, MYHCB, SPMD, SPMM)",
                "myosin heavy chain 7B (MYH7B aka MHC14, MYH14, lncMYH7b)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "neural retina leucine zipper (NRL aka D14S46E-MAF, RP27, NRL)",
                "paired box 4 (PAX4 aka KPD, MODY9)",
                "paired box 5 (PAX5 aka ALL3, BSAP, PAX-5)",
                "paired box 8 (PAX8 aka PAX-8)",
                "retinal outer segment membrane protein 1 (ROM1 aka ROM, ROSP1, RP7, TSPAN23)",
                "retinoschisin 1 (RS1 aka RS, XLRS1)",
                "sonic hedgehog signaling molecule (SHH aka HHG1, HLP3, HPE3, MCOPCB5, SMMCI, ShhNC, TPT, TPTPS)",
                "steroid 5 alpha-reductase 1 (SRD5A1 aka S5AR 1)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Tumor Protein P53 (TP53)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Huntingtin (HTT)",
            "Breast Cancer 1 (BRCA1)",
            "Hemoglobin Subunit Alpha (HBA1)",
            "Dystrophin (DMD)",
            "Amyloid Beta Precursor Protein (APP)",
            "Fibroblast Growth Factor Receptor 2 (FGFR2)",
            "Leptin (LEP)",
            "Rhodopsin (RHO)",
            "Collagen Type I Alpha 1 Chain (COL1A1)",
            "Paired Box 6 (PAX6)",
            "Cytochrome P450 Family 2 Subfamily D Member 6 (CYP2D6)",
            "Methylenetetrahydrofolate Reductase (MTHFR)",
            "Angiotensin I Converting Enzyme (ACE)",
            "Apolipoprotein E (APOE)",
            "Potassium Voltage-Gated Channel Subfamily H Member 2 (KCNH2)",
            "Parkinson Disease Protein 2 (PARK2)",
            "Coagulation Factor V (F5)",
            "Adenosine Deaminase (ADA)",
            "Phenylalanine Hydroxylase (PAH)",
            "Sarcoglycans Alpha (SGCA)",
            "Sonic Hedgehog (SHH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "Tumor Protein P53 (TP53)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Huntingtin (HTT)",
                "Breast Cancer 1 (BRCA1)",
                "Hemoglobin Subunit Alpha (HBA1)",
                "Dystrophin (DMD)",
                "Amyloid Beta Precursor Protein (APP)",
                "Fibroblast Growth Factor Receptor 2 (FGFR2)",
                "Leptin (LEP)",
                "Rhodopsin (RHO)",
                "Collagen Type I Alpha 1 Chain (COL1A1)",
                "Cytochrome P450 Family 2 Subfamily D Member 6 (CYP2D6)",
                "Methylenetetrahydrofolate Reductase (MTHFR)",
                "Angiotensin I Converting Enzyme (ACE)",
                "Apolipoprotein E (APOE)",
                "Coagulation Factor V (F5)",
                "Adenosine Deaminase (ADA)",
                "Phenylalanine Hydroxylase (PAH)",
                "Sarcoglycans Alpha (SGCA)",
                "Sonic Hedgehog (SHH)"
            ],
            "mismatches": [
                "Paired Box 6 (PAX6)",
                "Potassium Voltage-Gated Channel Subfamily H Member 2 (KCNH2)",
                "Parkinson Disease Protein 2 (PARK2)"
            ],
            "true_referents": [
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "Indian hedgehog signaling molecule (IHH aka BDA1, HHG2)",
                "SUFU negative regulator of hedgehog signaling (SUFU aka BCNS2, JBTS32, PRO1280H, SUFUXL, SUFU)",
                "adenosine deaminase (ADA aka ADA1)",
                "adenosine deaminase 2 (ADA2 aka ADGF, CECR1, IDGFL, PAN, SNEDS, VAIHS)",
                "adenosine deaminase domain containing 1 (ADAD1 aka Tenr)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "amyloid beta precursor protein binding protein 2 (APPBP2 aka APP-BP2, HS.84084, PAT1)",
                "angiotensin I converting enzyme (ACE aka ACE1, CD143, DCP, DCP1)",
                "angiotensin converting enzyme 2 (ACE2 aka ACEH)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor II, thrombin (F2 aka PT, RPRGL2, THPH1)",
                "coagulation factor V (F5 aka FVL, PCCF, RPRGL1, THPH2)",
                "coagulation factor VII (F7 aka SPCA)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type I alpha 2 chain (COL1A2 aka EDSARTH2, EDSCV, OI4)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cytochrome P450 2D6 (LOC107987479 aka CYP2D6)",
                "cytochrome P450 family 2 subfamily A member 6 (CYP2A6 aka CPA6, CYP2A, CYP2A3, CYPIIA6, P450C2A, P450PB)",
                "cytochrome P450 family 2 subfamily R member 1 (CYP2R1)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "endothelin converting enzyme 1 (ECE1 aka ECE)",
                "fibroblast growth factor 2 (FGF2 aka BFGF, FGF-2, FGFB, HBGF-2)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 2 (FGFR2 aka BBDS, BEK, BFR-1, CD332, CEK3, CFD1, ECT1, JWS, K-SAM, KGFR, TK14, TK25)",
                "hemoglobin subunit alpha 1 (HBA1 aka ECYT7, HBA-T3, HBH, METHBA)",
                "hemoglobin subunit alpha 2 (HBA2 aka ECYT7, HBA-T2, HBH)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "leptin (LEP aka LEPD, OB, OBS)",
                "leptin receptor (LEPR aka CD295, LEP-RD, OB-R, OBR, LEPR)",
                "leptin receptor overlapping transcript (LEPROT aka LEPR, OB-RGRP, OBRGRP, VPS55)",
                "leucine rich repeat kinase 2 (LRRK2 aka AURA17, DARDARIN, PARK8, RIPK7, ROCO2)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "paired box 4 (PAX4 aka KPD, MODY9)",
                "paired box 5 (PAX5 aka ALL3, BSAP, PAX-5)",
                "paired box 8 (PAX8 aka PAX-8)",
                "parkin coregulated (PACRG aka BUG21, GLUP, HAK0057712.1, PARK2CRG, pf12, PACRG)",
                "parkin coregulated like (PACRGL aka C4orf28)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "potassium voltage-gated channel subfamily H member 1 (KCNH1 aka EAG, EAG1, K(V)10.1, Kv10.1, TMBTS, ZLS1, h-eag, hEAG, hEAG1)",
                "potassium voltage-gated channel subfamily H member 3 (KCNH3 aka BEC1, ELK2, Kv12.2)",
                "potassium voltage-gated channel subfamily H member 5 (KCNH5 aka DEE112, EAG2, H-EAG2, Kv10.2, hEAG2)",
                "retinal G protein coupled receptor (RGR aka RP44)",
                "retinal pigment epithelium-derived rhodopsin homolog (RRH)",
                "rhodopsin (RHO aka CSNBAD1, OPN2, RP4)",
                "sarcoglycan alpha (SGCA aka 50DAG, ADL, DAG2, DMDA2, LGMD2D, LGMDR3, SCARMD1, adhalin)",
                "sarcoglycan beta (SGCB aka A3b, LGMD2E, LGMDR4, SGC)",
                "sarcoglycan delta (SGCD aka 35DAG, CMD1L, DAGD, LGMDR6, SG-deltaP, SGD, SGCD)",
                "sonic hedgehog signaling molecule (SHH aka HHG1, HLP3, HPE3, MCOPCB5, SMMCI, ShhNC, TPT, TPTPS)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Tumor protein p53 (TP53)",
            "BRCA1 gene",
            "Apolipoprotein E (APOE)",
            "Huntingtin (HTT)",
            "Cystic fibrosis transmembrane conductance regulator (CFTR)",
            "Glucokinase (GCK)",
            "Phenylalanine hydroxylase (PAH)",
            "Survival motor neuron 1 (SMN1)",
            "Dystrophin (DMD)",
            "Hemoglobin subunit beta (HBB)",
            "Methylenetetrahydrofolate reductase (MTHFR)",
            "Prion protein (PRNP)",
            "Hexokinase 1 (HK1)",
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "Leptin (LEP)",
            "Insulin (INS)",
            "Cytochrome P450 2D6 (CYP2D6)",
            "Angiotensin-converting enzyme (ACE)",
            "Serotonin transporter (SLC6A4)",
            "Catechol-O-methyltransferase (COMT)",
            "Superoxide dismutase 1 (SOD1)",
            "Myoglobin (MB)",
            "Proprotein convertase subtilisin/kexin type 9 (PCSK9)",
            "Telomerase reverse transcriptase (TERT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tumor protein p53 (TP53)",
                "Apolipoprotein E (APOE)",
                "Huntingtin (HTT)",
                "Cystic fibrosis transmembrane conductance regulator (CFTR)",
                "Glucokinase (GCK)",
                "Phenylalanine hydroxylase (PAH)",
                "Survival motor neuron 1 (SMN1)",
                "Dystrophin (DMD)",
                "Hemoglobin subunit beta (HBB)",
                "Methylenetetrahydrofolate reductase (MTHFR)",
                "Prion protein (PRNP)",
                "Hexokinase 1 (HK1)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Leptin (LEP)",
                "Insulin (INS)",
                "Cytochrome P450 2D6 (CYP2D6)",
                "Angiotensin-converting enzyme (ACE)",
                "Catechol-O-methyltransferase (COMT)",
                "Superoxide dismutase 1 (SOD1)",
                "Myoglobin (MB)",
                "Proprotein convertase subtilisin/kexin type 9 (PCSK9)",
                "Telomerase reverse transcriptase (TERT)"
            ],
            "mismatches": [
                "BRCA1 gene",
                "Serotonin transporter (SLC6A4)"
            ],
            "true_referents": [
                "5-hydroxytryptamine receptor 4 (HTR4 aka 5-HT4, 5-HT4R)",
                "5-hydroxytryptamine receptor 6 (HTR6 aka 5-HT6, 5-HT6R)",
                "ADP dependent glucokinase (ADPGK aka 2610017G09Rik, ADP-GK)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "angiotensin I converting enzyme (ACE aka ACE1, CD143, DCP, DCP1)",
                "angiotensin converting enzyme 2 (ACE2 aka ACEH)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "catechol-O-methyltransferase (COMT aka HEL-S-98n)",
                "catechol-O-methyltransferase domain containing 1 (COMTD1)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "creatine kinase, M-type (CKM aka CKMM, CPK-M, M-CK)",
                "cytochrome P450 2D6 (LOC107987479 aka CYP2D6)",
                "cytochrome P450 family 2 subfamily A member 6 (CYP2A6 aka CPA6, CYP2A, CYP2A3, CYPIIA6, P450C2A, P450PB)",
                "cytochrome P450 family 2 subfamily R member 1 (CYP2R1)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "endothelin converting enzyme 1 (ECE1 aka ECE)",
                "glucokinase (GCK aka FGQTL3, GK, GLK, HHF3, HK4, HKIV, HXKP, LGLK, MODY2, PNDM1)",
                "glucokinase regulator (GCKR aka FGQTL5, GKRP)",
                "glucose-6-phosphate dehydrogenase (G6PD aka CNSHA11, G6PD)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "hexokinase 1 (HK1 aka CNSHA5, HK-ta, HK1-tb, HK1-tc, HKD, HKI, HMSNR, HXK1, NEDVIBA, NMSR, RP79, hexokinase, HK1)",
                "hexokinase 2 (HK2 aka HKII, HXK2)",
                "hexokinase 3 (HK3 aka HKIII, HXK3)",
                "hexose-6-phosphate dehydrogenase/glucose 1-dehydrogenase (H6PD aka CORTRD1, G6PDH, GDHH, H6PD)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "leptin (LEP aka LEPD, OB, OBS)",
                "leptin receptor (LEPR aka CD295, LEP-RD, OB-R, OBR, LEPR)",
                "leptin receptor overlapping transcript (LEPROT aka LEPR, OB-RGRP, OBRGRP, VPS55)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "myoglobin (MB aka MYOSB, PVALB)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "phosphogluconate dehydrogenase (PGD aka 6PGD)",
                "prion like protein doppel (PRND aka DOPPEL, DPL, PrPLP, dJ1068H6.4)",
                "prion protein (Kanno blood group) (PRNP aka ASCR, AltPrP, CD230, CJD, GSS, KURU, PRIP, PrP, PrP27-30, PrP33-35C, PrPc, p27-30)",
                "proprotein convertase subtilisin/kexin type 1 (PCSK1 aka BMIQ12, NEC1, PC1, PC1/3, PC3, SPC3)",
                "proprotein convertase subtilisin/kexin type 5 (PCSK5 aka PC5, PC6, PC6A, SPC6)",
                "proprotein convertase subtilisin/kexin type 9 (PCSK9 aka FH3, FHCL3, HCHOLA3, LDLCQ1, NARC-1, NARC1, PC9)",
                "shadow of prion protein (SPRN aka SHADOO, SHO, bA108K14.1)",
                "solute carrier family 6 member 4 (SLC6A4 aka 5-HTT, 5-HTTLPR, 5HTT, HTT, OCD1, SERT, SERT1, hSERT)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "survival motor neuron domain containing 1 (SMNDC1 aka SMNR, SPF30, TDRD16C)",
                "survival of motor neuron 1, telomeric (SMN1 aka BCD541, GEMIN1, SMA, SMA1, SMA2, SMA3, SMA4, SMA@, SMN, SMNT, T-BCD541, TDRD16A)",
                "survival of motor neuron 2, centromeric (SMN2 aka BCD541, C-BCD541, GEMIN1, SMNC, TDRD16B)",
                "telomerase RNA component interacting RNase (TRIR aka C19orf43, TERCIR, fSAP18)",
                "telomerase reverse transcriptase (TERT aka CMM9, DKCA2, DKCB4, EST2, PFBMFT1, TCS1, TP2, TRT, hEST2, hTRT)",
                "telomere repeat binding bouquet formation protein 1 (TERB1 aka CCDC79, SPGF60)",
                "transmembrane O-methyltransferase (TOMT aka COMT2)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Albumin (ALB)",
            "Amyloid Beta Precursor Protein (APP)",
            "Apolipoprotein E (APOE)",
            "Breast Cancer 1 (BRCA1)",
            "Breast Cancer 2 (BRCA2)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Cytochrome P450 2D6 (CYP2D6)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Glucose-6-Phosphate Dehydrogenase (G6PD)",
            "Hemoglobin Subunit Alpha 1 (HBA1)",
            "Hemoglobin Subunit Beta (HBB)",
            "Huntingtin (HTT)",
            "Insulin (INS)",
            "Insulin-Like Growth Factor 1 (IGF1)",
            "Methylenetetrahydrofolate Reductase (MTHFR)",
            "Prion Protein (PRNP)",
            "Sickle Cell Anemia Hemoglobin Subunit Beta (HBB)",
            "Superoxide Dismutase 1 (SOD1)",
            "Tau Microtubule Associated Protein (MAPT)",
            "Thymidylate Synthase (TYMS)",
            "Tumor Protein P53 (TP53)",
            "Warfarin Metabolism Cytochrome P450 2C9 (CYP2C9)",
            "X-Box Binding Protein 1 (XBP1)",
            "Xylosyltransferase 1 (XYLT1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Albumin (ALB)",
                "Amyloid Beta Precursor Protein (APP)",
                "Apolipoprotein E (APOE)",
                "Breast Cancer 1 (BRCA1)",
                "Breast Cancer 2 (BRCA2)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Cytochrome P450 2D6 (CYP2D6)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "Glucose-6-Phosphate Dehydrogenase (G6PD)",
                "Hemoglobin Subunit Alpha 1 (HBA1)",
                "Hemoglobin Subunit Beta (HBB)",
                "Huntingtin (HTT)",
                "Insulin (INS)",
                "Insulin-Like Growth Factor 1 (IGF1)",
                "Methylenetetrahydrofolate Reductase (MTHFR)",
                "Prion Protein (PRNP)",
                "Superoxide Dismutase 1 (SOD1)",
                "Tau Microtubule Associated Protein (MAPT)",
                "Thymidylate Synthase (TYMS)",
                "Tumor Protein P53 (TP53)",
                "X-Box Binding Protein 1 (XBP1)",
                "Xylosyltransferase 1 (XYLT1)"
            ],
            "mismatches": [
                "Sickle Cell Anemia Hemoglobin Subunit Beta (HBB)",
                "Warfarin Metabolism Cytochrome P450 2C9 (CYP2C9)"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "F-box protein 4 (FBXO4 aka FBX4)",
                "X-box binding protein 1 (XBP1 aka TREB-5, TREB5, XBP-1, XBP2)",
                "afamin (AFM aka ALB2, ALBA, ALF)",
                "albumin (ALB aka FDAHT, HSA, PRO0883, PRO0903, PRO1341)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "amyloid beta precursor protein binding protein 2 (APPBP2 aka APP-BP2, HS.84084, PAT1)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cytochrome P450 2D6 (LOC107987479 aka CYP2D6)",
                "cytochrome P450 family 2 subfamily A member 6 (CYP2A6 aka CPA6, CYP2A, CYP2A3, CYPIIA6, P450C2A, P450PB)",
                "cytochrome P450 family 2 subfamily C member 9 (CYP2C9 aka CPC9, CYP2C, CYP2C10, CYPIIC9, P450-2C9, P450IIC9)",
                "cytochrome P450 family 2 subfamily R member 1 (CYP2R1)",
                "cytochrome P450 family 2 subfamily W member 1 (CYP2W1)",
                "cytochrome P450 family 39 subfamily A member 1 (CYP39A1)",
                "deoxythymidylate kinase (DTYMK aka CDC8, CONPM, PP3731, TMPK, TYMK)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "glucose-6-phosphate dehydrogenase (G6PD aka CNSHA11, G6PD)",
                "glucoside xylosyltransferase 1 (GXYLT1 aka GLT8D3)",
                "hemoglobin subunit alpha 1 (HBA1 aka ECYT7, HBA-T3, HBH, METHBA)",
                "hemoglobin subunit alpha 2 (HBA2 aka ECYT7, HBA-T2, HBH)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "hexose-6-phosphate dehydrogenase/glucose 1-dehydrogenase (H6PD aka CORTRD1, G6PDH, GDHH, H6PD)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin like growth factor 1 (IGF1 aka IGF, IGF-I, IGFI, MGF)",
                "insulin like growth factor 1 receptor (IGF1R aka CD221, IGFIR, IGFR, JTK13)",
                "insulin like growth factor 2 (IGF2 aka C11orf43, GRDF, IGF-II, PP9974, SRS3)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "microtubule associated protein 2 (MAP2 aka MAP-2A, MAP2B, MAP2C, MAP2)",
                "microtubule associated protein 4 (MAP4)",
                "microtubule associated protein tau (MAPT aka DDPAC, FTD1, FTDP-17L, MSTD, MTBT1, MTBT2, PPND, PPP1R103, TAU, Tau-PHF6, tau-40, MAPT)",
                "parvalbumin (PVALB aka D22S749)",
                "phosphogluconate dehydrogenase (PGD aka 6PGD)",
                "prion like protein doppel (PRND aka DOPPEL, DPL, PrPLP, dJ1068H6.4)",
                "prion protein (Kanno blood group) (PRNP aka ASCR, AltPrP, CD230, CJD, GSS, KURU, PRIP, PrP, PrP27-30, PrP33-35C, PrPc, p27-30)",
                "shadow of prion protein (SPRN aka SHADOO, SHO, bA108K14.1)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "thymidine phosphorylase (TYMP aka ECGF, ECGF1, MEDPS1, MNGIE, MTDPS1, PDECGF, TP, hPD-ECGF)",
                "thymidylate synthetase (TYMS aka DKCD, HST422, TMS, TS)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "upstream binding protein 1 (UBP1 aka LBP-1B, LBP-1a, LBP1A, LBP1B)",
                "xylosyltransferase 1 (XYLT1 aka DBQD2, PXYLT1, XT-I, XT1, XTI, XYLTI, xylT-I)",
                "xylosyltransferase 2 (XYLT2 aka PXYLT2, SOS, XT-II, XT2, xylT-II)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "EGFR (EGFR)",
            "KRAS (KRAS)",
            "BRCA2 (BRCA2)",
            "HBB (HBB)",
            "HBA1 (HBA1)",
            "HBA2 (HBA2)",
            "HBA1-HBA2 (HBA1-HBA2)",
            "F5 (F5)",
            "F2 (F2)",
            "F9 (F9)",
            "F10 (F10)",
            "F11 (F11)",
            "F12 (F12)",
            "F13A1 (F13A1)",
            "F13B (F13B)",
            "F7 (F7)",
            "F8 (F8)",
            "VWF (VWF)",
            "A1BG (A1BG)",
            "A1CF (A1CF)",
            "A2M (A2M)",
            "A4GALT (A4GALT)",
            "A5H (A5H)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "KRAS",
                "BRCA2",
                "HBB",
                "HBA1",
                "HBA2",
                "F13A1",
                "F13B",
                "VWF",
                "A1BG",
                "A1CF",
                "A2M"
            ],
            "mismatches": [
                "BRCA1",
                "HBA1-HBA2",
                "F5",
                "F2",
                "F9",
                "F10",
                "F11",
                "F12",
                "F7",
                "F8",
                "A4GALT",
                "A5H"
            ],
            "true_referents": [
                "APOBEC1 complementation factor (A1CF aka ACF, ACF64, ACF65, APOBEC1CF, ASP)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "E2F transcription factor 2 (E2F2 aka E2F-2)",
                "E2F transcription factor 5 (E2F5 aka E2F-5)",
                "E2F transcription factor 7 (E2F7)",
                "EFR3 homolog B (EFR3B aka KIAA0953)",
                "F10 antisense RNA 2 (F10-AS2 aka SCAR-6)",
                "F11 receptor (F11R aka CD321, JAM, JAM1, JAMA, JCAM, KAT, PAM-1)",
                "G antigen 4 (GAGE4 aka CT4.4)",
                "IQ motif containing F5 (IQCF5)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MAGE family member A8 (MAGEA8 aka CT1.8, MAGE8)",
                "MAGE family member A9 (MAGEA9 aka CT1.9, MAGE9)",
                "MAGE family member B10 (MAGEB10)",
                "MAGE family member F1 (MAGEF1 aka MAGE-F1)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "SSX family member 7 (SSX7)",
                "Sp5 transcription factor (SP5)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "XK related 9 (XKR9 aka XRG9, hXKR9)",
                "adrenomedullin 2 (ADM2 aka AM2, dJ579N16.4)",
                "alpha-1-B glycoprotein (A1BG aka A1B, ABG, GAB, HYST2477)",
                "alpha-2-macroglobulin (A2M aka A2MD, CPAMD5, FWP007, S863-7)",
                "beta-1,4-N-acetyl-galactosaminyltransferase 4 (B4GALNT4)",
                "beta-1,4-galactosyltransferase 4 (B4GALT4 aka B4Gal-T4, beta4Gal-T4)",
                "coagulation factor XIII A chain (F13A1 aka F13A)",
                "coagulation factor XIII B chain (F13B aka FXIIIB)",
                "complement C7 (C7)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "family with sequence similarity 133 member B (FAM133B)",
                "forkhead box J2 (FOXJ2 aka FHX)",
                "formin 2 (FMN2)",
                "formin like 2 (FMNL2 aka FHOD2)",
                "frizzled class receptor 8 (FZD8 aka FZ-8, hFZ8)",
                "frizzled class receptor 9 (FZD9 aka CD349, FZD3)",
                "golgin A8 family member F (GOLGA8F)",
                "hemoglobin subunit alpha 1 (HBA1 aka ECYT7, HBA-T3, HBH, METHBA)",
                "hemoglobin subunit alpha 2 (HBA2 aka ECYT7, HBA-T2, HBH)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "immunoglobulin heavy constant alpha 2 (A2m marker) (IGHA2 aka A2M)",
                "inhibin subunit beta B (INHBB)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "jade family PHD finger 1 (JADE1 aka PHF17)",
                "jade family PHD finger 2 (JADE2 aka JADE-2, PHF15)",
                "jade family PHD finger 3 (JADE3 aka JADE-3, PHF16)",
                "pancreas associated transcription factor 1a (PTF1A aka PACA, PAGEN2, PTF1-p48, bHLHa29, p48)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "sex hormone binding globulin (SHBG aka ABP, SBP, TEBG)",
                "synergin gamma (SYNRG aka AP1GBP1, SYNG)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "ubiquitin B (UBB aka HEL-S-50)",
                "von Willebrand factor (VWF aka F8VWF, VWD)",
                "von Willebrand factor A domain containing 3A (VWA3A)",
                "von Willebrand factor A domain containing 3B (VWA3B aka SCAR22)"
            ],
            "TP": 13,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "TP53 (TP53)",
            "BRCA1 (BRCA1)",
            "BRCA2 (BRCA2)",
            "CFTR (CFTR)",
            "HTT (HTT)",
            "APP (APP)",
            "SNCA (SNCA)",
            "MAPT (MAPT)",
            "APOE (APOE)",
            "DRD4 (DRD4)",
            "COMT (COMT)",
            "SLC6A4 (SLC6A4)",
            "HLA-B (HLA-B)",
            "HLA-A (HLA-A)",
            "IL10 (IL10)",
            "IL6 (IL6)",
            "TNF (TNF)",
            "IFNG (IFNG)",
            "CTLA4 (CTLA4)",
            "PSEN1 (PSEN1)",
            "PSEN2 (PSEN2)",
            "GRIN1 (GRIN1)",
            "GRIN2A (GRIN2A)",
            "GRIN2B (GRIN2B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "BRCA2",
                "CFTR",
                "HTT",
                "APP",
                "SNCA",
                "APOE",
                "DRD4",
                "COMT",
                "SLC6A4",
                "HLA-B",
                "HLA-A",
                "IL10",
                "IL6",
                "TNF",
                "IFNG",
                "CTLA4",
                "PSEN1",
                "PSEN2",
                "GRIN1",
                "GRIN2A",
                "GRIN2B"
            ],
            "mismatches": [
                "BRCA1",
                "MAPT"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "G protein regulated inducer of neurite outgrowth 1 (GPRIN1 aka GRIN1)",
                "GIT ArfGAP 1 (GIT1 aka p95-APP1)",
                "GPRIN family member 3 (GPRIN3 aka GRIN3)",
                "MAPT intronic transcript 1 (MAPT-IT1)",
                "NADH dehydrogenase subunit 4 (ND4)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "TNF superfamily member 10 (TNFSF10 aka APO2L, Apo-2L, CD253, TANCR, TL2, TNLG6A, TRAIL)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "catalase (CAT)",
                "catechol-O-methyltransferase (COMT aka HEL-S-98n)",
                "catechol-O-methyltransferase domain containing 1 (COMTD1)",
                "cytotoxic T-lymphocyte associated protein 4 (CTLA4 aka ALPS5, CD, CD152, CELIAC3, CTLA-4, GRD4, GSE, IDDM12)",
                "dopamine receptor D4 (DRD4 aka D4DR)",
                "glutamate ionotropic receptor NMDA type subunit 1 (GRIN1 aka DEE101, GluN1, MRD8, NDHMSD, NDHMSR, NMD-R1, NMDA1, NMDAR1, NR1, hNR1)",
                "glutamate ionotropic receptor NMDA type subunit 2A (GRIN2A aka EPND, FESD, GluN2A, LKS, NMDAR2A, NR2A)",
                "glutamate ionotropic receptor NMDA type subunit 2B (GRIN2B aka DEE27, EIEE27, GluN2B, MRD6, NMDAR2B, NR2B, NR3, hNR3)",
                "glutamate ionotropic receptor NMDA type subunit 2C (GRIN2C aka GluN2C, NMDAR2C, NR2C)",
                "glutamate ionotropic receptor NMDA type subunit 2D (GRIN2D aka DEE46, EB11, EIEE46, GluN2D, NMDAR2D, NR2D)",
                "glutamate ionotropic receptor NMDA type subunit 3B (GRIN3B aka GluN3B, NR3B)",
                "glutathione S-transferase alpha 2 (GSTA2 aka GST2-2, GTA2, GTH2, GSTA2)",
                "glutathione S-transferase theta 1 (GSTT1)",
                "glutathione S-transferase theta 4 (GSTT4 aka GSTTP1, HS322B1A)",
                "heat shock protein family A (Hsp70) member 2 (HSPA2 aka HSP70-2, HSP70-3)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "interferon beta 1 (IFNB1 aka IFB, IFF, IFN-beta, IFNB)",
                "interferon gamma (IFNG aka IFG, IFI, IMD69)",
                "interleukin 10 (IL10 aka CSIF, GVHDS, IL-10A, TGIF, IL10)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 19 (IL19 aka IL-10C, MDA1, NG.1, ZMDA1)",
                "interleukin 20 (IL20 aka IL-20, IL10D, ZCYTO10)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "leucine rich repeat containing 25 (LRRC25 aka MAPA)",
                "major histocompatibility complex, class I, A (HLA-A aka HLAA)",
                "major histocompatibility complex, class I, B (HLA-B aka AS, B-4901, HLAB)",
                "major histocompatibility complex, class I, G (HLA-G aka MHC-G)",
                "major histocompatibility complex, class II, DO beta (HLA-DOB aka DOB, HLA_DOB)",
                "major histocompatibility complex, class II, DR alpha (HLA-DRA aka HLA-DRA1)",
                "major histocompatibility complex, class II, DR beta 4 (HLA-DRB4 aka DR4, DRB4, HLA-DR4B, HLA-DRB*, HLA-DRB4)",
                "mesogenin 1 (MSGN1 aka MSOG, pMsgn1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "myosin IF (MYO1F)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "presenilin 1 (PSEN1 aka ACNINV3, AD3, CMD1U, FAD, PS-1, PS1, PSNL1, S182)",
                "presenilin 2 (PSEN2 aka AD3L, AD4, CMD1V, PS2, STM2)",
                "presenilin enhancer, gamma-secretase subunit (PSENEN aka ACNINV2, MDS033, MSTP064, PEN-2, PEN2)",
                "reprimo like (RPRML)",
                "saitohin (STH aka MAPTIT)",
                "solute carrier family 1 member 6 (SLC1A6 aka EAAT4)",
                "solute carrier family 2 member 4 (SLC2A4 aka GLUT4)",
                "solute carrier family 6 member 4 (SLC6A4 aka 5-HTT, 5-HTTLPR, 5HTT, HTT, OCD1, SERT, SERT1, hSERT)",
                "synuclein alpha (SNCA aka NACP, PARK1, PARK4, PD1)",
                "transmembrane O-methyltransferase (TOMT aka COMT2)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            },
            {
                "name": "ACTB",
                "identifier": "ACTB"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ACTB"
            ],
            "mismatches": [],
            "true_referents": [
                "POTE ankyrin domain family member F (POTEF aka A26C1B, ACTB, POTE2alpha, POTEACTIN)",
                "actin beta like 2 (ACTBL2 aka ACT)",
                "double C2 domain beta (DOC2B aka DOC2BL)"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]