[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "TP53 (p53)",
            "BRCA1",
            "BRCA2",
            "EGFR",
            "MYC",
            "VEGFA",
            "KRAS",
            "HER2 (ERBB2)",
            "CDKN2A",
            "PTEN",
            "BRAF",
            "NF1",
            "APC",
            "IDH1",
            "RB1",
            "JAK2",
            "FLT3",
            "NOTCH1",
            "KIT",
            "PIK3CA",
            "BCL2",
            "MDM2",
            "CDH1",
            "SMAD4"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53 (p53)",
                "BRCA2",
                "EGFR",
                "MYC",
                "VEGFA",
                "KRAS",
                "HER2 (ERBB2)",
                "PTEN",
                "BRAF",
                "IDH1",
                "JAK2",
                "FLT3",
                "NOTCH1",
                "PIK3CA",
                "MDM2",
                "CDH1",
                "SMAD4"
            ],
            "mismatches": [
                "BRCA1",
                "CDKN2A",
                "NF1",
                "APC",
                "RB1",
                "KIT",
                "BCL2"
            ],
            "true_referents": [
                "A-Raf proto-oncogene, serine/threonine kinase (ARAF aka A-RAF1, PKS2, RAFA1, ARAF)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BCL2 like 10 (BCL2L10 aka BCL-B, Boo, Diva, bcl2-L-10)",
                "BCL2 like 11 (BCL2L11 aka BAM, BIM, BOD)",
                "BCL2 like 12 (BCL2L12)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "CDKN2A interacting protein (CDKN2AIP)",
                "CDKN2A interacting protein N-terminal like (CDKN2AIPNL aka C2AIL)",
                "FLT3 interacting zinc finger 1 (FIZ1 aka ZNF798)",
                "Janus kinase 1 (JAK1 aka AIIDEA, JAK1B, JTK3, JAK1)",
                "Janus kinase 2 (JAK2 aka JTK10)",
                "Janus kinase 3 (JAK3 aka JAK-3_HUMAN, JAKL, L-JAK, LJAK, JAK3)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MDM2 binding protein (MTBP aka MDM2BP)",
                "MDM2 proto-oncogene (MDM2 aka ACTFS, HDMX, LSKB, hdm2)",
                "MDM4 regulator of p53 (MDM4 aka BMFS6, HDMX, MDMX, MRP1)",
                "MYC associated zinc finger protein (MAZ aka PUR1, Pur-1, SAF-1, SAF-2, SAF-3, ZF87, ZNF801, Zif87)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "NBPF member 1 (NBPF1 aka AB13, AB14, AB23, AD2, NBG, NBPF)",
                "NBPF member 11 (NBPF11 aka NBPF24)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "SHOX homeobox 2 (SHOX2 aka OG12, OG12X, SHOT)",
                "SMAD family member 1 (SMAD1 aka BSP-1, BSP1, JV4-1, JV41, MADH1, MADR1)",
                "SMAD family member 4 (SMAD4 aka DPC4, JIP, MADH4, MYHRS)",
                "SMAD family member 6 (SMAD6 aka AOVD2, HsT17432, MADH6, MADH7)",
                "TP53 regulated inhibitor of apoptosis 1 (TRIAP1 aka HSPC132, MDM35, P53CSV, WF-1)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "anaphase promoting complex subunit 2 (ANAPC2 aka APC2)",
                "anaphase promoting complex subunit 5 (ANAPC5 aka APC5)",
                "bridging integrator 3 (BIN3)",
                "cadherin 1 (CDH1 aka Arc-1, BCDS1, CD324, CDHE, ECAD, LCAM, UVO)",
                "cadherin 7 (CDH7 aka CDH7L1)",
                "cadherin 9 (CDH9)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "delta like canonical Notch ligand 1 (DLL1 aka DELTA1, DL1, Delta, NEDBAS)",
                "delta like non-canonical Notch ligand 1 (DLK1 aka DLK, DLK-1, Delta1, FA1, PREF1, Pref-1, ZOG, pG2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fms related receptor tyrosine kinase 3 (FLT3 aka CD135, FLK-2, FLK2, STK1)",
                "fms related receptor tyrosine kinase 3 ligand (FLT3LG aka FL, FLG3L, FLT3L, IMD125)",
                "isocitrate dehydrogenase (NAD(+)) 3 catalytic subunit alpha (IDH3A aka RP90)",
                "isocitrate dehydrogenase (NADP(+)) 1 (IDH1 aka HEL-216, HEL-S-26, IDCD, IDH, IDP, IDPC, PICD)",
                "isocitrate dehydrogenase (NADP(+)) 2 (IDH2 aka D2HGA2, ICD-M, IDH, IDH-2, IDHM, IDP, IDPM, mNADP-IDH)",
                "neurofibromin 1 (NF1 aka NFNS, VRNF, WSS)",
                "notch receptor 1 (NOTCH1 aka AOS5, AOVD1, TAN1, hN1)",
                "paired box 4 (PAX4 aka KPD, MODY9)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit alpha (PIK3CA aka CCM4, CLAPO, CLOVE, CWS5, HMH, MCAP, MCM, MCMTC, PI3K, PI3K-alpha, p110-alpha)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit beta (PIK3CB aka P110BETA, PI3K, PI3KBETA, PIK3C1)",
                "phosphoinositide-3-kinase regulatory subunit 3 (PIK3R3 aka p55, p55-GAMMA, p55PIK)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "ring-box 1 (RBX1 aka BA554C12.1, RNF75, ROC1)",
                "solute carrier family 25 member 24 (SLC25A24 aka APC1, SCAMC-1, SCAMC1)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor D (VEGFD aka FIGF, VEGF-D)"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "EGFR (EGFR)",
            "MYC (MYC)",
            "APOE (APOE)",
            "INS (INS)",
            "CFTR (CFTR)",
            "HBB (HBB)",
            "HBA1 (HBA1)",
            "IGF1 (IGF1)",
            "VEGFA (VEGFA)",
            "TNF (TNF)",
            "IL2 (IL2)",
            "ACTB (ACTB)",
            "GAPDH (GAPDH)",
            "BRAF (BRAF)",
            "HER2 (ERBB2)",
            "KRAS (KRAS)",
            "LDLR (LDLR)",
            "P53 (TP53)",
            "MAP2K1 (MEK1)",
            "RB1 (RB1)",
            "MTOR (MTOR)",
            "AKT1 (AKT1)",
            "SRC (SRC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "MYC",
                "APOE",
                "CFTR",
                "HBB",
                "HBA1",
                "IGF1",
                "VEGFA",
                "TNF",
                "IL2",
                "GAPDH",
                "BRAF",
                "KRAS",
                "LDLR",
                "MAP2K1",
                "RB1",
                "MTOR",
                "AKT1"
            ],
            "mismatches": [
                "BRCA1",
                "INS",
                "ACTB",
                "HER2",
                "P53",
                "SRC"
            ],
            "true_referents": [
                "AKT serine/threonine kinase 1 (AKT1 aka AKT, PKB, PKB-ALPHA, PRKBA, RAC, RAC-ALPHA)",
                "AKT serine/threonine kinase 2 (AKT2 aka HIHGHH, PKBB, PKBBETA, PRKBB, RAC-BETA)",
                "AKT serine/threonine kinase 3 (AKT3 aka MPPH, MPPH2, PKB-GAMMA, PKBG, PRKBG, RAC-PK-gamma, RAC-gamma, STK-2)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MTOR associated protein, eak-7 homolog (MEAK7 aka EAK7, KIAA1609, TLDC1, mEAK-7)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "RB transcriptional corepressor 1 (RB1 aka OSRC, PPP1R130, RB, p105-Rb, p110-RB1, pRb, pp110)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "RPTOR independent companion of MTOR complex 2 (RICTOR aka AVO3, PIA, hAVO3)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "TNF superfamily member 10 (TNFSF10 aka APO2L, Apo-2L, CD253, TANCR, TL2, TNLG6A, TRAIL)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "TP53 regulated inhibitor of apoptosis 1 (TRIAP1 aka HSPC132, MDM35, P53CSV, WF-1)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "actin beta like 2 (ACTBL2 aka ACT)",
                "actin like 6B (ACTL6B aka ACTL6, BAF53B, DEE76, EIEE76, IDDSSAD, SMARCN2, arpNalpha)",
                "aldehyde dehydrogenase 5 family member A1 (ALDH5A1 aka SSADH, SSDH)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "glyceraldehyde-3-phosphate dehydrogenase (GAPDH aka G3PD, GAPD, HEL-S-162eP)",
                "glyceraldehyde-3-phosphate dehydrogenase, spermatogenic (GAPDHS aka GAPD2, GAPDH-2, GAPDS, HEL-S-278, HSD-35)",
                "hemoglobin subunit alpha 1 (HBA1 aka ECYT7, HBA-T3, HBH, METHBA)",
                "hemoglobin subunit alpha 2 (HBA2 aka ECYT7, HBA-T2, HBH)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "importin 4 (IPO4 aka Imp4)",
                "importin 9 (IPO9 aka Imp9)",
                "inhibin subunit beta B (INHBB)",
                "insulin like growth factor 1 (IGF1 aka IGF, IGF-I, IGFI, MGF)",
                "insulin like growth factor 1 receptor (IGF1R aka CD221, IGFIR, IGFR, JTK13)",
                "insulin like growth factor binding protein 1 (IGFBP1 aka AFBP, IBP1, IGF-BP25, PP12, hIGFBP-1)",
                "interleukin 2 (IL2 aka IL-2, TCGF, lymphokine)",
                "interleukin 25 (IL25 aka IL17E)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "low density lipoprotein receptor (LDLR aka FH, FHC, FHCL1, LDLCQ2)",
                "low density lipoprotein receptor class A domain containing 1 (LDLRAD1)",
                "mechanistic target of rapamycin kinase (MTOR aka FRAP, FRAP1, FRAP2, RAFT1, RAPT1, SKS)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "mitogen-activated protein kinase kinase 1 (MAP2K1 aka CFC3, MAPKK1, MEK1, MEL, MKK1, PRKMK1)",
                "mitogen-activated protein kinase kinase 2 (MAP2K2 aka CFC4, MAPKK2, MEK2, MKK2, PRKMK2)",
                "mitogen-activated protein kinase kinase kinase 2 (MAP3K2 aka MEKK2, MEKK2B)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "septin 11 (SEPTIN11 aka SEPT11, Septin-11)",
                "tectorin beta (TECTB)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "ubiquitin B (UBB aka HEL-S-50)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor D (VEGFD aka FIGF, VEGF-D)",
                "very low density lipoprotein receptor (VLDLR aka CAMRQ1, CARMQ1, CHRMQ1, VLDL-RCH, VLDLR)"
            ],
            "TP": 19,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "EGFR (EGFR)",
            "HER2 (ERBB2)",
            "KRAS (KRAS)",
            "BRAF (BRAF)",
            "MYC (MYC)",
            "BCL2 (BCL2)",
            "PIK3CA (PIK3CA)",
            "PTEN (PTEN)",
            "ALK (ALK)",
            "ROS1 (ROS1)",
            "RET (RET)",
            "NTRK1 (NTRK1)",
            "NTRK2 (NTRK2)",
            "NTRK3 (NTRK3)",
            "EML4-ALK (EML4-ALK)",
            "FGFR1 (FGFR1)",
            "FGFR2 (FGFR2)",
            "FGFR3 (FGFR3)",
            "FGFR4 (FGFR4)",
            "CDK4 (CDK4)",
            "CDK6 (CDK6)",
            "MET (MET)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "HER2",
                "KRAS",
                "BRAF",
                "MYC",
                "PIK3CA",
                "PTEN",
                "ROS1",
                "RET",
                "NTRK1",
                "NTRK2",
                "NTRK3",
                "FGFR1",
                "FGFR2",
                "FGFR3",
                "FGFR4",
                "CDK4",
                "CDK6",
                "MET"
            ],
            "mismatches": [
                "BRCA1",
                "BCL2",
                "ALK",
                "EML4-ALK"
            ],
            "true_referents": [
                "ALK and LTK ligand 1 (ALKAL1 aka AUGA, AUGB, FAM150A, UNQ9433)",
                "ALK receptor tyrosine kinase (ALK aka ALK1, CD246, NBLST3)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BCL2 like 10 (BCL2L10 aka BCL-B, Boo, Diva, bcl2-L-10)",
                "BCL2 like 11 (BCL2L11 aka BAM, BIM, BOD)",
                "BCL2 like 12 (BCL2L12)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MET proto-oncogene, receptor tyrosine kinase (MET aka AUTS9, DA11, DFNB97, HGFR, RCCP2, c-Met)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "RELT like 1 (RELL1)",
                "ROS proto-oncogene 1, receptor tyrosine kinase (ROS1 aka MCF3, ROS, c-ros-1)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "SLIT and NTRK like family member 3 (SLITRK3)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "aarF domain containing kinase 2 (ADCK2 aka AARF)",
                "alpha kinase 1 (ALPK1 aka 8430410J10Rik, LAK, ROSAH)",
                "alpha kinase 2 (ALPK2 aka HAK)",
                "cyclin dependent kinase 3 (CDK3)",
                "cyclin dependent kinase 4 (CDK4 aka CMM3, PSK-J3)",
                "cyclin dependent kinase 6 (CDK6 aka MCPH12, PLSTIRE)",
                "cyclin dependent kinase like 1 (CDKL1 aka KKIALRE, P42)",
                "cyclin dependent kinase like 2 (CDKL2 aka KKIAMRE, P56)",
                "cyclin dependent kinase like 4 (CDKL4)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "fibroblast growth factor 2 (FGF2 aka BFGF, FGF-2, FGFB, HBGF-2)",
                "fibroblast growth factor 3 (FGF3 aka HBGF-3, INT2)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 2 (FGFR2 aka BBDS, BEK, BFR-1, CD332, CEK3, CFD1, ECT1, JWS, K-SAM, KGFR, TK14, TK25)",
                "fibroblast growth factor receptor 3 (FGFR3 aka ACH, CD333, CEK2, HSFGFR3EX, JTK4)",
                "fibroblast growth factor receptor 4 (FGFR4 aka CD334, JTK2, TKF)",
                "fibroblast growth factor receptor like 1 (FGFRL1 aka FGFR-5, FGFR5, FHFR)",
                "granzyme M (GZMM aka LMET1, MET1)",
                "methenyltetrahydrofolate synthetase (MTHFS aka HsT19268, NEDMEHM)",
                "netrin 3 (NTN3 aka NTN2L)",
                "neurotrophic receptor tyrosine kinase 1 (NTRK1 aka MTC, TRK, TRK1, TRKA, Trk-A, p140-TrkA)",
                "neurotrophic receptor tyrosine kinase 2 (NTRK2 aka DEE58, EIEE58, GP145-TrkB, OBHD, TRKB, trk-B)",
                "neurotrophic receptor tyrosine kinase 3 (NTRK3 aka GP145-TrkC, TRKC, gp145(trkC))",
                "nicotinamide riboside kinase 1 (NMRK1 aka C9orf95, NRK1, bA235O14.2)",
                "nicotinamide riboside kinase 2 (NMRK2 aka ITGB1BP3, MIBP, NRK2)",
                "oxidative stress responsive kinase 1 (OXSR1 aka OSR1)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit alpha (PIK3CA aka CCM4, CLAPO, CLOVE, CWS5, HMH, MCAP, MCM, MCMTC, PI3K, PI3K-alpha, p110-alpha)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit beta (PIK3CB aka P110BETA, PI3K, PI3KBETA, PIK3C1)",
                "phosphatidylinositol-4-phosphate 3-kinase catalytic subunit type 2 beta (PIK3C2B aka C2-PI3K)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "receptor tyrosine kinase like orphan receptor 1 (ROR1 aka NTRKR1, dJ537F10.1)",
                "repetin (RPTN)",
                "ret proto-oncogene (RET aka CDHF12, CDHR16, HSCR1, MEN2A, MEN2B, MTC1, PTC-ELE1, RET)",
                "ribosome biogenesis regulator 1 homolog (RRS1)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "unc-51 like kinase 4 (ULK4 aka FAM7C1, REC01035)"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Hemoglobin subunit beta (HBB)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Insulin (INS)",
            "Growth Hormone (GH)",
            "Tumor Protein p53 (TP53)",
            "Epidermal Growth Factor Receptor (EGFR)",
            "Beta-2-Adrenergic Receptor (ADRB2)",
            "Duchenne Muscular Dystrophy gene (DMD)",
            "Huntingtin (HTT)",
            "Amyloid Precursor Protein (APP)",
            "Factor VIII (F8)",
            "Phenylalanine Hydroxylase (PAH)",
            "Albumin (ALB)",
            "Collagen Alpha-1 (COL1A1)",
            "Myoglobin (MYOG)",
            "Actin Beta (ACTB)",
            "Tubulin Alpha (TUBA1A)",
            "Keratin 5 (KRT5)",
            "Fibronectin 1 (FN1)",
            "Interleukin-2 (IL2)",
            "Granzyme B (GZMB)",
            "Peroxisome Proliferator-Activated Receptor Gamma (PPARG)",
            "Thyroid Peroxidase (TPO)",
            "Von Willebrand Factor (VWF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hemoglobin subunit beta (HBB)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Insulin (INS)",
                "Tumor Protein p53 (TP53)",
                "Epidermal Growth Factor Receptor (EGFR)",
                "Beta-2-Adrenergic Receptor (ADRB2)",
                "Huntingtin (HTT)",
                "Amyloid Precursor Protein (APP)",
                "Factor VIII (F8)",
                "Phenylalanine Hydroxylase (PAH)",
                "Albumin (ALB)",
                "Actin Beta (ACTB)",
                "Keratin 5 (KRT5)",
                "Fibronectin 1 (FN1)",
                "Interleukin-2 (IL2)",
                "Granzyme B (GZMB)",
                "Peroxisome Proliferator-Activated Receptor Gamma (PPARG)",
                "Thyroid Peroxidase (TPO)",
                "Von Willebrand Factor (VWF)"
            ],
            "mismatches": [
                "Growth Hormone (GH)",
                "Duchenne Muscular Dystrophy gene (DMD)",
                "Collagen Alpha-1 (COL1A1)",
                "Myoglobin (MYOG)",
                "Tubulin Alpha (TUBA1A)"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "DM1 locus, WD repeat containing (DMWD aka D19S593E, DMR-N9, DMRN9, gene59)",
                "PPARG coactivator 1 beta (PPARGC1B aka ERRL1, PERC, PGC-1(beta), PGC1B)",
                "actin beta (ACTB aka BKRNS, BNS, BRWS1, CSMH, DDS1, PS1TP5BP1, THC8)",
                "actin beta like 2 (ACTBL2 aka ACT)",
                "actin related protein 3B (ACTR3B aka ARP11, ARP3BETA)",
                "adrenoceptor beta 1 (ADRB1 aka ADRB1R, B1AR, BETA1AR, FNSS2, RHR)",
                "adrenoceptor beta 2 (ADRB2 aka ADRB2R, ADRBR, ARB2, B2AR, BAR, BETA2AR)",
                "adrenoceptor beta 3 (ADRB3 aka BETA3AR)",
                "afamin (AFM aka ALB2, ALBA, ALF)",
                "albumin (ALB aka FDAHT, HSA, PRO0883, PRO0903, PRO1341)",
                "amyloid beta precursor like protein 1 (APLP1 aka APLP)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor VIII (F8 aka AHF, DXS1253EB, F8C, FVIII, HEMA, THPH13, F8)",
                "coagulation factor VIII associated 1 (F8A1 aka DXS522E, F8A, HAP40)",
                "coagulation factor VIII associated 2 (F8A2 aka HAP40)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collagen type XX alpha 1 chain (COL20A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cytoglobin (CYGB aka HGB, NOD, STAP)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "eosinophil peroxidase (EPX aka EPO, EPP-PEN, EPXD, EPX)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "fibronectin 1 (FN1 aka CIG, ED-B, FINC, FN, FNZ, GFND, GFND2, LETS, MSF, SMDCF)",
                "granzyme A (GZMA aka CTLA3, HFSP)",
                "granzyme B (GZMB aka C11, CCPI, CGL-1, CGL1, CSP-B, CSPB, CTLA1, CTSGL1, HLP, SECT)",
                "granzyme M (GZMM aka LMET1, MET1)",
                "growth hormone 1 (GH1 aka GH, GH-N, GHB5, GHN, IGHD1A, IGHD1B, IGHD2, hGH-N)",
                "growth hormone 2 (GH2 aka GH-V, GHB2, GHL, GHV, hGH-V)",
                "growth hormone receptor (GHR aka GHBP, GHIP)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 2 (IL2 aka IL-2, TCGF, lymphokine)",
                "interleukin 25 (IL25 aka IL17E)",
                "interleukin 5 (IL5 aka EDF, IL-5, TRF)",
                "keratin 35 (KRT35 aka HA5, Ha-5, K35, KRTHA5, hHa5)",
                "keratin 5 (KRT5 aka CK5, DDD, DDD1, EBS1, EBS2, EBS2A, EBS2B, EBS2C, EBS2D, EBS2E, EBS2F, K5A, KRT5)",
                "keratin 85 (KRT85 aka ECTD4, HB5, Hb-5, K85, KRTHB5, hHb5)",
                "leucine rich repeat and fibronectin type III domain containing 2 (LRFN2 aka FIGLER2, KIAA1246, SALM1)",
                "leucine rich repeat and fibronectin type III domain containing 3 (LRFN3 aka FIGLER1, SALM4)",
                "myoglobin (MB aka MYOSB, PVALB)",
                "myosin X (MYO10 aka MyoX)",
                "parvalbumin (PVALB aka D22S749)",
                "peroxisome proliferator activated receptor alpha (PPARA aka NR1C1, PPAR, PPAR-alpha, PPARalpha, hPPAR)",
                "peroxisome proliferator activated receptor gamma (PPARG aka CIMT1, FPLD3, GLM1, NR1C31, PPARG2, PPARG5, PPARgamma, PPARG)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "pyridoxamine 5'-phosphate oxidase (PNPO aka HEL-S-302, PDXPO)",
                "thyroid peroxidase (TPO aka MSA, TDH2A, TPX)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tubulin alpha 1b (TUBA1B aka K-ALPHA-1)",
                "tubulin alpha 1c (TUBA1C aka TUBA6, bcm948)",
                "tubulin alpha 4a (TUBA4A aka ALS22, H2-ALPHA, TUBA1)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)",
                "von Willebrand factor (VWF aka F8VWF, VWD)",
                "von Willebrand factor A domain containing 5B1 (VWA5B1)",
                "von Willebrand factor A domain containing 5B2 (VWA5B2)"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (Breast Cancer Type 1 Susceptibility Protein)",
            "TP53 (Tumor Protein p53)",
            "EGFR (Epidermal Growth Factor Receptor)",
            "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
            "HBB (Hemoglobin Subunit Beta)",
            "APOE (Apolipoprotein E)",
            "FMR1 (Fragile X Mental Retardation 1)",
            "HTT (Huntingtin)",
            "G6PD (Glucose-6-Phosphate Dehydrogenase)",
            "MTHFR (Methylenetetrahydrofolate Reductase)",
            "ACE (Angiotensin I Converting Enzyme)",
            "INS (Insulin)",
            "PAH (Phenylalanine Hydroxylase)",
            "VHL (Von Hippel-Lindau Tumor Suppressor)",
            "DMD (Dystrophin)",
            "TTR (Transthyretin)",
            "COL1A1 (Collagen Type I Alpha 1 Chain)",
            "F8 (Coagulation Factor VIII)",
            "SMN1 (Survival Motor Neuron 1)",
            "RB1 (Retinoblastoma 1)",
            "ALB (Albumin)",
            "MYH7 (Myosin Heavy Chain 7)",
            "LDLR (Low Density Lipoprotein Receptor)",
            "SOD1 (Superoxide Dismutase 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "CFTR",
                "HBB",
                "APOE",
                "HTT",
                "G6PD",
                "MTHFR",
                "ACE",
                "INS",
                "PAH",
                "VHL",
                "DMD",
                "TTR",
                "COL1A1",
                "F8",
                "SMN1",
                "RB1",
                "ALB",
                "MYH7",
                "LDLR",
                "SOD1"
            ],
            "mismatches": [
                "BRCA1",
                "FMR1"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FMR1 autosomal homolog 1 (FXR1 aka CMYO9A, CMYO9B, CMYP9A, CMYP9BP, MYOPMIL, MYORIBF, FXR1)",
                "FMR1 autosomal homolog 2 (FXR2 aka FMR1L2P, FXR2)",
                "Fas binding factor 1 (FBF1 aka Alb, FBF-1)",
                "RB transcriptional corepressor 1 (RB1 aka OSRC, PPP1R130, RB, p105-Rb, p110-RB1, pRb, pp110)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "VHL binding protein 1 (VBP1 aka HIBBJ46, PFD3, PFDN3, VBP-1)",
                "VHL like (VHLL aka VHLP, VLP)",
                "afamin (AFM aka ALB2, ALBA, ALF)",
                "albumin (ALB aka FDAHT, HSA, PRO0883, PRO0903, PRO1341)",
                "angiotensin I converting enzyme (ACE aka ACE1, CD143, DCP, DCP1)",
                "angiotensin converting enzyme 2 (ACE2 aka ACEH)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor VIII (F8 aka AHF, DXS1253EB, F8C, FVIII, HEMA, THPH13, F8)",
                "coagulation factor VIII associated 1 (F8A1 aka DXS522E, F8A, HAP40)",
                "coagulation factor VIII associated 2 (F8A2 aka HAP40)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type II alpha 1 chain (COL2A1 aka ANFH, AOM, COL11A3, SEDC, STL1)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "endothelin converting enzyme 1 (ECE1 aka ECE)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "fragile X messenger ribonucleoprotein 1 (FMR1 aka FMRP, FRAXA, POF, POF1)",
                "glucose-6-phosphate dehydrogenase (G6PD aka CNSHA11, G6PD)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "hexose-6-phosphate dehydrogenase/glucose 1-dehydrogenase (H6PD aka CORTRD1, G6PDH, GDHH, H6PD)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "low density lipoprotein receptor (LDLR aka FH, FHC, FHCL1, LDLCQ2)",
                "low density lipoprotein receptor class A domain containing 1 (LDLRAD1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "myosin heavy chain 1 (MYH1 aka HEL71, MYHSA1, MYHa, MyHC-2X/D, MyHC-2x)",
                "myosin heavy chain 7 (MYH7 aka CMD1S, CMH1, CMYO7A, CMYO7B, CMYP7A, CMYP7B, MPD1, MYHCB, SPMD, SPMM)",
                "myosin heavy chain 8 (MYH8 aka DA7, MyHC-peri, MyHC-pn, gtMHC-F)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "phosphogluconate dehydrogenase (PGD aka 6PGD)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "survival motor neuron domain containing 1 (SMNDC1 aka SMNR, SPF30, TDRD16C)",
                "survival of motor neuron 1, telomeric (SMN1 aka BCD541, GEMIN1, SMA, SMA1, SMA2, SMA3, SMA4, SMA@, SMN, SMNT, T-BCD541, TDRD16A)",
                "survival of motor neuron 2, centromeric (SMN2 aka BCD541, C-BCD541, GEMIN1, SMNC, TDRD16B)",
                "tetratricopeptide repeat domain 1 (TTC1 aka TPR1)",
                "thyrotropin releasing hormone receptor (TRHR aka CHNG7, TRH-R)",
                "transthyretin (TTR aka ATTR, CTS, CTS1, HEL111, HsT2651, PALB, TBPA, TTN)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)",
                "very low density lipoprotein receptor (VLDLR aka CAMRQ1, CARMQ1, CHRMQ1, VLDL-RCH, VLDLR)",
                "von Hippel-Lindau tumor suppressor (VHL aka HRCA1, RCA11, pVHL, VHL)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "TP53 (TP53)",
            "BRCA1 (BRCA1)",
            "EGFR (EGFR)",
            "MYC (MYC)",
            "KRAS (KRAS)",
            "VEGFA (VEGFA)",
            "PTEN (PTEN)",
            "APOE (APOE)",
            "IL6 (IL6)",
            "TNF (TNF)",
            "CASP3 (CASP3)",
            "BRAF (BRAF)",
            "CDKN2A (CDKN2A)",
            "PGR (PGR)",
            "SOD1 (SOD1)",
            "CFTR (CFTR)",
            "HBB (HBB)",
            "TPP1 (TPP1)",
            "FBN1 (FBN1)",
            "G6PD (G6PD)",
            "NTRK1 (NTRK1)",
            "HLA-DRB1 (HLA-DRB1)",
            "MTHFR (MTHFR)",
            "SLC6A4 (SLC6A4)",
            "RHO (RHO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "MYC",
                "KRAS",
                "VEGFA",
                "PTEN",
                "APOE",
                "IL6",
                "TNF",
                "CASP3",
                "BRAF",
                "PGR",
                "SOD1",
                "CFTR",
                "HBB",
                "TPP1",
                "G6PD",
                "NTRK1",
                "HLA-DRB1",
                "MTHFR",
                "SLC6A4"
            ],
            "mismatches": [
                "BRCA1",
                "CDKN2A",
                "FBN1",
                "RHO"
            ],
            "true_referents": [
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CDKN2A interacting protein (CDKN2AIP)",
                "CDKN2A interacting protein N-terminal like (CDKN2AIPNL aka C2AIL)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "G protein-coupled receptor 142 (GPR142 aka GPRg1b, PGR2)",
                "G protein-coupled receptor 153 (GPR153 aka PGR1)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "TNF superfamily member 10 (TNFSF10 aka APO2L, Apo-2L, CD253, TANCR, TL2, TNLG6A, TRAIL)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "caspase 3 (CASP3 aka CPP32, CPP32B, SCA-1)",
                "caspase 5 (CASP5 aka ICE(rel)III, ICEREL-III, ICH-3)",
                "caspase 6 (CASP6 aka CSP-6, MCH2, caspase-6)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "fibrillin 3 (FBN3)",
                "glucose-6-phosphate dehydrogenase (G6PD aka CNSHA11, G6PD)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hexose-6-phosphate dehydrogenase/glucose 1-dehydrogenase (H6PD aka CORTRD1, G6PDH, GDHH, H6PD)",
                "inhibin subunit beta B (INHBB)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "major histocompatibility complex, class I, B (HLA-B aka AS, B-4901, HLAB)",
                "major histocompatibility complex, class II, DR alpha (HLA-DRA aka HLA-DRA1)",
                "major histocompatibility complex, class II, DR beta 1 (HLA-DRB1 aka DRB1, HLA-DR1B, HLA-DRB, SS1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "neurotrophic receptor tyrosine kinase 1 (NTRK1 aka MTC, TRK, TRK1, TRKA, Trk-A, p140-TrkA)",
                "nicotinamide riboside kinase 1 (NMRK1 aka C9orf95, NRK1, bA235O14.2)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "phosphogluconate dehydrogenase (PGD aka 6PGD)",
                "plexin B1 (PLXNB1 aka PLEXIN-B1, PLXN5, SEP)",
                "progesterone receptor (PGR aka NR3C3, PR)",
                "proline rich and Gla domain 1 (PRRG1 aka PRGP1)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "receptor tyrosine kinase like orphan receptor 1 (ROR1 aka NTRKR1, dJ537F10.1)",
                "solute carrier family 1 member 6 (SLC1A6 aka EAAT4)",
                "solute carrier family 2 member 4 (SLC2A4 aka GLUT4)",
                "solute carrier family 6 member 4 (SLC6A4 aka 5-HTT, 5-HTTLPR, 5HTT, HTT, OCD1, SERT, SERT1, hSERT)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "tripeptidyl peptidase 1 (TPP1 aka CLN2, GIG1, LPIC, SCAR7, TPP-1)",
                "tripeptidyl peptidase 2 (TPP2 aka IMD78, TPP-2, TPP-II, TPPII)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "ubinuclein 1 (UBN1 aka VT, VT4)",
                "ubiquitin B (UBB aka HEL-S-50)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor D (VEGFD aka FIGF, VEGF-D)"
            ],
            "TP": 21,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "BRCA2 (BRCA2)",
            "TP53 (TP53)",
            "EGFR (EGFR)",
            "HER2 (HER2)",
            "CFTR (CFTR)",
            "APC (APC)",
            "MYC (MYC)",
            "PTEN (PTEN)",
            "RB1 (RB1)",
            "KRAS (KRAS)",
            "PIK3CA (PIK3CA)",
            "AKT1 (AKT1)",
            "VHL (VHL)",
            "MDM2 (MDM2)",
            "CDKN2A (CDKN2A)",
            "BCL2 (BCL2)",
            "FLT3 (FLT3)",
            "KIT (KIT)",
            "MYB (MYB)",
            "NOTCH1 (NOTCH1)",
            "ABL1 (ABL1)",
            "JAK2 (JAK2)",
            "RET (RET)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA2 (BRCA2)",
                "TP53 (TP53)",
                "EGFR (EGFR)",
                "CFTR (CFTR)",
                "MYC (MYC)",
                "PTEN (PTEN)",
                "RB1 (RB1)",
                "KRAS (KRAS)",
                "PIK3CA (PIK3CA)",
                "AKT1 (AKT1)",
                "MDM2 (MDM2)",
                "FLT3 (FLT3)",
                "KIT (KIT)",
                "MYB (MYB)",
                "NOTCH1 (NOTCH1)",
                "RET (RET)"
            ],
            "mismatches": [
                "BRCA1 (BRCA1)",
                "HER2 (HER2)",
                "APC (APC)",
                "VHL (VHL)",
                "CDKN2A (CDKN2A)",
                "BCL2 (BCL2)",
                "ABL1 (ABL1)",
                "JAK2 (JAK2)"
            ],
            "true_referents": [
                "ABL proto-oncogene 1, non-receptor tyrosine kinase (ABL1 aka ABL, BCR-ABL, CHDSKM, JTK7, bcr/abl, c-ABL, c-ABL1, p150, v-abl)",
                "ABL proto-oncogene 2, non-receptor tyrosine kinase (ABL2 aka ABLL, ARG)",
                "AKT serine/threonine kinase 1 (AKT1 aka AKT, PKB, PKB-ALPHA, PRKBA, RAC, RAC-ALPHA)",
                "AKT serine/threonine kinase 2 (AKT2 aka HIHGHH, PKBB, PKBBETA, PRKBB, RAC-BETA)",
                "AKT serine/threonine kinase 3 (AKT3 aka MPPH, MPPH2, PKB-GAMMA, PKBG, PRKBG, RAC-PK-gamma, RAC-gamma, STK-2)",
                "APC down-regulated 1 like (APCDD1L)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BCL2 like 10 (BCL2L10 aka BCL-B, Boo, Diva, bcl2-L-10)",
                "BCL2 like 11 (BCL2L11 aka BAM, BIM, BOD)",
                "BCL2 like 12 (BCL2L12)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CDKN2A interacting protein (CDKN2AIP)",
                "CDKN2A interacting protein N-terminal like (CDKN2AIPNL aka C2AIL)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FLT3 interacting zinc finger 1 (FIZ1 aka ZNF798)",
                "Janus kinase 1 (JAK1 aka AIIDEA, JAK1B, JTK3, JAK1)",
                "Janus kinase 2 (JAK2 aka JTK10)",
                "Janus kinase 3 (JAK3 aka JAK-3_HUMAN, JAKL, L-JAK, LJAK, JAK3)",
                "KIT proto-oncogene, receptor tyrosine kinase (KIT aka C-Kit, CD117, MASTC, PBT, SCFR)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MDM2 binding protein (MTBP aka MDM2BP)",
                "MDM2 proto-oncogene (MDM2 aka ACTFS, HDMX, LSKB, hdm2)",
                "MDM4 regulator of p53 (MDM4 aka BMFS6, HDMX, MDMX, MRP1)",
                "MYB proto-oncogene, transcription factor (MYB aka Cmyb, c-myb, c-myb_CDS, efg)",
                "MYC binding protein (MYCBP aka AMY-1)",
                "MYC proto-oncogene, bHLH transcription factor (MYC aka MRTLC, bHLHe39, c-Myc, MYC)",
                "MYC target 1 (MYCT1 aka MTLC)",
                "Myb/SANT DNA binding domain containing 7 (MSANTD7)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "RB transcriptional corepressor 1 (RB1 aka OSRC, PPP1R130, RB, p105-Rb, p110-RB1, pRb, pp110)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "RELT like 1 (RELL1)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "VHL binding protein 1 (VBP1 aka HIBBJ46, PFD3, PFDN3, VBP-1)",
                "VHL like (VHLL aka VHLP, VLP)",
                "abl interactor 1 (ABI1 aka ABI-1, ABLBP4, E3B1, NAP1BP, SSH3BP, SSH3BP1)",
                "anaphase promoting complex subunit 2 (ANAPC2 aka APC2)",
                "anaphase promoting complex subunit 5 (ANAPC5 aka APC5)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "delta like canonical Notch ligand 1 (DLL1 aka DELTA1, DL1, Delta, NEDBAS)",
                "delta like non-canonical Notch ligand 1 (DLK1 aka DLK, DLK-1, Delta1, FA1, PREF1, Pref-1, ZOG, pG2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "fms related receptor tyrosine kinase 3 (FLT3 aka CD135, FLK-2, FLK2, STK1)",
                "fms related receptor tyrosine kinase 3 ligand (FLT3LG aka FL, FLG3L, FLT3L, IMD125)",
                "high density lipoprotein binding protein (HDLBP aka HBP, PRO2900, VGL)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "notch receptor 1 (NOTCH1 aka AOS5, AOVD1, TAN1, hN1)",
                "paired box 4 (PAX4 aka KPD, MODY9)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit alpha (PIK3CA aka CCM4, CLAPO, CLOVE, CWS5, HMH, MCAP, MCM, MCMTC, PI3K, PI3K-alpha, p110-alpha)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit beta (PIK3CB aka P110BETA, PI3K, PI3KBETA, PIK3C1)",
                "phosphatidylinositol-4-phosphate 3-kinase catalytic subunit type 2 beta (PIK3C2B aka C2-PI3K)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "repetin (RPTN)",
                "ret proto-oncogene (RET aka CDHF12, CDHR16, HSCR1, MEN2A, MEN2B, MTC1, PTC-ELE1, RET)",
                "target of myb1 membrane trafficking protein (TOM1 aka IMD85)",
                "tektin 4 (TEKT4)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1",
            "TP53",
            "EGFR",
            "CFTR",
            "ACTA1",
            "MYH7",
            "INS",
            "APOE",
            "HBB",
            "PTEN",
            "KRAS",
            "LMNA",
            "CDH1",
            "SMN1",
            "FGFR3",
            "GJB2",
            "COL1A1",
            "DMD",
            "FMR1",
            "HTT",
            "SMAD4",
            "MTHFR",
            "BRCA2",
            "CYP2D6"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "EGFR",
                "CFTR",
                "APOE",
                "HBB",
                "PTEN",
                "KRAS",
                "CDH1",
                "FGFR3",
                "COL1A1",
                "DMD",
                "SMAD4",
                "MTHFR",
                "BRCA2",
                "CYP2D6"
            ],
            "mismatches": [
                "BRCA1",
                "ACTA1",
                "MYH7",
                "INS",
                "LMNA",
                "SMN1",
                "GJB2",
                "FMR1",
                "HTT"
            ],
            "true_referents": [
                "5-methyltetrahydrofolate-homocysteine methyltransferase reductase (MTRR aka MSR, cblE)",
                "ATP binding cassette subfamily F member 3 (ABCF3 aka EST201864)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FMR1 autosomal homolog 1 (FXR1 aka CMYO9A, CMYO9B, CMYP9A, CMYP9BP, MYOPMIL, MYORIBF, FXR1)",
                "FMR1 autosomal homolog 2 (FXR2 aka FMR1L2P, FXR2)",
                "FMR1 neighbor (FMR1NB aka CT37, NY-SAR-35, NYSAR35)",
                "G protein subunit alpha 12 (GNA12 aka HG1M1, NNX3, RMP, gep)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "SMAD family member 1 (SMAD1 aka BSP-1, BSP1, JV4-1, JV41, MADH1, MADR1)",
                "SMAD family member 4 (SMAD4 aka DPC4, JIP, MADH4, MYHRS)",
                "SMAD family member 6 (SMAD6 aka AOVD2, HsT17432, MADH6, MADH7)",
                "TP53 regulated inhibitor of apoptosis 1 (TRIAP1 aka HSPC132, MDM35, P53CSV, WF-1)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "actin gamma 1 (ACTG1 aka ACT, ACTG, DFNA20, DFNA26, HEL-176)",
                "actin related protein 1A (ACTR1A aka ARP1, Arp1A, CTRN1)",
                "actin related protein T1 (ACTRT1 aka AIP1, ARIP1, ARPT1, HSD27)",
                "apolipoprotein A1 (APOA1 aka AMYLD3, HPALP2, apo(a))",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "cadherin 1 (CDH1 aka Arc-1, BCDS1, CD324, CDHE, ECAD, LCAM, UVO)",
                "cadherin 7 (CDH7 aka CDH7L1)",
                "cadherin 9 (CDH9)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collagen type XXI alpha 1 chain (COL21A1 aka COLA1L, FP633)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cytochrome P450 2D6 (LOC107987479 aka CYP2D6)",
                "cytochrome P450 family 2 subfamily A member 6 (CYP2A6 aka CPA6, CYP2A, CYP2A3, CYPIIA6, P450C2A, P450PB)",
                "cytochrome P450 family 2 subfamily R member 1 (CYP2R1)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dymeclin (DYM aka DMC, SMC)",
                "dynamin 3 (DNM3 aka Dyna III)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "fibroblast growth factor 3 (FGF3 aka HBGF-3, INT2)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 3 (FGFR3 aka ACH, CD333, CEK2, HSFGFR3EX, JTK4)",
                "fibroblast growth factor receptor like 1 (FGFRL1 aka FGFR-5, FGFR5, FHFR)",
                "formin 1 (FMN1 aka FMN, LD)",
                "gap junction protein beta 1 (GJB1 aka CMTX, CMTX1, CX32)",
                "gap junction protein beta 5 (GJB5 aka CX31.1)",
                "glutathione S-transferase theta 1 (GSTT1)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hepatocellular carcinoma associated transcript 5 (HCCAT5 aka FJ222407, HTA)",
                "high density lipoprotein binding protein (HDLBP aka HBP, PRO2900, VGL)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "importin 9 (IPO9 aka Imp9)",
                "inhibin subunit beta B (INHBB)",
                "maestro heat like repeat family member 1 (MROH1 aka HEATR7A)",
                "melan-A (MLANA aka MART-1, MART1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "myeloid cell nuclear differentiation antigen (MNDA aka PYHIN3)",
                "myosin heavy chain 7B (MYH7B aka MHC14, MYH14, lncMYH7b)",
                "myosin heavy chain 8 (MYH8 aka DA7, MyHC-peri, MyHC-pn, gtMHC-F)",
                "netrin 1 (NTN1 aka MRMV4, NET1L, NTN1)",
                "ninein (NIN aka SCKL7)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "secernin 1 (SCRN1 aka SES1)",
                "septin 11 (SEPTIN11 aka SEPT11, Septin-11)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "ubiquitin conjugating enzyme E2 J2 (UBE2J2 aka NCUBE-2, NCUBE2, PRO2121, UBC6)"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Tumor protein p53 (TP53)",
            "Breast cancer type 1 susceptibility protein (BRCA1)",
            "BRCA2 DNA repair associated (BRCA2)",
            "Epidermal growth factor receptor (EGFR)",
            "Insulin receptor (INSR)",
            "Signal transducer and activator of transcription 3 (STAT3)",
            "Vascular endothelial growth factor A (VEGFA)",
            "Cyclin dependent kinase 2 (CDK2)",
            "B-cell lymphoma 2 (BCL2)",
            "Nuclear factor kappa B subunit 1 (NFKB1)",
            "Mitogen-activated protein kinase kinase 1 (MAP2K1)",
            "Phosphoinositide-3-kinase catalytic subunit alpha (PIK3CA)",
            "Retinoblastoma protein (RB1)",
            "Hepatocyte growth factor receptor (MET)",
            "Janus kinase 2 (JAK2)",
            "Ras oncogene homolog (HRAS)",
            "Neurotrophic tyrosine kinase receptor type 2 (NTRK2)",
            "Phosphatase and tensin homolog (PTEN)",
            "Cyclin D1 (CCND1)",
            "Proto-oncogene tyrosine-protein kinase (ABL1)",
            "Fibroblast growth factor receptor 3 (FGFR3)",
            "KIT proto-oncogene receptor tyrosine kinase (KIT)",
            "Anaplastic lymphoma kinase (ALK)",
            "Nuclear receptor subfamily 3 group C member 1 (NR3C1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tumor protein p53 (TP53)",
                "BRCA2 DNA repair associated (BRCA2)",
                "Epidermal growth factor receptor (EGFR)",
                "Insulin receptor (INSR)",
                "Signal transducer and activator of transcription 3 (STAT3)",
                "Vascular endothelial growth factor A (VEGFA)",
                "Cyclin dependent kinase 2 (CDK2)",
                "Nuclear factor kappa B subunit 1 (NFKB1)",
                "Mitogen-activated protein kinase kinase 1 (MAP2K1)",
                "Phosphatase and tensin homolog (PTEN)",
                "Cyclin D1 (CCND1)",
                "Janus kinase 2 (JAK2)",
                "Neurotrophic receptor tyrosine kinase 2 (NTRK2)",
                "Fibroblast growth factor receptor 3 (FGFR3)",
                "KIT proto-oncogene, receptor tyrosine kinase (KIT)",
                "Anaplastic lymphoma kinase (ALK)",
                "Nuclear receptor subfamily 3 group C member 1 (NR3C1)"
            ],
            "mismatches": [
                "Breast cancer type 1 susceptibility protein (BRCA1)",
                "B-cell lymphoma 2 (BCL2)",
                "Retinoblastoma protein (RB1)",
                "Hepatocyte growth factor receptor (MET)",
                "Ras oncogene homolog (HRAS)",
                "Proto-oncogene tyrosine-protein kinase (ABL1)"
            ],
            "true_referents": [
                "ABL proto-oncogene 1, non-receptor tyrosine kinase (ABL1 aka ABL, BCR-ABL, CHDSKM, JTK7, bcr/abl, c-ABL, c-ABL1, p150, v-abl)",
                "ABL proto-oncogene 2, non-receptor tyrosine kinase (ABL2 aka ABLL, ARG)",
                "ALK receptor tyrosine kinase (ALK aka ALK1, CD246, NBLST3)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BCL2 like 10 (BCL2L10 aka BCL-B, Boo, Diva, bcl2-L-10)",
                "BCL2 like 11 (BCL2L11 aka BAM, BIM, BOD)",
                "BCL2 like 12 (BCL2L12)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "ES cell expressed Ras (ERAS aka HRAS2, HRASP)",
                "HRas proto-oncogene, GTPase (HRAS aka C-BAS/HAS, C-H-RAS, C-HA-RAS1, CTLO, H-RASIDX, HAMSV1, RASH1, p21ras, HRAS)",
                "Janus kinase 1 (JAK1 aka AIIDEA, JAK1B, JTK3, JAK1)",
                "Janus kinase 2 (JAK2 aka JTK10)",
                "Janus kinase 3 (JAK3 aka JAK-3_HUMAN, JAKL, L-JAK, LJAK, JAK3)",
                "KIT ligand (KITLG aka DCUA, DFNA69, FPH2, FPHH, KL-1, Kitl, MGF, SCF, SF, SHEP7, SLF, WS2F)",
                "KIT proto-oncogene, receptor tyrosine kinase (KIT aka C-Kit, CD117, MASTC, PBT, SCFR)",
                "MET proto-oncogene, receptor tyrosine kinase (MET aka AUTS9, DA11, DFNB97, HGFR, RCCP2, c-Met)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "abl interactor 1 (ABI1 aka ABI-1, ABLBP4, E3B1, NAP1BP, SSH3BP, SSH3BP1)",
                "alpha kinase 1 (ALPK1 aka 8430410J10Rik, LAK, ROSAH)",
                "alpha kinase 2 (ALPK2 aka HAK)",
                "cyclin D1 (CCND1 aka BCL1, D11S287E, PRAD1, U21B31)",
                "cyclin D2 (CCND2 aka KIAK0002, MPPH3)",
                "cyclin D3 (CCND3)",
                "cyclin dependent kinase 1 (CDK1 aka CDC2, CDC28A, P34CDC2)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "cyclin dependent kinase 3 (CDK3)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 3 (FGFR3 aka ACH, CD333, CEK2, HSFGFR3EX, JTK4)",
                "fibroblast growth factor receptor like 1 (FGFRL1 aka FGFR-5, FGFR5, FHFR)",
                "hepatocyte growth factor (HGF aka DFNB39, F-TCFB, HPTA, SF, HGF)",
                "hepatocyte growth factor-regulated tyrosine kinase substrate (HGS aka HRS)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "insulin receptor related receptor (INSRR aka IRR)",
                "insulin receptor substrate 1 (IRS1 aka HIRS-1)",
                "mitogen-activated protein kinase 1 (MAPK1 aka ERK, ERK-2, ERK2, ERT1, MAPK2, NS13, P42MAPK, PRKM1, PRKM2, p38, p40, p41, p41mapk, p42-MAPK)",
                "mitogen-activated protein kinase kinase 1 (MAP2K1 aka CFC3, MAPKK1, MEK1, MEL, MKK1, PRKMK1)",
                "mitogen-activated protein kinase kinase kinase 1 (MAP3K1 aka MAPKKK1, MEKK, MEKK 1, MEKK1, SRXY6)",
                "neurotrophic receptor tyrosine kinase 1 (NTRK1 aka MTC, TRK, TRK1, TRKA, Trk-A, p140-TrkA)",
                "neurotrophic receptor tyrosine kinase 2 (NTRK2 aka DEE58, EIEE58, GP145-TrkB, OBHD, TRKB, trk-B)",
                "neurotrophic receptor tyrosine kinase 3 (NTRK3 aka GP145-TrkC, TRKC, gp145(trkC))",
                "nuclear factor kappa B subunit 1 (NFKB1 aka CVID12, EBP-1, KBF1, NF-kB, NF-kB1, NF-kappa-B1, NF-kappaB, NF-kappabeta, NFKB-p105, NFKB-p50, NFkappaB)",
                "nuclear factor kappa B subunit 2 (NFKB2 aka CVID10, H2TF1, LYT-10, LYT10, NF-kB2, p100, p49/p100, p52)",
                "nuclear factor related to kappaB binding protein (NFRKB aka INO80G)",
                "nuclear receptor subfamily 2 group E member 3 (NR2E3 aka ESCS, PNR, RNR, RP37, rd7)",
                "nuclear receptor subfamily 3 group C member 1 (NR3C1 aka GCCR, GCR, GCRST, GR, GRL)",
                "nuclear receptor subfamily 3 group C member 2 (NR3C2 aka MCR, MLR, MRVIT, NR3C2)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit alpha (PIK3CA aka CCM4, CLAPO, CLOVE, CWS5, HMH, MCAP, MCM, MCMTC, PI3K, PI3K-alpha, p110-alpha)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit beta (PIK3CB aka P110BETA, PI3K, PI3KBETA, PIK3C1)",
                "phosphoinositide-3-kinase regulatory subunit 3 (PIK3R3 aka p55, p55-GAMMA, p55PIK)",
                "retinol binding protein 1 (RBP1 aka CRABP-I, CRBP, CRBP1, CRBPI, RBPC, hCRBP1)",
                "signal transducer and activator of transcription 1 (STAT1 aka CANDF7, IMD31A, IMD31B, IMD31C, ISGF-3, STAT91)",
                "signal transducer and activator of transcription 2 (STAT2 aka IMD44, ISGF-3, P113, PTORCH3, STAT113)",
                "signal transducer and activator of transcription 3 (STAT3 aka ADMIO, ADMIO1, APRF, HIES)",
                "transmembrane phosphatase with tensin homology (TPTE aka CT44, PTEN21, TPTE)",
                "transmembrane phosphoinositide 3-phosphatase and tensin homolog 2 (TPTE2 aka TPIP)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (Breast Cancer 1)",
            "TP53 (Tumor Protein 53)",
            "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
            "APOE (Apolipoprotein E)",
            "INS (Insulin)",
            "HBB (Hemoglobin Subunit Beta)",
            "EGFR (Epidermal Growth Factor Receptor)",
            "KRAS (KRAS Proto-Oncogene, GTPase)",
            "PTEN (Phosphatase and Tensin Homolog)",
            "IL6 (Interleukin 6)",
            "TNF (Tumor Necrosis Factor)",
            "APP (Amyloid Beta Precursor Protein)",
            "VEGFA (Vascular Endothelial Growth Factor A)",
            "MTHFR (Methylenetetrahydrofolate Reductase)",
            "ACE (Angiotensin I Converting Enzyme)",
            "BDNF (Brain Derived Neurotrophic Factor)",
            "COL1A1 (Collagen Type I Alpha 1 Chain)",
            "CYP2D6 (Cytochrome P450 Family 2 Subfamily D Member 6)",
            "F8 (Coagulation Factor VIII)",
            "GH1 (Growth Hormone 1)",
            "HMGCR (3-Hydroxy-3-Methylglutaryl-CoA Reductase)",
            "LDLR (Low Density Lipoprotein Receptor)",
            "MAOA (Monoamine Oxidase A)",
            "PAH (Phenylalanine Hydroxylase)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1 (Breast Cancer 1)",
                "TP53 (Tumor Protein 53)",
                "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
                "APOE (Apolipoprotein E)",
                "INS (Insulin)",
                "HBB (Hemoglobin Subunit Beta)",
                "EGFR (Epidermal Growth Factor Receptor)",
                "KRAS (KRAS Proto-Oncogene, GTPase)",
                "PTEN (Phosphatase and Tensin Homolog)",
                "IL6 (Interleukin 6)",
                "TNF (Tumor Necrosis Factor)",
                "APP (Amyloid Beta Precursor Protein)",
                "VEGFA (Vascular Endothelial Growth Factor A)",
                "MTHFR (Methylenetetrahydrofolate Reductase)",
                "ACE (Angiotensin I Converting Enzyme)",
                "BDNF (Brain Derived Neurotrophic Factor)",
                "COL1A1 (Collagen Type I Alpha 1 Chain)",
                "CYP2D6 (Cytochrome P450 Family 2 Subfamily D Member 6)",
                "F8 (Coagulation Factor VIII)",
                "GH1 (Growth Hormone 1)",
                "HMGCR (3-Hydroxy-3-Methylglutaryl-CoA Reductase)",
                "LDLR (Low Density Lipoprotein Receptor)",
                "MAOA (Monoamine Oxidase A)",
                "PAH (Phenylalanine Hydroxylase)"
            ],
            "mismatches": [],
            "true_referents": [
                "3-hydroxy-3-methylglutaryl-CoA lyase (HMGCL aka HL1, HMGCL)",
                "3-hydroxy-3-methylglutaryl-CoA reductase (HMGCR aka LDLCQ3, LGMDR28, MYPLG)",
                "3-hydroxy-3-methylglutaryl-CoA synthase 1 (HMGCS1 aka HMGCS)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "DIRAS family GTPase 2 (DIRAS2 aka Di-Ras2)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "NRAS proto-oncogene, GTPase (NRAS aka ALPS4, CMNS, KRAS, N-ras, NCMS1, NS6, NRAS)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "TNF superfamily member 11 (TNFSF11 aka CD254, ODF, OPGL, OPTB2, RANKL, TNLG6B, TRANCE, hRANKL2, sOdf)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "amyloid beta precursor protein binding protein 2 (APPBP2 aka APP-BP2, HS.84084, PAT1)",
                "angiotensin I converting enzyme (ACE aka ACE1, CD143, DCP, DCP1)",
                "angiotensin converting enzyme 2 (ACE2 aka ACEH)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "brain derived neurotrophic factor (BDNF aka ANON2, BULN2)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor VIII (F8 aka AHF, DXS1253EB, F8C, FVIII, HEMA, THPH13, F8)",
                "coagulation factor VIII associated 1 (F8A1 aka DXS522E, F8A, HAP40)",
                "coagulation factor VIII associated 2 (F8A2 aka HAP40)",
                "collagen type I alpha 1 chain (COL1A1 aka CAFYD, EDSARTH1, EDSC, OI1, OI2, OI3, OI4)",
                "collagen type II alpha 1 chain (COL2A1 aka ANFH, AOM, COL11A3, SEDC, STL1)",
                "collagen type X alpha 1 chain (COL10A1)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "cytochrome P450 2D6 (LOC107987479 aka CYP2D6)",
                "cytochrome P450 family 2 subfamily A member 6 (CYP2A6 aka CPA6, CYP2A, CYP2A3, CYPIIA6, P450C2A, P450PB)",
                "cytochrome P450 family 2 subfamily R member 1 (CYP2R1)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "endothelin converting enzyme 1 (ECE1 aka ECE)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "growth hormone 1 (GH1 aka GH, GH-N, GHB5, GHN, IGHD1A, IGHD1B, IGHD2, hGH-N)",
                "growth hormone 2 (GH2 aka GH-V, GHB2, GHL, GHV, hGH-V)",
                "growth hormone receptor (GHR aka GHBP, GHIP)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "interleukin 13 (IL13 aka IL-13, P600)",
                "interleukin 5 (IL5 aka EDF, IL-5, TRF)",
                "interleukin 6 (IL6 aka BSF-2, BSF2, CDF, HGF, HSF, IFN-beta-2, IFNB2, IL-6)",
                "interleukin 7 (IL7 aka IL-7, IMD130)",
                "low density lipoprotein receptor (LDLR aka FH, FHC, FHCL1, LDLCQ2)",
                "low density lipoprotein receptor class A domain containing 1 (LDLRAD1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "monoamine oxidase A (MAOA aka BRNRS, MAO-A)",
                "monoamine oxidase B (MAOB)",
                "nerve growth factor (NGF aka Beta-NGF, HSAN5B, NGF)",
                "neurotrophin 3 (NTF3 aka HDNF, NGF-2, NGF2, NT-3, NT3)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "polyamine oxidase (PAOX aka PAO)",
                "transmembrane phosphatase with tensin homology (TPTE aka CT44, PTEN21, TPTE)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tumor necrosis factor (TNF aka DIF, IMD127-alpha, TNFA, TNFSF2, TNLG1F, TNF)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)",
                "very low density lipoprotein receptor (VLDLR aka CAMRQ1, CARMQ1, CHRMQ1, VLDL-RCH, VLDLR)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Tumor Protein P53 (TP53)",
            "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
            "Huntingtin (HTT)",
            "Breast Cancer 1 (BRCA1)",
            "Hemoglobin Subunit Beta (HBB)",
            "Apolipoprotein E (APOE)",
            "Dystrophin (DMD)",
            "Amyloid Beta Precursor Protein (APP)",
            "Fibroblast Growth Factor Receptor 2 (FGFR2)",
            "Methylenetetrahydrofolate Reductase (MTHFR)",
            "Parkin RBR E3 Ubiquitin Protein Ligase (PRKN)",
            "Sickle Cell Hemoglobin (HbS)",
            "Adenomatous Polyposis Coli (APC)",
            "Alpha-Synuclein (SNCA)",
            "Neurofibromin 1 (NF1)",
            "Phenylalanine Hydroxylase (PAH)",
            "Retinoblastoma 1 (RB1)",
            "Superoxide Dismutase 1 (SOD1)",
            "PTEN Induced Kinase 1 (PINK1)",
            "Microtubule Associated Protein Tau (MAPT)",
            "Presenilin 1 (PSEN1)",
            "Glucocerebrosidase (GBA)",
            "Coagulation Factor VIII (F8)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "Tumor Protein P53 (TP53)",
                "Cystic Fibrosis Transmembrane Conductance Regulator (CFTR)",
                "Huntingtin (HTT)",
                "Breast Cancer 1 (BRCA1)",
                "Hemoglobin Subunit Beta (HBB)",
                "Apolipoprotein E (APOE)",
                "Dystrophin (DMD)",
                "Amyloid Beta Precursor Protein (APP)",
                "Fibroblast Growth Factor Receptor 2 (FGFR2)",
                "Methylenetetrahydrofolate Reductase (MTHFR)",
                "Parkin RBR E3 Ubiquitin Protein Ligase (PRKN)",
                "Adenomatous Polyposis Coli (APC)",
                "Alpha-Synuclein (SNCA)",
                "Neurofibromin 1 (NF1)",
                "Phenylalanine Hydroxylase (PAH)",
                "Superoxide Dismutase 1 (SOD1)",
                "PTEN Induced Kinase 1 (PINK1)",
                "Microtubule Associated Protein Tau (MAPT)",
                "Presenilin 1 (PSEN1)",
                "Coagulation Factor VIII (F8)"
            ],
            "mismatches": [
                "Sickle Cell Hemoglobin (HbS)",
                "Retinoblastoma 1 (RB1)",
                "Glucocerebrosidase (GBA)"
            ],
            "true_referents": [
                "APC regulator of WNT signaling pathway (APC aka BTPS2, DESMD, DP2, DP2.5, DP3, GS, PPP1R46)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "alpha glucosidase (GAA aka LYAG)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "amyloid beta precursor protein binding protein 2 (APPBP2 aka APP-BP2, HS.84084, PAT1)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor VIII (F8 aka AHF, DXS1253EB, F8C, FVIII, HEMA, THPH13, F8)",
                "coagulation factor VIII associated 1 (F8A1 aka DXS522E, F8A, HAP40)",
                "coagulation factor VIII associated 2 (F8A2 aka HAP40)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "colorectal cancer associated 1 (COLCA1 aka C11orf92, CASC12, LOH11CR1F)",
                "colorectal neoplasia differentially expressed (CRNDE aka CRNDEP, LINC00180, NCRNA00180, PNAS-108, lincIRX5)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "dystrophin (DMD aka BMD, CMD3B, DXS142, DXS164, DXS206, DXS230, DXS239, DXS268, DXS269, DXS270, DXS272, MRX85)",
                "dystrophin related protein 2 (DRP2 aka DRP-2)",
                "fibroblast growth factor 2 (FGF2 aka BFGF, FGF-2, FGFB, HBGF-2)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 2 (FGFR2 aka BBDS, BEK, BFR-1, CD332, CEK3, CFD1, ECT1, JWS, K-SAM, KGFR, TK14, TK25)",
                "glucosylceramidase beta 1 (GBA1 aka GBA, GCB, GLUC)",
                "glucosylceramidase beta 2 (GBA2 aka AD035, NLGase, SPG46)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "insulin (INS aka IDDM, IDDM1, IDDM2, ILPR, IRDN, MODY10, PNDM4)",
                "insulin degrading enzyme (IDE aka INSULYSIN)",
                "insulin receptor (INSR aka CD220, HHF5)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "microtubule associated protein 2 (MAP2 aka MAP-2A, MAP2B, MAP2C, MAP2)",
                "microtubule associated protein 4 (MAP4)",
                "microtubule associated protein tau (MAPT aka DDPAC, FTD1, FTDP-17L, MSTD, MTBT1, MTBT2, PPND, PPP1R103, TAU, Tau-PHF6, tau-40, MAPT)",
                "myotrophin (MTPN aka GCDP, V-1)",
                "neural retina leucine zipper (NRL aka D14S46E-MAF, RP27, NRL)",
                "neurofibromin 1 (NF1 aka NFNS, VRNF, WSS)",
                "neurofilament light chain (NEFL aka CMT1F, CMT2E, CMTDIG, NF-L, NF68, NFL, PPP1R110)",
                "neurofilament medium chain (NEFM aka NEF3, NF-M, NFM)",
                "parkin RBR E3 ubiquitin protein ligase (PRKN aka AR-JP, LPRS2, PARK2, PDJ)",
                "parkin coregulated (PACRG aka BUG21, GLUP, HAK0057712.1, PARK2CRG, pf12, PACRG)",
                "phenylalanine hydroxylase (PAH aka PH, PKU, PKU1)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "praja ring finger ubiquitin ligase 2 (PJA2 aka Neurodap1, RNF131)",
                "presenilin 1 (PSEN1 aka ACNINV3, AD3, CMD1U, FAD, PS-1, PS1, PSNL1, S182)",
                "presenilin 2 (PSEN2 aka AD3L, AD4, CMD1V, PS2, STM2)",
                "presenilin enhancer, gamma-secretase subunit (PSENEN aka ACNINV2, MDS033, MSTP064, PEN-2, PEN2)",
                "protein tyrosine phosphatase receptor type K (PTPRK aka R-PTP-kappa)",
                "retinal outer segment membrane protein 1 (ROM1 aka ROM, ROSP1, RP7, TSPAN23)",
                "retinoschisin 1 (RS1 aka RS, XLRS1)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "synuclein alpha (SNCA aka NACP, PARK1, PARK4, PD1)",
                "synuclein beta (SNCB)",
                "synuclein gamma (SNCG aka BCSG1, SR)",
                "tryptophan hydroxylase 1 (TPH1 aka TPRH, TRPH)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "tyrosine hydroxylase (TH aka DYT14, DYT5b, TYH)"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 gene (BRCA1)",
            "TP53 gene (TP53)",
            "EGFR gene (EGFR)",
            "CFTR gene (CFTR)",
            "HBB gene (HBB)",
            "APOE gene (APOE)",
            "MTHFR gene (MTHFR)",
            "FTO gene (FTO)",
            "LDLR gene (LDLR)",
            "VEGFA gene (VEGFA)",
            "TERT gene (TERT)",
            "HFE gene (HFE)",
            "PTEN gene (PTEN)",
            "KRAS gene (KRAS)",
            "BRAF gene (BRAF)",
            "MTOR gene (MTOR)",
            "FOXP2 gene (FOXP2)",
            "GJB2 gene (GJB2)",
            "HTT gene (HTT)",
            "LRRK2 gene (LRRK2)",
            "SNCA gene (SNCA)",
            "APP gene (APP)",
            "MAPT gene (MAPT)",
            "SOD1 gene (SOD1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1 gene (BRCA1)",
                "TP53 gene (TP53)",
                "EGFR gene (EGFR)",
                "CFTR gene (CFTR)",
                "HBB gene (HBB)",
                "APOE gene (APOE)",
                "MTHFR gene (MTHFR)",
                "FTO gene (FTO)",
                "LDLR gene (LDLR)",
                "VEGFA gene (VEGFA)",
                "TERT gene (TERT)",
                "HFE gene (HFE)",
                "PTEN gene (PTEN)",
                "KRAS gene (KRAS)",
                "BRAF gene (BRAF)",
                "LRRK2 gene (LRRK2)",
                "SNCA gene (SNCA)",
                "SOD1 gene (SOD1)"
            ],
            "mismatches": [
                "MTOR gene (MTOR)",
                "FOXP2 gene (FOXP2)",
                "GJB2 gene (GJB2)",
                "HTT gene (HTT)",
                "APP gene (APP)",
                "MAPT gene (MAPT)"
            ],
            "true_referents": [
                "A-Raf proto-oncogene, serine/threonine kinase (ARAF aka A-RAF1, PKS2, RAFA1, ARAF)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "F-box and WD repeat domain containing 12 (FBXW12 aka FBW12, FBXO12, FBXO35)",
                "FTO alpha-ketoglutarate dependent dioxygenase (FTO aka ALKBH9, BMIQ14, GDFD, IFEX9)",
                "GIT ArfGAP 1 (GIT1 aka p95-APP1)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MAPT intronic transcript 1 (MAPT-IT1)",
                "MTOR associated protein, eak-7 homolog (MEAK7 aka EAK7, KIAA1609, TLDC1, mEAK-7)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAP2C, member of RAS oncogene family (RAP2C)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RPTOR independent companion of MTOR complex 2 (RICTOR aka AVO3, PIA, hAVO3)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "adaptor protein, phosphotyrosine interacting with PH domain and leucine zipper 1 (APPL1 aka APPL, DIP13alpha, MODY14)",
                "adaptor protein, phosphotyrosine interacting with PH domain and leucine zipper 2 (APPL2 aka DIP13B)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "chondrosarcoma associated gene 1 (CSAG1 aka CSAGE, CT24.1)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "folate receptor alpha (FOLR1 aka FBP, FOLR, FRalpha, NCFTD)",
                "forkhead box P1 (FOXP1 aka 12CC4, HSPC215, MFH, QRF1, hFKH1B)",
                "forkhead box P2 (FOXP2 aka CAGH44, SPCH1, TNRC10)",
                "forkhead box R2 (FOXR2 aka FOXN6)",
                "gap junction protein beta 1 (GJB1 aka CMTX, CMTX1, CX32)",
                "gap junction protein beta 2 (GJB2 aka BAPS, CX26, DFNA3, DFNA3A, DFNB1, DFNB1A, HID, KID, NSRD1, PPK)",
                "gap junction protein beta 5 (GJB5 aka CX31.1)",
                "glutathione S-transferase theta 1 (GSTT1)",
                "glutathione S-transferase theta 2B (GSTT2B aka GSTT2P)",
                "glutathione S-transferase theta 4 (GSTT4 aka GSTTP1, HS322B1A)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit gamma 1 (HBG1 aka HBG-T2, HBGA, HBGR, HSGGL1, PRO2979)",
                "homeostatic iron regulator (HFE aka HFE1, HH, HLA-H, MVCD7, TFQTL2)",
                "inhibin subunit beta B (INHBB)",
                "iron responsive element binding protein 2 (IREB2 aka ACO3, IRE-BP 2, IRE-BP2, IRP2, IRP2AD, NDCAMA)",
                "lactase (LCT aka LAC, LPH, LPH1)",
                "leucine rich repeat containing 2 (LRRC2)",
                "leucine rich repeat containing 25 (LRRC25 aka MAPA)",
                "leucine rich repeat kinase 1 (LRRK1 aka OSMD, RIPK6, Roco1)",
                "leucine rich repeat kinase 2 (LRRK2 aka AURA17, DARDARIN, PARK8, RIPK7, ROCO2)",
                "low density lipoprotein receptor (LDLR aka FH, FHC, FHCL1, LDLCQ2)",
                "low density lipoprotein receptor class A domain containing 1 (LDLRAD1)",
                "low density lipoprotein receptor class A domain containing 2 (LDLRAD2)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "microtubule associated protein 1A (MAP1A aka MAP1L, MTAP1A)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "protein tyrosine phosphatase non-receptor type 4 (PTPN4 aka MEG, PTPMEG, PTPMEG1)",
                "regulatory associated protein of MTOR complex 1 (RPTOR aka KOG1, Mip1)",
                "superoxide dismutase 1 (SOD1 aka ALS, ALS1, HEL-S-44, IPOA, SOD, STAHP, hSod1, homodimer)",
                "superoxide dismutase 2 (SOD2 aka GC1, GClnc1, IPO-B, IPOB, MNSOD, MVCD6, Mn-SOD, lncRNA-GC1)",
                "superoxide dismutase 3 (SOD3 aka EC-SOD)",
                "synuclein alpha (SNCA aka NACP, PARK1, PARK4, PD1)",
                "synuclein gamma (SNCG aka BCSG1, SR)",
                "telomerase reverse transcriptase (TERT aka CMM9, DKCA2, DKCB4, EST2, PFBMFT1, TCS1, TP2, TRT, hEST2, hTRT)",
                "telomere repeat binding bouquet formation protein 1 (TERB1 aka CCDC79, SPGF60)",
                "telomere repeat binding bouquet formation protein 2 (TERB2 aka C15orf43, SPGF59)",
                "transferrin receptor 2 (TFR2 aka HFE3, TFRC2)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "vascular endothelial growth factor A (VEGFA aka L-VEGF, MVCD1, VEGF, VPF)",
                "vascular endothelial growth factor B (VEGFB aka VEGFL, VRF)",
                "vascular endothelial growth factor C (VEGFC aka Flt4-L, LMPH1D, LMPHM4, VRP)"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "KRAS (KRAS)",
            "EGFR (EGFR)",
            "PTEN (PTEN)",
            "PIK3CA (PIK3CA)",
            "BRAF (BRAF)",
            "ERBB2 (ERBB2)",
            "CDKN2A (CDKN2A)",
            "IDH1 (IDH1)",
            "NOTCH1 (NOTCH1)",
            "ARID1A (ARID1A)",
            "ATM (ATM)",
            "SMAD4 (SMAD4)",
            "FLT3 (FLT3)",
            "NPM1 (NPM1)",
            "NRAS (NRAS)",
            "GNAS (GNAS)",
            "KEAP1 (KEAP1)",
            "MET (MET)",
            "JAK2 (JAK2)",
            "FBXW7 (FBXW7)",
            "DNMT3A (DNMT3A)",
            "RB1 (RB1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "KRAS",
                "EGFR",
                "PTEN",
                "PIK3CA",
                "BRAF",
                "ERBB2",
                "IDH1",
                "NOTCH1",
                "ATM",
                "SMAD4",
                "FLT3",
                "NPM1",
                "NRAS",
                "GNAS",
                "KEAP1",
                "MET",
                "JAK2",
                "DNMT3A",
                "RB1"
            ],
            "mismatches": [
                "BRCA1",
                "CDKN2A",
                "ARID1A",
                "FBXW7"
            ],
            "true_referents": [
                "AT-rich interaction domain 3C (ARID3C)",
                "AT-rich interaction domain 4A (ARID4A aka RBBP-1, RBBP1, RBP-1, RBP1)",
                "AT-rich interaction domain 4B (ARID4B aka BCAA, BRCAA1, RBBP1L1, RBP1L1, SAP180)",
                "ATM interactor (ATMIN aka ASCIZ, ZNF822)",
                "ATM serine/threonine kinase (ATM aka AT1, ATA, ATC, ATD, ATDC, ATE, TEL1, TELO1)",
                "B-Raf proto-oncogene, serine/threonine kinase (BRAF aka B-RAF1, B-raf-1, BRAF1, NS7, RAFB1, BRAF)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CDKN2A interacting protein (CDKN2AIP)",
                "CDKN2A interacting protein N-terminal like (CDKN2AIPNL aka C2AIL)",
                "DNA methyltransferase 3 alpha (DNMT3A aka DNMT3A2, HESJAS, M.HsaIIIA, TBRS)",
                "DNA methyltransferase 3 beta (DNMT3B aka FSHD4, ICF, ICF1, M.HsaIIIB)",
                "DNA methyltransferase 3 like (DNMT3L)",
                "F-box and leucine rich repeat protein 7 (FBXL7 aka FBL6, FBL7)",
                "FBXW7 antisense RNA 1 (FBXW7-AS1 aka DEAR, DEspR)",
                "FLT3 interacting zinc finger 1 (FIZ1 aka ZNF798)",
                "G protein subunit alpha transducin 3 (GNAT3 aka GDCA, HG1E)",
                "GNAS complex locus (GNAS aka AHO, AIMAH1, C20orf451, GPSA, GSA, GSP, NESP, PITA3, POH, SCG6, SgVI, GNAS)",
                "Janus kinase 1 (JAK1 aka AIIDEA, JAK1B, JTK3, JAK1)",
                "Janus kinase 2 (JAK2 aka JTK10)",
                "Janus kinase 3 (JAK3 aka JAK-3_HUMAN, JAKL, L-JAK, LJAK, JAK3)",
                "KRAS proto-oncogene, GTPase (KRAS aka 'C-K-RAS, C-K-RAS, CFC2, K-RAS2A, K-RAS2B, K-RAS4A, K-RAS4B, K-Ras, K-Ras 2, KI-RAS1, KRAS2, NS, NS3, OES, RALD, RASK2, c-Ki-ras, c-Ki-ras2, KRAS)",
                "MET proto-oncogene, receptor tyrosine kinase (MET aka AUTS9, DA11, DFNB97, HGFR, RCCP2, c-Met)",
                "NODAL modulator 1 (NOMO1 aka Nomo, PM5)",
                "NRAS proto-oncogene, GTPase (NRAS aka ALPS4, CMNS, KRAS, N-ras, NCMS1, NS6, NRAS)",
                "PTEN induced kinase 1 (PINK1 aka BRPK, PARK6)",
                "RAS related (RRAS aka R-Ras1, RRAS)",
                "RAS related 2 (RRAS2 aka NS12, TC21)",
                "RB transcriptional corepressor 1 (RB1 aka OSRC, PPP1R130, RB, p105-Rb, p110-RB1, pRb, pp110)",
                "RB transcriptional corepressor like 1 (RBL1 aka CP107, PRB1, p107)",
                "RB1 inducible coiled-coil 1 (RB1CC1 aka ATG17, CC1, FIP200, PPP1R131)",
                "Raf-1 proto-oncogene, serine/threonine kinase (RAF1 aka CMD1NN, CRAF, NS5, Raf-1, c-Raf)",
                "SMAD family member 1 (SMAD1 aka BSP-1, BSP1, JV4-1, JV41, MADH1, MADR1)",
                "SMAD family member 4 (SMAD4 aka DPC4, JIP, MADH4, MYHRS)",
                "SMAD family member 6 (SMAD6 aka AOVD2, HsT17432, MADH6, MADH7)",
                "SSX family member 7 (SSX7)",
                "STEAP family member 1 (STEAP1 aka PRSS24, STEAP)",
                "STEAP family member 1B (STEAP1B)",
                "TP53 regulating kinase (TP53RK aka BUD32, C20orf64, GAMOS4, Nori-2, Nori-2p, PRPK, TPRKB, dJ101A2)",
                "TP53 target 3 (TP53TG3 aka P53TG3A, TP53TG3E, TP53TG3F, TP53TG3)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "delta like canonical Notch ligand 1 (DLL1 aka DELTA1, DL1, Delta, NEDBAS)",
                "delta like non-canonical Notch ligand 1 (DLK1 aka DLK, DLK-1, Delta1, FA1, PREF1, Pref-1, ZOG, pG2)",
                "epidermal growth factor (EGF aka HOMG4, URG)",
                "epidermal growth factor receptor (EGFR aka ERBB, ERBB1, ERRP, HER1, NISBD2, NNCIS, PIG61, mENA)",
                "erb-b2 receptor tyrosine kinase 2 (ERBB2 aka CD340, HER-2, HER-2/neu, HER2, MLN 19, MLN-19, NEU, NGL, TKR1, VSCN2, c-ERB-2, c-ERB2, p185(erbB2))",
                "erb-b2 receptor tyrosine kinase 4 (ERBB4 aka ALS19, HER4, p180erbB4)",
                "fms related receptor tyrosine kinase 3 (FLT3 aka CD135, FLK-2, FLK2, STK1)",
                "fms related receptor tyrosine kinase 3 ligand (FLT3LG aka FL, FLG3L, FLT3L, IMD125)",
                "glucosamine (N-acetyl)-6-sulfatase (GNS aka G6S)",
                "granzyme M (GZMM aka LMET1, MET1)",
                "isocitrate dehydrogenase (NAD(+)) 3 catalytic subunit alpha (IDH3A aka RP90)",
                "isocitrate dehydrogenase (NADP(+)) 1 (IDH1 aka HEL-216, HEL-S-26, IDCD, IDH, IDP, IDPC, PICD)",
                "isocitrate dehydrogenase (NADP(+)) 2 (IDH2 aka D2HGA2, ICD-M, IDH, IDH-2, IDHM, IDP, IDPM, mNADP-IDH)",
                "kelch like ECH associated protein 1 (KEAP1 aka INrf2, KLHL19)",
                "methenyltetrahydrofolate synthetase (MTHFS aka HsT19268, NEDMEHM)",
                "nestin (NES aka Nbla00170)",
                "notch receptor 1 (NOTCH1 aka AOS5, AOVD1, TAN1, hN1)",
                "nucleophosmin 1 (NPM1 aka B23, NPM)",
                "nucleophosmin/nucleoplasmin 2 (NPM2)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)",
                "phosphatase and tensin homolog (PTEN aka 10q23del, BZS, CWS1, DEC, GLM2, MHAM, MMAC11, PTENbeta, PTENgama, TEP1, PTEN)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit alpha (PIK3CA aka CCM4, CLAPO, CLOVE, CWS5, HMH, MCAP, MCM, MCMTC, PI3K, PI3K-alpha, p110-alpha)",
                "phosphatidylinositol-4,5-bisphosphate 3-kinase catalytic subunit beta (PIK3CB aka P110BETA, PI3K, PI3KBETA, PIK3C1)",
                "phosphatidylinositol-4-phosphate 3-kinase catalytic subunit type 2 beta (PIK3C2B aka C2-PI3K)",
                "protein tyrosine phosphatase receptor type E (PTPRE aka HPTPE, PTPE, R-PTP-EPSILON)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "HBB (Hemoglobin beta)",
            "TP53 (Tumor protein p53)",
            "BRCA1 (Breast Cancer 1)",
            "BRCA2 (Breast Cancer 2)",
            "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
            "HFE (Hemochromatosis)",
            "APOE (Apolipoprotein E)",
            "F5 (Coagulation factor V)",
            "F2 (Coagulation factor II)",
            "F9 (Coagulation factor IX)",
            "MTHFR (Methylenetetrahydrofolate reductase)",
            "ACE (Angiotensin-converting enzyme)",
            "APOA1 (Apolipoprotein A1)",
            "LDLR (Low-density lipoprotein receptor)",
            "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
            "ATM (Ataxia-telangiectasia mutated)",
            "BRCA1 (Breast Cancer 1)",
            "BRCA2 (Breast Cancer 2)",
            "TP53 (Tumor protein p53)",
            "HBB (Hemoglobin beta)",
            "HFE (Hemochromatosis)",
            "F5 (Coagulation factor V)",
            "F2 (Coagulation factor II)",
            "F9 (Coagulation factor IX)",
            "MTHFR (Methylenetetrahydrofolate reductase)",
            "ACE (Angiotensin-converting enzyme)",
            "APOA1 (Apolipoprotein A1)",
            "LDLR (Low-density lipoprotein receptor)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "HBB (Hemoglobin beta)",
                "TP53 (Tumor protein p53)",
                "BRCA1 (Breast Cancer 1)",
                "BRCA2 (Breast Cancer 2)",
                "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
                "HFE (Hemochromatosis)",
                "APOE (Apolipoprotein E)",
                "F5 (Coagulation factor V)",
                "F2 (Coagulation factor II)",
                "F9 (Coagulation factor IX)",
                "MTHFR (Methylenetetrahydrofolate reductase)",
                "ACE (Angiotensin-converting enzyme)",
                "APOA1 (Apolipoprotein A1)",
                "LDLR (Low-density lipoprotein receptor)",
                "ATM (Ataxia-telangiectasia mutated)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM serine/threonine kinase (ATM aka AT1, ATA, ATC, ATD, ATDC, ATE, TEL1, TELO1)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated ATM activator 1 (BRAT1 aka BAAT1, C7orf27, NEDCAS, RMFSL)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 DNA repair associated (BRCA2 aka BRCC2, BROVCA2, FACD, FAD, FAD1, FANCD, FANCD1, GLM3, PNCA2, XRCC11)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "angiotensin I converting enzyme (ACE aka ACE1, CD143, DCP, DCP1)",
                "angiotensin converting enzyme 2 (ACE2 aka ACEH)",
                "apolipoprotein A1 (APOA1 aka AMYLD3, HPALP2, apo(a))",
                "apolipoprotein A2 (APOA2 aka Apo-AII, ApoA-II, apoAII)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "ataxin 1 (ATXN1 aka ATX1, D6S504E, SCA1)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "coagulation factor II thrombin receptor (F2R aka CF2R, HTR, PAR-1, PAR1, TR)",
                "coagulation factor II thrombin receptor like 2 (F2RL2 aka PAR-3, PAR3)",
                "coagulation factor II, thrombin (F2 aka PT, RPRGL2, THPH1)",
                "coagulation factor IX (F9 aka F9 p22, FIX, HEMB, P19, PTC, THPH8)",
                "coagulation factor V (F5 aka FVL, PCCF, RPRGL1, THPH2)",
                "coagulation factor VII (F7 aka SPCA)",
                "coagulation factor X (F10 aka FX, FXA)",
                "coagulation factor XII (F12 aka HAE3, HAEX, HAF)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "dihydrofolate reductase (DHFR aka DHFR1P1, DYR, DHFR)",
                "dihydrofolate reductase 2 (DHFR2 aka DHFRL1, DHFRP4)",
                "endothelin converting enzyme 1 (ECE1 aka ECE)",
                "ferrochelatase (FECH aka EPP, EPP1, FCE)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "homeostatic iron regulator (HFE aka HFE1, HH, HLA-H, MVCD7, TFQTL2)",
                "iron responsive element binding protein 2 (IREB2 aka ACO3, IRE-BP 2, IRE-BP2, IRP2, IRP2AD, NDCAMA)",
                "low density lipoprotein receptor (LDLR aka FH, FHC, FHCL1, LDLCQ2)",
                "low density lipoprotein receptor class A domain containing 1 (LDLRAD1)",
                "methylenetetrahydrofolate reductase (MTHFR)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "very low density lipoprotein receptor (VLDLR aka CAMRQ1, CARMQ1, CHRMQ1, VLDL-RCH, VLDLR)"
            ],
            "TP": 15,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            "BRCA1 (Breast Cancer 1)",
            "TP53 (Tumor Protein P53)",
            "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
            "HTT (Huntingtin)",
            "APOE (Apolipoprotein E)",
            "DRD4 (Dopamine Receptor D4)",
            "COMT (Catechol-O-Methyltransferase)",
            "HTR2A (5-Hydroxytryptamine Receptor 2A)",
            "SLC6A4 (Solute Carrier Family 6 Member 4)",
            "HFE (Homeostatic Iron Regulator)",
            "FMR1 (Fragile X Mental Retardation 1)",
            "ATM (Ataxia-Telangiectasia Mutated)",
            "NOS1 (Nitric Oxide Synthase 1)",
            "NOS2 (Nitric Oxide Synthase 2)",
            "NOS3 (Nitric Oxide Synthase 3)",
            "FGFR3 (Fibroblast Growth Factor Receptor 3)",
            "SHH (Sonic Hedgehog)",
            "PSEN1 (Presenilin 1)",
            "PSEN2 (Presenilin 2)",
            "APP (Amyloid Beta Precursor Protein)",
            "TTR ( Transthyretin)",
            "APOA1 (Apolipoprotein A1)",
            "LDLR (Low-Density Lipoprotein Receptor)",
            "HBB (Hemoglobin Subunit Beta)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1 (Breast Cancer 1)",
                "TP53 (Tumor Protein P53)",
                "CFTR (Cystic Fibrosis Transmembrane Conductance Regulator)",
                "HTT (Huntingtin)",
                "APOE (Apolipoprotein E)",
                "DRD4 (Dopamine Receptor D4)",
                "COMT (Catechol-O-Methyltransferase)",
                "HTR2A (5-Hydroxytryptamine Receptor 2A)",
                "SLC6A4 (Solute Carrier Family 6 Member 4)",
                "HFE (Homeostatic Iron Regulator)",
                "ATM (Ataxia-Telangiectasia Mutated)",
                "NOS1 (Nitric Oxide Synthase 1)",
                "NOS2 (Nitric Oxide Synthase 2)",
                "NOS3 (Nitric Oxide Synthase 3)",
                "FGFR3 (Fibroblast Growth Factor Receptor 3)",
                "PSEN1 (Presenilin 1)",
                "PSEN2 (Presenilin 2)",
                "APP (Amyloid Beta Precursor Protein)",
                "TTR ( Transthyretin)",
                "APOA1 (Apolipoprotein A1)",
                "LDLR (Low-Density Lipoprotein Receptor)",
                "HBB (Hemoglobin Subunit Beta)"
            ],
            "mismatches": [
                "FMR1 (Fragile X Mental Retardation 1)",
                "SHH (Sonic Hedgehog)"
            ],
            "true_referents": [
                "5-hydroxytryptamine receptor 2A (HTR2A aka 5-HT2A, HTR2)",
                "5-hydroxytryptamine receptor 2B (HTR2B aka 5-HT(2B), 5-HT-2B, 5-HT2B)",
                "5-hydroxytryptamine receptor 5A (HTR5A aka 5-HT5A)",
                "ATM serine/threonine kinase (ATM aka AT1, ATA, ATC, ATD, ATDC, ATE, TEL1, TELO1)",
                "BRCA1 DNA repair associated (BRCA1 aka BRCAI, BRCC1, BROVCA1, FANCS, IRIS, PNCA4, PPP1R53, PSCP, RNF53)",
                "BRCA1 associated ATM activator 1 (BRAT1 aka BAAT1, C7orf27, NEDCAS, RMFSL)",
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRCA2 and CDKN1A interacting protein (BCCIP aka TOK-1, TOK1)",
                "CF transmembrane conductance regulator (CFTR aka ABC35, ABCC7, CF/MRP, MRP7, TNR-CFTR, dJ760C5.1, CFTR)",
                "FMR1 autosomal homolog 1 (FXR1 aka CMYO9A, CMYO9B, CMYP9A, CMYP9BP, MYOPMIL, MYORIBF, FXR1)",
                "FMR1 autosomal homolog 2 (FXR2 aka FMR1L2P, FXR2)",
                "Indian hedgehog signaling molecule (IHH aka BDA1, HHG2)",
                "SUFU negative regulator of hedgehog signaling (SUFU aka BCNS2, JBTS32, PRO1280H, SUFUXL, SUFU)",
                "amyloid beta precursor like protein 2 (APLP2 aka APLP-2, APPH, APPL2, CDEBP)",
                "amyloid beta precursor protein (APP aka AAA, ABETA, ABPP, AD1I, CTFgamma, CVAP, PN-II, PN2, alpha-sAPP, preA4, APP)",
                "amyloid beta precursor protein binding protein 2 (APPBP2 aka APP-BP2, HS.84084, PAT1)",
                "apolipoprotein A1 (APOA1 aka AMYLD3, HPALP2, apo(a))",
                "apolipoprotein A2 (APOA2 aka Apo-AII, ApoA-II, apoAII)",
                "apolipoprotein A4 (APOA4)",
                "apolipoprotein E (APOE aka AD2, APO-E, ApoE4, LDLCQ5, LPG)",
                "apolipoprotein O (APOO aka FAM121B, MIC26, MICOS26, Mic23, My025)",
                "ataxin 1 (ATXN1 aka ATX1, D6S504E, SCA1)",
                "catechol-O-methyltransferase (COMT aka HEL-S-98n)",
                "catechol-O-methyltransferase domain containing 1 (COMTD1)",
                "chloride intracellular channel 6 (CLIC6 aka CLIC1L)",
                "collectrin, amino acid transport regulator (CLTRN aka NX-17, NX17, TMEM27)",
                "dopamine receptor D1 (DRD1 aka D1R, DADRA, DRD1)",
                "dopamine receptor D2 (DRD2 aka D2DR, D2R)",
                "dopamine receptor D4 (DRD4 aka D4DR)",
                "fibroblast growth factor receptor 1 (FGFR1 aka BFGFR, CD331, CEK, ECCL, FGFBR, FGFR-1, FLG, FLT-2, FLT2, HBGFR, HH2, HRTFDS, KAL2, N-SAM, OGD, bFGF-R-1)",
                "fibroblast growth factor receptor 3 (FGFR3 aka ACH, CD333, CEK2, HSFGFR3EX, JTK4)",
                "fibroblast growth factor receptor like 1 (FGFRL1 aka FGFR-5, FGFR5, FHFR)",
                "fragile X messenger ribonucleoprotein 1 (FMR1 aka FMRP, FRAXA, POF, POF1)",
                "hemoglobin subunit beta (HBB aka CD113t-C, ECYT6, beta-globin)",
                "hemoglobin subunit delta (HBD aka HBK)",
                "hemoglobin subunit mu (HBM aka HBAP2, HBK)",
                "homeostatic iron regulator (HFE aka HFE1, HH, HLA-H, MVCD7, TFQTL2)",
                "huntingtin (HTT aka HD, IT15, LOMARS)",
                "huntingtin associated protein 1 (HAP1 aka HAP2, HIP5, HLP, hHLP1)",
                "huntingtin interacting protein K (HYPK aka C15orf63, HSPC136)",
                "iron responsive element binding protein 2 (IREB2 aka ACO3, IRE-BP 2, IRE-BP2, IRP2, IRP2AD, NDCAMA)",
                "low density lipoprotein receptor (LDLR aka FH, FHC, FHCL1, LDLCQ2)",
                "low density lipoprotein receptor class A domain containing 1 (LDLRAD1)",
                "nitric oxide synthase 1 (NOS1 aka IHPS1, N-NOS, NC-NOS, NOS, bNOS, nNOS)",
                "nitric oxide synthase 2 (NOS2 aka HEP-NOS, INOS, NOSA, NOS2)",
                "nitric oxide synthase 3 (NOS3 aka ECNOS, eNOS)",
                "presenilin 1 (PSEN1 aka ACNINV3, AD3, CMD1U, FAD, PS-1, PS1, PSNL1, S182)",
                "presenilin 2 (PSEN2 aka AD3L, AD4, CMD1V, PS2, STM2)",
                "presenilin enhancer, gamma-secretase subunit (PSENEN aka ACNINV2, MDS033, MSTP064, PEN-2, PEN2)",
                "solute carrier family 1 member 6 (SLC1A6 aka EAAT4)",
                "solute carrier family 26 member 6 (SLC26A6)",
                "solute carrier family 6 member 4 (SLC6A4 aka 5-HTT, 5-HTTLPR, 5HTT, HTT, OCD1, SERT, SERT1, hSERT)",
                "sonic hedgehog signaling molecule (SHH aka HHG1, HLP3, HPE3, MCOPCB5, SMMCI, ShhNC, TPT, TPTPS)",
                "tetratricopeptide repeat domain 1 (TTC1 aka TPR1)",
                "thyrotropin releasing hormone receptor (TRHR aka CHNG7, TRH-R)",
                "transferrin receptor 2 (TFR2 aka HFE3, TFRC2)",
                "transmembrane O-methyltransferase (TOMT aka COMT2)",
                "transthyretin (TTR aka ATTR, CTS, CTS1, HEL111, HsT2651, PALB, TBPA, TTN)",
                "tumor protein p53 (TP53 aka BCC7, BMFS5, LFS1, P53, TRP53)",
                "tumor protein p53 binding protein 1 (TP53BP1 aka 53BP1, TDRD30, p202, p53BP1)",
                "tumor protein p53 regulated apoptosis inducing protein 1 (TP53AIP1 aka P53AIP1)",
                "very low density lipoprotein receptor (VLDLR aka CAMRQ1, CARMQ1, CHRMQ1, VLDL-RCH, VLDLR)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "human protein coding gene",
        "domain": "biology",
        "response": [
            {
                "Referent": "BRCA1",
                "Canonical name": "Breast cancer 1, early onset"
            },
            {
                "Referent": "BRCA2",
                "Canonical name": "Breast cancer 2, early onset"
            },
            {
                "Referent": "CDH1",
                "Canonical name": "Cadherin-1, type 1, E-cadherin (epithelial)"
            },
            {
                "Referent": "CDKN2A",
                "Canonical name": "Cyclin-dependent kinase inhibitor 2A (p16, inhibits CDK4)"
            },
            {
                "Referent": "CDKN2B",
                "Canonical name": "Cyclin-dependent kinase inhibitor 2B (p15, inhibits CDK4)"
            },
            {
                "Referent": "CCND1",
                "Canonical name": "Cyclin D1"
            },
            {
                "Referent": "CCND2",
                "Canonical name": "Cyclin D2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            },
            {
                "Referent": "CCNE1",
                "Canonical name": "Cyclin E1"
            },
            {
                "Referent": "CCNE2",
                "Canonical name": "Cyclin E2"
            },
            {
                "Referent": "CCND3",
                "Canonical name": "Cyclin D3"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "CDH1",
                "CDKN2A",
                "CDKN2B",
                "CCND1",
                "CCND2",
                "CCND3",
                "CCNE1",
                "CCNE2"
            ],
            "mismatches": [
                "BRCA1",
                "BRCA2"
            ],
            "true_referents": [
                "BRCA1 associated protein (BRAP aka BRAP2, IMP, RNF52)",
                "BRISC and BRCA1 A complex member 2 (BABAM2 aka BRCC4, BRCC45, BRE)",
                "cadherin 1 (CDH1 aka Arc-1, BCDS1, CD324, CDHE, ECAD, LCAM, UVO)",
                "cadherin 2 (CDH2 aka ACOGS, ADHD8, ARVD14, CD325, CDHN, CDw325, NCAD)",
                "cadherin related family member 5 (CDHR5 aka MLPCDH, MU-PCDH, MUCDHL, MUPCDH)",
                "cyclin C (CCNC aka CycC, SRB11, hSRB11)",
                "cyclin D1 (CCND1 aka BCL1, D11S287E, PRAD1, U21B31)",
                "cyclin D2 (CCND2 aka KIAK0002, MPPH3)",
                "cyclin D3 (CCND3)",
                "cyclin E1 (CCNE1 aka CCNE, pCCNE1)",
                "cyclin E2 (CCNE2 aka CYCE2)",
                "cyclin dependent kinase 1 (CDK1 aka CDC2, CDC28A, P34CDC2)",
                "cyclin dependent kinase 2 (CDK2 aka CDKN2, p33(CDK2))",
                "cyclin dependent kinase inhibitor 2A (CDKN2A aka ARF, CAI2, CDK4I, CDKN2, CMM2, INK4, INK4A, MLM, MTS-1, MTS1, P14, P14ARF, P16, P16-INK4A, P16INK4, P16INK4A, P19, P19ARF, TP16)",
                "cyclin dependent kinase inhibitor 2B (CDKN2B aka CDK4I, INK4B, MTS2, P15, TP15, p15INK4b)",
                "partner and localizer of BRCA2 (PALB2 aka BROVCA5, FANCN, PNCA3)"
            ],
            "TP": 8,
            "FP": 2,
            "FN": 0
        }
    }
]