[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "p53 (TP53)",
            "MYC",
            "RAS",
            "BRCA1",
            "BRCA2",
            "NF1",
            "NF2",
            "VHL",
            "PTEN",
            "APC",
            "RB1",
            "CDKN2A",
            "SMAD4",
            "TP53BP1",
            "ATM",
            "MLL",
            "SOX2",
            "MYB",
            "ETS1",
            "HIF1A",
            "ARID1A",
            "CREBBP",
            "EP300",
            "AR"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "MYC",
                "BRCA1",
                "VHL",
                "RB1",
                "SMAD4",
                "TP53BP1",
                "SOX2",
                "MYB",
                "ETS1",
                "HIF1A",
                "CREBBP",
                "EP300",
                "AR"
            ],
            "mismatches": [
                "RAS",
                "BRCA2",
                "NF1",
                "NF2",
                "PTEN",
                "APC",
                "CDKN2A",
                "ATM",
                "MLL",
                "ARID1A"
            ],
            "true_referents": [
                "AT-rich interactive domain-containing protein 1B (ARID1B aka BAF250B, DAN15, KIAA1235, OSA2)",
                "AT-rich interactive domain-containing protein 3A (ARID3A aka DRIL1, DRIL3, DRX, E2FBP1)",
                "AT-rich interactive domain-containing protein 3C (ARID3C)",
                "ATM interactor (ATMIN aka KIAA0431, ZNF822)",
                "Androgen receptor (AR aka DHTR, NR3C4)",
                "Arginine-fifty homeobox (ARGFX)",
                "Beta-arrestin-1 (ARRB1 aka ARR1)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CREB-binding protein (CREBBP aka CBP)",
                "Calmodulin-binding transcription activator 2 (CAMTA2 aka KIAA0909)",
                "Catenin beta-1 (CTNNB1 aka CTNNB, OK/SW-cl.35, PRO2286)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 5 (CREB5 aka CREBPA)",
                "EP300-interacting inhibitor of differentiation 1 (EID1 aka C15orf3, CRI1, RBP21, PNAS-22, PTD014)",
                "EP300-interacting inhibitor of differentiation 2B (EID2B aka EID3)",
                "ETS homologous factor (EHF aka ESE3, ESE3B, ESEJ)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Estrogen receptor beta (ESR2 aka ESTRB, NR3A2)",
                "Forkhead box protein E1 (FOXE1 aka FKHL15, FOXE2, TITF2, TTF2)",
                "General transcription factor II-I repeat domain-containing protein 2A (GTF2IRD2 aka GTF2IRD2A)",
                "Helix-loop-helix protein 1 (NHLH1 aka BHLHA35, HEN1)",
                "Helix-loop-helix protein 2 (NHLH2 aka BHLHA34, HEN2, KIAA0490)",
                "Histone acetyltransferase p300 (EP300 aka P300)",
                "Histone-lysine N-methyltransferase 2D (KMT2D aka ALR, MLL2, MLL4)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "MLX-interacting protein (MLXIP aka BHLHE36, KIAA0867, MIR, MONDOA)",
                "Max-like protein X (MLX aka BHLHD13, TCFL4)",
                "Mothers against decapentaplegic homolog 4 (SMAD4 aka DPC4, MADH4)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myb-related protein A (MYBL1 aka AMYB)",
                "Myb-related protein B (MYBL2 aka BMYB)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor 1 A-type (NFIA aka KIAA1439)",
                "Nuclear factor 1 B-type (NFIB)",
                "Nuclear factor 1 C-type (NFIC aka NFI)",
                "Nuclear factor erythroid 2-related factor 2 (NFE2L2 aka NRF2)",
                "Nucleus accumbens-associated protein 1 (NACC1 aka BTBD14B, NAC1)",
                "Nucleus accumbens-associated protein 2 (NACC2 aka BTBD14A, NAC2, RBB)",
                "POU class 2 homeobox associating factor 3 (POU2AF3 aka C11orf93, CASC13, COLCA2)",
                "Protein C-ets-1 (ETS1 aka EWSR2)",
                "Protein C-ets-2 (ETS2)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "RB-associated KRAB zinc finger protein (RBAK aka ZNF769)",
                "Ras-related protein Rap-2c (RAP2C)",
                "Ras-responsive element-binding protein 1 (RREB1 aka FINB)",
                "Retinoblastoma-associated protein (RB1)",
                "Retinoic acid receptor alpha (RARA aka NR1B1)",
                "TP53-binding protein 1 (TP53BP1)",
                "Testis-specific chromodomain protein Y 2 (CDY2A aka CDY2B, CDY2)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor NF-E2 45 kDa subunit (NFE2)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcriptional activator Myb (MYB)",
                "Transforming acidic coiled-coil-containing protein 1 (TACC1 aka KIAA1103)",
                "Tyrosine-protein phosphatase non-receptor type 14 (PTPN14 aka PEZ, PTPD2)",
                "Zinc finger and BTB domain-containing protein 7C (ZBTB7C aka APM1, ZBTB36, ZNF857C)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)",
                "von Hippel-Lindau disease tumor suppressor (VHL)"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "TATA-binding protein (TBP)",
            "Steroidogenic factor 1 (SF-1)",
            "SOX2 transcription factor (SOX2)",
            "P53 tumor suppressor protein (TP53)",
            "Nuclear receptor co-repressor 1 (NCoR1)",
            "FOXA1 forkhead box A1 (FOXA1)",
            "MYC proto-oncogene protein (MYC)",
            "GATA binding protein 1 (GATA1)",
            "FOXA2 forkhead box A2 (FOXA2)",
            "Runt-related transcription factor 2 (RUNX2)",
            "PAX6 paired box 6 (PAX6)",
            "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-\u03baB)",
            "T-bet transcription factor (TBX21)",
            "E2F1 transcription factor (E2F1)",
            "E2F2 transcription factor (E2F2)",
            "E2F3 transcription factor (E2F3)",
            "Lef1 transcription factor (LEF1)",
            "HNF4A hepatocyte nuclear factor 4 alpha (HNF4A)",
            "REST repressor element 1-silencing transcription factor (REST)",
            "HIF1A hypoxia-inducible factor 1-alpha (HIF1A)",
            "C/EBP alpha (CEBPA)",
            "C/EBP beta (CEBPB)",
            "SP1 transcription factor (SP1)",
            "YY1 transcription factor (YY1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MYC proto-oncogene protein (MYC)",
                "Runt-related transcription factor 2 (RUNX2)",
                "PAX6 paired box 6 (PAX6)",
                "E2F1 transcription factor (E2F1)",
                "E2F2 transcription factor (E2F2)",
                "E2F3 transcription factor (E2F3)",
                "Lef1 transcription factor (LEF1)",
                "HNF4A hepatocyte nuclear factor 4 alpha (HNF4A)",
                "REST repressor element 1-silencing transcription factor (REST)",
                "HIF1A hypoxia-inducible factor 1-alpha (HIF1A)",
                "C/EBP alpha (CEBPA)",
                "C/EBP beta (CEBPB)",
                "SP1 transcription factor (SP1)",
                "YY1 transcription factor (YY1)"
            ],
            "mismatches": [
                "TATA-binding protein (TBP)",
                "Steroidogenic factor 1 (SF-1)",
                "SOX2 transcription factor (SOX2)",
                "P53 tumor suppressor protein (TP53)",
                "Nuclear receptor co-repressor 1 (NCoR1)",
                "FOXA1 forkhead box A1 (FOXA1)",
                "GATA binding protein 1 (GATA1)",
                "FOXA2 forkhead box A2 (FOXA2)",
                "Nuclear factor kappa-light-chain-enhancer of activated B cells (NF-\u03baB)",
                "T-bet transcription factor (TBX21)"
            ],
            "true_referents": [
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CCAAT/enhancer-binding protein alpha (CEBPA aka CEBP)",
                "CCAAT/enhancer-binding protein beta (CEBPB aka TCF5, PP9092)",
                "CCAAT/enhancer-binding protein delta (CEBPD)",
                "CCAAT/enhancer-binding protein epsilon (CEBPE)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Forkhead box protein B1 (FOXB1 aka FKH5)",
                "Forkhead box protein B2 (FOXB2)",
                "Forkhead box protein F2 (FOXF2 aka FKHL6, FREAC2)",
                "Forkhead box protein I2 (FOXI2)",
                "Forkhead box protein L1 (FOXL1 aka FKHL11, FREAC7)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Hepatocyte nuclear factor 1-alpha (HNF1A aka TCF1)",
                "Hepatocyte nuclear factor 3-alpha (FOXA1 aka HNF3A, TCF3A)",
                "Hepatocyte nuclear factor 4-alpha (HNF4A aka HNF4, NR2A1, TCF14)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Lymphoid enhancer-binding factor 1 (LEF1)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear receptor coactivator 1 (NCOA1 aka BHLHE74, SRC1)",
                "Nuclear receptor corepressor 1 (NCOR1 aka KIAA1047)",
                "Nuclear receptor corepressor 2 (NCOR2 aka CTG26)",
                "Paired box protein Pax-2 (PAX2)",
                "Paired box protein Pax-5 (PAX5)",
                "Paired box protein Pax-6 (PAX6 aka AN2)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "RE1-silencing transcription factor (REST aka NRSF, XBR)",
                "REST corepressor 1 (RCOR1 aka KIAA0071, RCOR)",
                "Runt-related transcription factor 1 (RUNX1 aka AML1, CBFA2)",
                "Runt-related transcription factor 2 (RUNX2 aka AML3, CBFA1, OSF2, PEBP2A)",
                "Runt-related transcription factor 3 (RUNX3 aka AML2, CBFA3, PEBP2A3)",
                "Splicing factor 1 (SF1 aka ZFM1, ZNF162)",
                "Steroidogenic factor 1 (NR5A1 aka AD4BP, FTZF1, SF1)",
                "Sterol regulatory element-binding protein 1 (SREBF1 aka BHLHD1, SREBP1)",
                "T-box transcription factor TBX1 (TBX1)",
                "T-box transcription factor TBX2 (TBX2)",
                "T-box transcription factor TBX21 (TBX21 aka TBET, TBLYM)",
                "TATA element modulatory factor (TMF1 aka ARA160)",
                "TATA-binding protein-associated factor 172 (BTAF1 aka TAF172)",
                "TATA-binding protein-associated factor 2N (TAF15 aka RBP56, TAF2N)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F3 (E2F3 aka KIAA0075)",
                "Transcription factor E2F4 (E2F4)",
                "Transcription factor E2F5 (E2F5)",
                "Transcription factor E2F6 (E2F6)",
                "Transcription factor GATA-4 (GATA4)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor LBX1 (LBX1 aka LBX1H)",
                "Transcription factor Maf (MAF)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor Sp1 (SP1 aka TSFP1)",
                "Transcription factor Sp3 (SP3)",
                "Transcription factor Sp5 (SP5)",
                "Transcription factor YY2 (YY2 aka ZNF631)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional repressor CTCF (CTCF)",
                "Transcriptional repressor protein YY1 (YY1 aka INO80S)",
                "YY1-associated factor 2 (YAF2)"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "p53 (TP53)",
            "Myc (MYC)",
            "NF-\u03baB (NFKB1)",
            "AP-1 (JUN)",
            "E2F1",
            "CREB (CREB1)",
            "STAT3",
            "FOXO1",
            "SP1",
            "HIF-1\u03b1 (HIF1A)",
            "Smad3",
            "NRF2 (NFE2L2)",
            "GATA1",
            "KLF4",
            "SOX2",
            "Pax6",
            "CREM",
            "ATF4",
            "RELA",
            "Egr1",
            "YAP1",
            "TGF-\u03b2",
            "USF1",
            "BRCA1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "p53 (TP53)",
                "Myc (MYC)",
                "CREB (CREB1)",
                "STAT3",
                "FOXO1",
                "SP1",
                "HIF-1\u03b1 (HIF1A)",
                "NRF2 (NFE2L2)",
                "KLF4",
                "SOX2",
                "Pax6",
                "CREM",
                "RELA",
                "Egr1",
                "YAP1",
                "USF1",
                "BRCA1"
            ],
            "mismatches": [
                "NF-\u03baB (NFKB1)",
                "AP-1 (JUN)",
                "E2F1",
                "Smad3",
                "GATA1",
                "ATF4",
                "TGF-\u03b2"
            ],
            "true_referents": [
                "Basic helix-loop-helix domain-containing protein USF3 (USF3 aka KIAA2018)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-dependent transcription factor ATF-1 (ATF1)",
                "Cyclic AMP-dependent transcription factor ATF-5 (ATF5 aka ATFX)",
                "Cyclic AMP-dependent transcription factor ATF-7 (ATF7 aka ATFA)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "Early growth response protein 1 (EGR1 aka KROX24, ZNF225)",
                "Early growth response protein 3 (EGR3 aka PILOT)",
                "Early growth response protein 4 (EGR4)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Forkhead box protein O4 (FOXO4 aka AFX, AFX1, MLLT7)",
                "Forkhead box protein O6 (FOXO6)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 3 (KLF3 aka BKLF)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Mothers against decapentaplegic homolog 3 (SMAD3 aka MADH3)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor erythroid 2-related factor 2 (NFE2L2 aka NRF2)",
                "Nuclear factor erythroid 2-related factor 3 (NFE2L3 aka NRF3)",
                "Nuclear respiratory factor 1 (NRF1)",
                "Paired box protein Pax-2 (PAX2)",
                "Paired box protein Pax-5 (PAX5)",
                "Paired box protein Pax-6 (PAX6 aka AN2)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Proto-oncogene c-Rel (REL)",
                "RelA-associated inhibitor (PPP1R13L aka IASPP, NKIP1, PPP1R13BL, RAI)",
                "Retinoic acid receptor alpha (RARA aka NR1B1)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F7 (E2F7)",
                "Transcription factor E2F8 (E2F8)",
                "Transcription factor GATA-4 (GATA4)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor RelB (RELB)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor Sp1 (SP1 aka TSFP1)",
                "Transcription factor Sp3 (SP3)",
                "Transcription factor Sp5 (SP5)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional coactivator YAP1 (YAP1 aka YAP65)",
                "Transcriptional repressor protein YY1 (YY1 aka INO80S)",
                "Transforming growth factor beta-1-induced transcript 1 protein (TGFB1I1 aka ARA55)",
                "Upstream stimulatory factor 1 (USF1 aka BHLHB11, USF)",
                "Upstream stimulatory factor 2 (USF2 aka BHLHB12)",
                "YY1-associated factor 2 (YAF2)",
                "cAMP-responsive element modulator (CREM)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "TP53 (p53)",
            "MYC (c-Myc)",
            "NFKB1 (NF-\u03baB1)",
            "STAT3 (STAT3)",
            "ESR1 (ER\u03b1)",
            "AR (Androgen Receptor)",
            "CREB1 (CREB)",
            "JUN (c-Jun)",
            "FOS (c-Fos)",
            "E2F1 (E2F1)",
            "HIF1A (HIF-1\u03b1)",
            "SMAD3 (SMAD3)",
            "RUNX1 (RUNX1)",
            "POU5F1 (Oct4)",
            "NANOG (Nanog)",
            "SOX2 (Sox2)",
            "GLI1 (Gli1)",
            "REST (NRSF)",
            "NR4A1 (NR4A1)",
            "ATF3 (ATF3)",
            "YY1 (YY1)",
            "SP1 (SP1)",
            "IRF3 (IRF3)",
            "ZNF263 (ZNF263)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53 (p53)",
                "MYC (c-Myc)",
                "NFKB1 (NF-\u03baB1)",
                "STAT3 (STAT3)",
                "ESR1 (ER\u03b1)",
                "AR (Androgen Receptor)",
                "CREB1 (CREB)",
                "JUN (c-Jun)",
                "FOS (c-Fos)",
                "HIF1A (HIF-1\u03b1)",
                "SMAD3 (SMAD3)",
                "POU5F1 (Oct4)",
                "NANOG (Nanog)",
                "SOX2 (Sox2)",
                "GLI1 (Gli1)",
                "REST (NRSF)",
                "NR4A1 (NR4A1)",
                "ATF3 (ATF3)",
                "YY1 (YY1)",
                "SP1 (SP1)",
                "IRF3 (IRF3)"
            ],
            "mismatches": [
                "E2F1 (E2F1)",
                "RUNX1 (RUNX1)",
                "ZNF263 (ZNF263)"
            ],
            "true_referents": [
                "Androgen receptor (AR aka DHTR, NR3C4)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-dependent transcription factor ATF-1 (ATF1)",
                "Cyclic AMP-dependent transcription factor ATF-3 (ATF3)",
                "Cyclic AMP-dependent transcription factor ATF-5 (ATF5 aka ATFX)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "E3 ubiquitin-protein ligase DTX1 (DTX1)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Fos-related antigen 1 (FOSL1 aka FRA1)",
                "Homeobox protein CDX-1 (CDX1)",
                "Homeobox protein NANOG (NANOG)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Interferon regulatory factor 1 (IRF1)",
                "Interferon regulatory factor 3 (IRF3)",
                "Interferon regulatory factor 5 (IRF5)",
                "Mothers against decapentaplegic homolog 3 (SMAD3 aka MADH3)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "NANOG neighbor homeobox (NANOGNB)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear receptor subfamily 4 group A member 2 (NR4A2 aka NOT, NURR1, TINUR)",
                "Nuclear receptor subfamily 4 group A member 3 (NR4A3 aka CHN, CSMF, MINOR, NOR1, TEC)",
                "Nuclear receptor subfamily 4immunitygroup A member 1 (NR4A1 aka GFRP1, HMR, NAK1)",
                "POU domain, class 2, transcription factor 1 (POU2F1 aka OCT1, OTF1)",
                "POU domain, class 5, transcription factor 1 (POU5F1 aka OCT3, OCT4, OTF3)",
                "Protein FosB (FOSB aka G0S3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Protein c-Fos (FOS aka G0S7)",
                "Putative POU domain, class 5, transcription factor 1B (POU5F1B aka OCT4PG1, OTF3C, OTF3P1, POU5F1P1, POU5FLC20, POU5FLC8)",
                "Putative homeobox protein NANOG2 (NANOGP1 aka NANOG2)",
                "RE1-silencing transcription factor (REST aka NRSF, XBR)",
                "REST corepressor 1 (RCOR1 aka KIAA0071, RCOR)",
                "REST corepressor 2 (RCOR2)",
                "RING1 and YY1-binding protein (RYBP aka DEDAF, YEAF1)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Steroid hormone receptor ERR1 (ESRRA aka ERR1, ESRL1, NR3B1)",
                "Steroid hormone receptor ERR2 (ESRRB aka ERRB2, ESRL2, NR3B2)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F7 (E2F7)",
                "Transcription factor E2F8 (E2F8)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor JunD (JUND)",
                "Transcription factor LBX1 (LBX1 aka LBX1H)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor Sp1 (SP1 aka TSFP1)",
                "Transcription factor Sp3 (SP3)",
                "Transcription factor Sp5 (SP5)",
                "Transcription factor YY2 (YY2 aka ZNF631)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional activator GLI3 (GLI3)",
                "Transcriptional repressor protein YY1 (YY1 aka INO80S)",
                "Zinc finger protein 260 (ZNF260 aka ZFP260)",
                "Zinc finger protein 283 (ZNF283)",
                "Zinc finger protein 563 (ZNF563)",
                "Zinc finger protein GLI1 (GLI1 aka GLI)",
                "Zinc finger protein GLI2 (GLI2 aka THP)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "Tumor Protein p53 (TP53)",
            "Myc Proto-Oncogene Protein (MYC)",
            "Forkhead Box P3 (FOXP3)",
            "Hypoxia-Inducible Factor 1-alpha (HIF1A)",
            "Nuclear Factor Kappa B Subunit 1 (NFKB1)",
            "Sex Determining Region Y (SRY)",
            "Estrogen Receptor 1 (ESR1)",
            "Androgen Receptor (AR)",
            "Glucocorticoid Receptor (NR3C1)",
            "Peroxisome Proliferator-Activated Receptor Gamma (PPARG)",
            "GATA Binding Protein 3 (GATA3)",
            "CCAAT/Enhancer Binding Protein Alpha (CEBPA)",
            "Signal Transducer and Activator of Transcription 3 (STAT3)",
            "Retinoic Acid Receptor Alpha (RARA)",
            "Nuclear Receptor Subfamily 1 Group I Member 2 (NR1I2)",
            "T-Box Transcription Factor TBX5 (TBX5)",
            "Paired Box 6 (PAX6)",
            "Zinc Finger Protein GLI1 (GLI1)",
            "E2F Transcription Factor 1 (E2F1)",
            "TATA-Box Binding Protein (TBP)",
            "Transcription Factor AP-2 Alpha (TFAP2A)",
            "Sox Transcription Factor 2 (SOX2)",
            "Kruppel-Like Factor 4 (KLF4)",
            "Nuclear Factor of Activated T-Cells 1 (NFATC1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tumor Protein p53 (TP53)",
                "Myc Proto-Oncogene Protein (MYC)",
                "Forkhead Box P3 (FOXP3)",
                "Hypoxia-Inducible Factor 1-alpha (HIF1A)",
                "Nuclear Factor Kappa B Subunit 1 (NFKB1)",
                "Sex Determining Region Y (SRY)",
                "Estrogen Receptor 1 (ESR1)",
                "Androgen Receptor (AR)",
                "Glucocorticoid Receptor (NR3C1)",
                "Peroxisome Proliferator-Activated Receptor Gamma (PPARG)",
                "GATA Binding Protein 3 (GATA3)",
                "CCAAT/Enhancer Binding Protein Alpha (CEBPA)",
                "Retinoic Acid Receptor Alpha (RARA)",
                "Nuclear Receptor Subfamily 1 Group I Member 2 (NR1I2)",
                "T-Box Transcription Factor TBX5 (TBX5)",
                "Paired Box 6 (PAX6)",
                "Zinc Finger Protein GLI1 (GLI1)",
                "E2F Transcription Factor 1 (E2F1)",
                "Transcription Factor AP-2 Alpha (TFAP2A)",
                "Sox Transcription Factor 2 (SOX2)",
                "Kruppel-Like Factor 4 (KLF4)",
                "Nuclear Factor of Activated T-Cells 1 (NFATC1)"
            ],
            "mismatches": [
                "Signal Transducer and Activator of Transcription 3 (STAT3)",
                "TATA-Box Binding Protein (TBP)"
            ],
            "true_referents": [
                "Androgen receptor (AR aka DHTR, NR3C4)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CCAAT/enhancer-binding protein alpha (CEBPA aka CEBP)",
                "CCAAT/enhancer-binding protein epsilon (CEBPE)",
                "CCAAT/enhancer-binding protein gamma (CEBPG)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Estrogen receptor beta (ESR2 aka ESTRB, NR3A2)",
                "Forkhead box protein I3 (FOXI3)",
                "Forkhead box protein L3 (FOXL3)",
                "Forkhead box protein P3 (FOXP3 aka IPEX, JM2)",
                "Glucocorticoid receptor (NR3C1 aka GRL)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Kruppel-like factor 18 (KLF18)",
                "Mineralocorticoid receptor (NR3C2 aka MCR, MLR)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1 aka NFAT2, NFATC)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2 aka NFAT1, NFATP)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4 aka NFAT3)",
                "Nuclear receptor subfamily 1 group D member 2 (NR1D2)",
                "Nuclear receptor subfamily 1 group I member 2 (NR1I2 aka PXR)",
                "Nuclear receptor subfamily 4 group A member 2 (NR4A2 aka NOT, NURR1, TINUR)",
                "Paired box protein Pax-2 (PAX2)",
                "Paired box protein Pax-5 (PAX5)",
                "Paired box protein Pax-6 (PAX6 aka AN2)",
                "Peroxisome proliferator-activated receptor alpha (PPARA aka NR1C1, PPAR)",
                "Peroxisome proliferator-activated receptor gamma (PPARG aka NR1C3)",
                "Peroxisome proliferator-activated receptor gamma coactivator 1-beta (PPARGC1B aka PERC, PGC1, PGC1B, PPARGC1)",
                "Progesterone receptor (PGR aka NR3C3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Retinoic acid receptor RXR-alpha (RXRA aka NR2B1)",
                "Retinoic acid receptor alpha (RARA aka NR1B1)",
                "Retinoic acid receptor gamma (RARG aka NR1B3)",
                "Sex-determining region Y protein (SRY aka TDF)",
                "Signal transducer and activator of transcription 1-alpha/beta (STAT1)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Steroid hormone receptor ERR1 (ESRRA aka ERR1, ESRL1, NR3B1)",
                "T-box transcription factor T (TBXT aka T)",
                "T-box transcription factor TBX1 (TBX1)",
                "T-box transcription factor TBX5 (TBX5)",
                "T-box transcription factor TBX6 (TBX6)",
                "TATA-binding protein-associated factor 172 (BTAF1 aka TAF172)",
                "TP53-binding protein 1 (TP53BP1)",
                "Testis-specific chromodomain protein Y 1 (CDY1 aka CDY1B, CDY1A)",
                "Testis-specific chromodomain protein Y 2 (CDY2A aka CDY2B, CDY2)",
                "Trans-acting T-cell-specific transcription factor GATA-3 (GATA3)",
                "Transcription factor AP-2 gamma (TFAP2C)",
                "Transcription factor AP-2-alpha (TFAP2A aka AP2TF, TFAP2)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F5 (E2F5)",
                "Transcription factor E2F6 (E2F6)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Zinc finger protein GLI1 (GLI1 aka GLI)",
                "Zinc finger protein GLI2 (GLI2 aka THP)",
                "Zinc finger protein GLI4 (GLI4 aka HKR4)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "TP53 (TP53)",
            "MYC (MYC)",
            "NF-kB (NFKB1)",
            "FOXO3 (FOXO3)",
            "STAT3 (STAT3)",
            "CTCF (CTCF)",
            "AP-1 (JUN)",
            "E2F1 (E2F1)",
            "p53 (TP53)",
            "SMAD4 (SMAD4)",
            "GATA3 (GATA3)",
            "C/EBP\u03b1 (CEBPA)",
            "CREB1 (CREB1)",
            "NRF2 (NFE2L2)",
            "HIF1A (HIF1A)",
            "SREBF1 (SREBF1)",
            "RXRA (RXRA)",
            "LEF1 (LEF1)",
            "KLF4 (KLF4)",
            "Oct4 (POU5F1)",
            "c-Myb (MYB)",
            "p65 (RELA)",
            "RFX5 (RFX5)",
            "YY1 (YY1)",
            "TBX5 (TBX5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "MYC",
                "FOXO3",
                "STAT3",
                "CTCF",
                "JUN",
                "E2F1",
                "SMAD4",
                "GATA3",
                "CEBPA",
                "CREB1",
                "NFE2L2",
                "HIF1A",
                "SREBF1",
                "RXRA",
                "LEF1",
                "KLF4",
                "POU5F1",
                "MYB",
                "RELA",
                "RFX5",
                "YY1"
            ],
            "mismatches": [
                "NF-kB",
                "TBX5"
            ],
            "true_referents": [
                "BEN domain-containing protein 6 (BEND6 aka C6orf65)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "C-terminal-binding protein 1 (CTBP1 aka CTBP)",
                "CCAAT/enhancer-binding protein alpha (CEBPA aka CEBP)",
                "CCAAT/enhancer-binding protein epsilon (CEBPE)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "DNA-binding protein RFX5 (RFX5)",
                "ELL-associated factor 1 (EAF1)",
                "Forkhead box protein O3 (FOXO3 aka FKHRL1, FOXO3A)",
                "Forkhead box protein O3B (FOXO3B)",
                "Forkhead box protein O6 (FOXO6)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 3 (KLF3 aka BKLF)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Lymphoid enhancer-binding factor 1 (LEF1)",
                "Mothers against decapentaplegic homolog 4 (SMAD4 aka DPC4, MADH4)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myb-related protein A (MYBL1 aka AMYB)",
                "Myb-related protein B (MYBL2 aka BMYB)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor erythroid 2-related factor 2 (NFE2L2 aka NRF2)",
                "Nuclear factor erythroid 2-related factor 3 (NFE2L3 aka NRF3)",
                "Nuclear respiratory factor 1 (NRF1)",
                "Oxysterols receptor LXR-alpha (NR1H3 aka LXRA)",
                "POU domain, class 2, transcription factor 1 (POU2F1 aka OCT1, OTF1)",
                "POU domain, class 5, transcription factor 1 (POU5F1 aka OCT3, OCT4, OTF3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Putative POU domain, class 5, transcription factor 1B (POU5F1B aka OCT4PG1, OTF3C, OTF3P1, POU5F1P1, POU5FLC20, POU5FLC8)",
                "RING1 and YY1-binding protein (RYBP aka DEDAF, YEAF1)",
                "RelA-associated inhibitor (PPP1R13L aka IASPP, NKIP1, PPP1R13BL, RAI)",
                "Retinoic acid receptor RXR-alpha (RXRA aka NR2B1)",
                "Retinoic acid receptor RXR-beta (RXRB aka NR2B2)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Sterol regulatory element-binding protein 1 (SREBF1 aka BHLHD1, SREBP1)",
                "Sterol regulatory element-binding protein 2 (SREBF2 aka BHLHD2, SREBP2)",
                "TP53-binding protein 1 (TP53BP1)",
                "Trans-acting T-cell-specific transcription factor GATA-3 (GATA3)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F4 (E2F4)",
                "Transcription factor E2F7 (E2F7)",
                "Transcription factor E2F8 (E2F8)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor RFX3 (RFX3)",
                "Transcription factor RFX4 (RFX4)",
                "Transcription factor YY2 (YY2 aka ZNF631)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional activator Myb (MYB)",
                "Transcriptional repressor CTCF (CTCF)",
                "Transcriptional repressor CTCFL (CTCFL aka BORIS)",
                "Transcriptional repressor protein YY1 (YY1 aka INO80S)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "BRCA1 (Breast Cancer 1)",
            "BRCA2 (Breast Cancer 2)",
            "TP53 (Tumor Protein p53)",
            "MYC (MYC Proto-Oncogene)",
            "RB1 (Retinoblastoma 1)",
            "APC (Adenomatous Polyposis Coli)",
            "STAT3 (Signal Transducer and Activator of Transcription 3)",
            "FOXP3 (Forkhead Box P3)",
            "CTNNB1 (Catenin Beta 1)",
            "CREB1 (cAMP Responsive Element Binding Protein 1)",
            "SMAD4 (SMAD Family Member 4)",
            "NOTCH1 (Notch Homolog 1)",
            "NFATC1 (Nuclear Factor of Activated T-cells 1)",
            "RELA (RELA Proto-Oncogene)",
            "FOXO1 (Forkhead Box O1)",
            "ATF2 (Activating Transcription Factor 2)",
            "ATF3 (Activating Transcription Factor 3)",
            "ATF4 (Activating Transcription Factor 4)",
            "ATF5 (Activating Transcription Factor 5)",
            "ATF6 (Activating Transcription Factor 6)",
            "ATF7 (Activating Transcription Factor 7)",
            "ATF1 (Activating Transcription Factor 1)",
            "JUN (Jun Proto-Oncogene)",
            "FOS (Fos Proto-Oncogene)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1 (Breast Cancer 1)",
                "TP53 (Tumor Protein p53)",
                "MYC (MYC Proto-Oncogene)",
                "RB1 (Retinoblastoma 1)",
                "FOXP3 (Forkhead Box P3)",
                "CTNNB1 (Catenin Beta 1)",
                "CREB1 (cAMP Responsive Element Binding Protein 1)",
                "SMAD4 (SMAD Family Member 4)",
                "NOTCH1 (Notch Homolog 1)",
                "NFATC1 (Nuclear Factor of Activated T-cells 1)",
                "FOXO1 (Forkhead Box O1)",
                "ATF2 (Activating Transcription Factor 2)",
                "ATF3 (Activating Transcription Factor 3)",
                "ATF4 (Activating Transcription Factor 4)",
                "ATF5 (Activating Transcription Factor 5)",
                "ATF6 (Activating Transcription Factor 6)",
                "ATF1 (Activating Transcription Factor 1)",
                "JUN (Jun Proto-Oncogene)",
                "FOS (Fos Proto-Oncogene)"
            ],
            "mismatches": [
                "BRCA2 (Breast Cancer 2)",
                "APC (Adenomatous Polyposis Coli)",
                "STAT3 (Signal Transducer and Activator of Transcription 3)",
                "RELA (RELA Proto-Oncogene)",
                "ATF7 (Activating Transcription Factor 7)"
            ],
            "true_referents": [
                "Activating transcription factor 7-interacting protein 1 (ATF7IP aka MCAF, MCAF1)",
                "Activating transcription factor 7-interacting protein 2 (ATF7IP2 aka MCAF2)",
                "Basic leucine zipper transcriptional factor ATF-like 2 (BATF2)",
                "Basic leucine zipper transcriptional factor ATF-like 3 (BATF3 aka SNFT)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Catenin beta-1 (CTNNB1 aka CTNNB, OK/SW-cl.35, PRO2286)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-dependent transcription factor ATF-1 (ATF1)",
                "Cyclic AMP-dependent transcription factor ATF-2 (ATF2 aka CREB2, CREBP1)",
                "Cyclic AMP-dependent transcription factor ATF-3 (ATF3)",
                "Cyclic AMP-dependent transcription factor ATF-4 (ATF4 aka CREB2, TXREB)",
                "Cyclic AMP-dependent transcription factor ATF-5 (ATF5 aka ATFX)",
                "Cyclic AMP-dependent transcription factor ATF-6 alpha (ATF6)",
                "Cyclic AMP-dependent transcription factor ATF-7 (ATF7 aka ATFA)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 5 (CREB5 aka CREBPA)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Estrogen receptor beta (ESR2 aka ESTRB, NR3A2)",
                "Forkhead box protein I3 (FOXI3)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Forkhead box protein O4 (FOXO4 aka AFX, AFX1, MLLT7)",
                "Forkhead box protein O6 (FOXO6)",
                "Forkhead box protein P1 (FOXP1 aka HSPC215)",
                "Forkhead box protein P3 (FOXP3 aka IPEX, JM2)",
                "Fos-related antigen 1 (FOSL1 aka FRA1)",
                "Methyl-CpG-binding protein 2 (MECP2)",
                "Mothers against decapentaplegic homolog 4 (SMAD4 aka DPC4, MADH4)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myb-binding protein 1A (MYBBP1A aka P160)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Netrin-1 (NTN1 aka NTN1L)",
                "Netrin-3 (NTN3 aka NTN2L)",
                "Neural retina-specific leucine zipper protein (NRL aka D14S46E)",
                "Neurogenic locus notch homolog protein 1 (NOTCH1 aka TAN1)",
                "Neurogenic locus notch homolog protein 2 (NOTCH2)",
                "Neurogenic locus notch homolog protein 4 (NOTCH4 aka INT3)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1 aka NFAT2, NFATC)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2 aka NFAT1, NFATP)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4 aka NFAT3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Protein c-Fos (FOS aka G0S7)",
                "Proto-oncogene c-Rel (REL)",
                "RelA-associated inhibitor (PPP1R13L aka IASPP, NKIP1, PPP1R13BL, RAI)",
                "Retinoblastoma-associated protein (RB1)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A aka STAT5)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F7 (E2F7)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor JunD (JUND)",
                "Transcription factor RelB (RELB)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "p53 gene",
            "BRCA1 gene",
            "STAT3 gene",
            "NF-kB gene",
            "HIF-1 gene",
            "MYC gene",
            "AP-1 gene",
            "CREB gene",
            "ERK gene",
            "JUN gene",
            "FOS gene",
            "NFKB1 gene",
            "NFKB2 gene",
            "REL gene",
            "STAT1 gene",
            "STAT2 gene",
            "STAT4 gene",
            "STAT5 gene",
            "STAT6 gene",
            "STAT7 gene",
            "TP53 gene",
            "ETS1 gene",
            "ETS2 gene",
            "BCL6 gene"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1 gene",
                "STAT3 gene",
                "MYC gene",
                "JUN gene",
                "FOS gene",
                "NFKB1 gene",
                "NFKB2 gene",
                "REL gene",
                "STAT1 gene",
                "STAT2 gene",
                "STAT4 gene",
                "STAT6 gene",
                "TP53 gene",
                "ETS1 gene",
                "ETS2 gene"
            ],
            "mismatches": [
                "p53 gene",
                "NF-kB gene",
                "HIF-1 gene",
                "AP-1 gene",
                "CREB gene",
                "ERK gene",
                "STAT5 gene",
                "STAT7 gene",
                "BCL6 gene"
            ],
            "true_referents": [
                "B-cell CLL/lymphoma 6 member B protein (BCL6B aka BAZF, ZNF62)",
                "B-cell lymphoma 6 protein (BCL6 aka BCL5, LAZ3, ZBTB27, ZNF51)",
                "BCL-6 corepressor (BCOR aka KIAA1575)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "ETS domain-containing transcription factor ERF (ERF)",
                "ETS domain-containing transcription factor ERF-like (ERFL)",
                "ETS homologous factor (EHF aka ESE3, ESE3B, ESEJ)",
                "ETS translocation variant 2 (ETV2 aka ER71, ETSRP71)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Fos-related antigen 1 (FOSL1 aka FRA1)",
                "Fos-related antigen 2 (FOSL2 aka FRA2)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "POU class 2 homeobox associating factor 3 (POU2AF3 aka C11orf93, CASC13, COLCA2)",
                "Protein C-ets-1 (ETS1 aka EWSR2)",
                "Protein C-ets-2 (ETS2)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Protein c-Fos (FOS aka G0S7)",
                "Proto-oncogene c-Rel (REL)",
                "RE1-silencing transcription factor (REST aka NRSF, XBR)",
                "Signal transducer and activator of transcription 1-alpha/beta (STAT1)",
                "Signal transducer and activator of transcription 2 (STAT2)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A aka STAT5)",
                "Signal transducer and activator of transcription 5B (STAT5B)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor AP-2-epsilon (TFAP2E)",
                "Transcription factor AP-4 (TFAP4 aka BHLHC41)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor JunD (JUND)",
                "Transcription factor RelB (RELB)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional regulator ERG (ERG)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "TP53 (p53)",
            "MYC (c-Myc)",
            "NF-\u03baB (RELA)",
            "GATA3",
            "CREB1",
            "E2F1",
            "STAT3",
            "SOX9",
            "FOXO1",
            "HIF1A",
            "AP-1 (FOS, JUN)",
            "PAX6",
            "SMAD4",
            "ELK1",
            "SP1",
            "RUNX1",
            "CEBPA",
            "NFKB1",
            "NFATC1",
            "IRF4",
            "ETS1",
            "KLF4",
            "NRF2 (NF-E2-related factor 2)",
            "CTNNB1 (\u03b2-Catenin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53 (p53)",
                "MYC (c-Myc)",
                "RELA",
                "GATA3",
                "CREB1",
                "STAT3",
                "SOX9",
                "FOXO1",
                "HIF1A",
                "PAX6",
                "SMAD4",
                "ELK1",
                "SP1",
                "RUNX1",
                "CEBPA",
                "NFKB1",
                "NFATC1",
                "IRF4",
                "ETS1",
                "KLF4",
                "NRF2 (NF-E2-related factor 2)",
                "CTNNB1 (\u03b2-Catenin)"
            ],
            "mismatches": [
                "E2F1",
                "AP-1 (FOS, JUN)"
            ],
            "true_referents": [
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CCAAT/enhancer-binding protein alpha (CEBPA aka CEBP)",
                "CCAAT/enhancer-binding protein epsilon (CEBPE)",
                "CCAAT/enhancer-binding protein gamma (CEBPG)",
                "Catenin beta-1 (CTNNB1 aka CTNNB, OK/SW-cl.35, PRO2286)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "Double homeobox protein 1 (DUX1)",
                "ETS domain-containing protein Elk-1 (ELK1)",
                "ETS domain-containing protein Elk-3 (ELK3 aka NET, SAP2)",
                "ETS domain-containing protein Elk-4 (ELK4 aka SAP1)",
                "ETS homologous factor (EHF aka ESE3, ESE3B, ESEJ)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Forkhead box protein O4 (FOXO4 aka AFX, AFX1, MLLT7)",
                "Forkhead box protein O6 (FOXO6)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Interferon regulatory factor 1 (IRF1)",
                "Interferon regulatory factor 3 (IRF3)",
                "Interferon regulatory factor 4 (IRF4 aka MUM1)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 3 (KLF3 aka BKLF)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Mothers against decapentaplegic homolog 4 (SMAD4 aka DPC4, MADH4)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Netrin-1 (NTN1 aka NTN1L)",
                "Netrin-3 (NTN3 aka NTN2L)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor erythroid 2-related factor 2 (NFE2L2 aka NRF2)",
                "Nuclear factor erythroid 2-related factor 3 (NFE2L3 aka NRF3)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1 aka NFAT2, NFATC)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2 aka NFAT1, NFATP)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4 aka NFAT3)",
                "Nuclear respiratory factor 1 (NRF1)",
                "Paired box protein Pax-2 (PAX2)",
                "Paired box protein Pax-5 (PAX5)",
                "Paired box protein Pax-6 (PAX6 aka AN2)",
                "Protein C-ets-1 (ETS1 aka EWSR2)",
                "Protein C-ets-2 (ETS2)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Runt-related transcription factor 1 (RUNX1 aka AML1, CBFA2)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "TP53-binding protein 1 (TP53BP1)",
                "Trans-acting T-cell-specific transcription factor GATA-3 (GATA3)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F7 (E2F7)",
                "Transcription factor E2F8 (E2F8)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor LBX1 (LBX1 aka LBX1H)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-5 (SOX5)",
                "Transcription factor SOX-9 (SOX9)",
                "Transcription factor Sp1 (SP1 aka TSFP1)",
                "Transcription factor Sp3 (SP3)",
                "Transcription factor Sp5 (SP5)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "FOXP3 (Forkhead box P3)",
            "TP53 (Tumor protein p53)",
            "MYC (MYC proto-oncogene)",
            "BRCA1 (Breast cancer type 1 susceptibility protein)",
            "NF-\u03baB (Nuclear factor kappa B)",
            "HIF1A (Hypoxia-inducible factor 1-alpha)",
            "STAT3 (Signal transducer and activator of transcription 3)",
            "RUNX2 (Runt-related transcription factor 2)",
            "SOX2 (SRY-box transcription factor 2)",
            "OCT4 (Octamer-binding transcription factor 4)",
            "NANOG (Nanog homeobox)",
            "ESR1 (Estrogen receptor 1)",
            "AR (Androgen receptor)",
            "PPARG (Peroxisome proliferator-activated receptor gamma)",
            "NFKBIA (NFKB inhibitor alpha)",
            "GATA4 (GATA binding protein 4)",
            "PAX6 (Paired box 6)",
            "CREB1 (cAMP responsive element binding protein 1)",
            "E2F1 (E2F transcription factor 1)",
            "NOTCH1 (Notch receptor 1)",
            "SMAD4 (SMAD family member 4)",
            "RELA (RELA proto-oncogene, NF-kB subunit)",
            "NFATC1 (Nuclear factor of activated T cells 1)",
            "TFAP2A (Transcription factor AP-2 alpha)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "FOXP3 (Forkhead box P3)",
                "TP53 (Tumor protein p53)",
                "MYC (MYC proto-oncogene)",
                "BRCA1 (Breast cancer type 1 susceptibility protein)",
                "HIF1A (Hypoxia-inducible factor 1-alpha)",
                "RUNX2 (Runt-related transcription factor 2)",
                "SOX2 (SRY-box transcription factor 2)",
                "NANOG (Nanog homeobox)",
                "ESR1 (Estrogen receptor 1)",
                "AR (Androgen receptor)",
                "PPARG (Peroxisome proliferator-activated receptor gamma)",
                "GATA4 (GATA binding protein 4)",
                "PAX6 (Paired box 6)",
                "CREB1 (cAMP responsive element binding protein 1)",
                "E2F1 (E2F transcription factor 1)",
                "NOTCH1 (Notch receptor 1)",
                "SMAD4 (SMAD family member 4)",
                "RELA (RELA proto-oncogene, NF-kB subunit)",
                "NFATC1 (Nuclear factor of activated T cells 1)",
                "TFAP2A (Transcription factor AP-2 alpha)"
            ],
            "mismatches": [
                "NF-\u03baB (Nuclear factor kappa B)",
                "STAT3 (Signal transducer and activator of transcription 3)",
                "OCT4 (Octamer-binding transcription factor 4)",
                "NFKBIA (NFKB inhibitor alpha)"
            ],
            "true_referents": [
                "Androgen receptor (AR aka DHTR, NR3C4)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 5 (CREB5 aka CREBPA)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Estrogen receptor beta (ESR2 aka ESTRB, NR3A2)",
                "Forkhead box protein I3 (FOXI3)",
                "Forkhead box protein P1 (FOXP1 aka HSPC215)",
                "Forkhead box protein P3 (FOXP3 aka IPEX, JM2)",
                "Homeobox protein NANOG (NANOG)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Mothers against decapentaplegic homolog 4 (SMAD4 aka DPC4, MADH4)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "NANOG neighbor homeobox (NANOGNB)",
                "NF-kappa-B inhibitor beta (NFKBIB aka IKBB, TRIP9)",
                "NF-kappa-B inhibitor zeta (NFKBIZ aka IKBZ, INAP, MAIL)",
                "Neurogenic locus notch homolog protein 1 (NOTCH1 aka TAN1)",
                "Neurogenic locus notch homolog protein 2 (NOTCH2)",
                "Neurogenic locus notch homolog protein 4 (NOTCH4 aka INT3)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1 aka NFAT2, NFATC)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2 aka NFAT1, NFATP)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4 aka NFAT3)",
                "Paired box protein Pax-2 (PAX2)",
                "Paired box protein Pax-5 (PAX5)",
                "Paired box protein Pax-6 (PAX6 aka AN2)",
                "Peroxisome proliferator-activated receptor alpha (PPARA aka NR1C1, PPAR)",
                "Peroxisome proliferator-activated receptor gamma (PPARG aka NR1C3)",
                "Peroxisome proliferator-activated receptor gamma coactivator 1-beta (PPARGC1B aka PERC, PGC1, PGC1B, PPARGC1)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Putative homeobox protein NANOG2 (NANOGP1 aka NANOG2)",
                "RelA-associated inhibitor (PPP1R13L aka IASPP, NKIP1, PPP1R13BL, RAI)",
                "Runt-related transcription factor 1 (RUNX1 aka AML1, CBFA2)",
                "Runt-related transcription factor 2 (RUNX2 aka AML3, CBFA1, OSF2, PEBP2A)",
                "Runt-related transcription factor 3 (RUNX3 aka AML2, CBFA3, PEBP2A3)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A aka STAT5)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Steroid hormone receptor ERR1 (ESRRA aka ERR1, ESRL1, NR3B1)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor AP-2 gamma (TFAP2C)",
                "Transcription factor AP-2-alpha (TFAP2A aka AP2TF, TFAP2)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F4 (E2F4)",
                "Transcription factor E2F5 (E2F5)",
                "Transcription factor GATA-4 (GATA4)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor SOX-4 (SOX4)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "TP53 (p53)",
            "MYC",
            "FOXP3",
            "HIF1A (HIF-1\u03b1)",
            "NFE2L2 (Nrf2)",
            "STAT3",
            "CEBPA (C/EBP\u03b1)",
            "PPARG (PPAR\u03b3)",
            "ESR1 (ER\u03b1)",
            "AR (Androgen Receptor)",
            "NR3C1 (Glucocorticoid Receptor)",
            "NFKB1 (NF-\u03baB1)",
            "RELA (NF-\u03baB p65)",
            "SP1",
            "EGR1",
            "FOS",
            "JUN",
            "CREB1",
            "ATF4",
            "DDIT3 (CHOP)",
            "TFAP2A (AP-2\u03b1)",
            "GATA1",
            "PAX6",
            "SOX2"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53",
                "MYC",
                "FOXP3",
                "HIF1A",
                "NFE2L2",
                "STAT3",
                "CEBPA",
                "PPARG",
                "ESR1",
                "AR",
                "NR3C1",
                "NFKB1",
                "RELA",
                "SP1",
                "EGR1",
                "FOS",
                "JUN",
                "CREB1",
                "DDIT3",
                "TFAP2A",
                "PAX6",
                "SOX2"
            ],
            "mismatches": [
                "ATF4",
                "GATA1"
            ],
            "true_referents": [
                "Androgen receptor (AR aka DHTR, NR3C4)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CCAAT/enhancer-binding protein alpha (CEBPA aka CEBP)",
                "CCAAT/enhancer-binding protein epsilon (CEBPE)",
                "CCAAT/enhancer-binding protein gamma (CEBPG)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-dependent transcription factor ATF-1 (ATF1)",
                "Cyclic AMP-dependent transcription factor ATF-5 (ATF5 aka ATFX)",
                "Cyclic AMP-dependent transcription factor ATF-7 (ATF7 aka ATFA)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "DNA damage-inducible transcript 3 protein (DDIT3 aka CHOP, CHOP10, GADD153)",
                "Early growth response protein 1 (EGR1 aka KROX24, ZNF225)",
                "Early growth response protein 3 (EGR3 aka PILOT)",
                "Early growth response protein 4 (EGR4)",
                "Endoplasmic reticulum membrane sensor NFE2L1 (NFE2L1 aka HBZ17, NRF1, TCF11)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Forkhead box protein P1 (FOXP1 aka HSPC215)",
                "Forkhead box protein P3 (FOXP3 aka IPEX, JM2)",
                "Fos-related antigen 1 (FOSL1 aka FRA1)",
                "Glucocorticoid receptor (NR3C1 aka GRL)",
                "Histone deacetylase 1 (HDAC1 aka RPD3L1)",
                "Histone deacetylase 3 (HDAC3)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Interferon regulatory factor 3 (IRF3)",
                "Mineralocorticoid receptor (NR3C2 aka MCR, MLR)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor erythroid 2-related factor 2 (NFE2L2 aka NRF2)",
                "Nuclear factor erythroid 2-related factor 3 (NFE2L3 aka NRF3)",
                "Nuclear receptor subfamily 1 group I member 3 (NR1I3 aka CAR)",
                "Paired box protein Pax-2 (PAX2)",
                "Paired box protein Pax-5 (PAX5)",
                "Paired box protein Pax-6 (PAX6 aka AN2)",
                "Peroxisome proliferator-activated receptor alpha (PPARA aka NR1C1, PPAR)",
                "Peroxisome proliferator-activated receptor gamma (PPARG aka NR1C3)",
                "Peroxisome proliferator-activated receptor gamma coactivator 1-beta (PPARGC1B aka PERC, PGC1, PGC1B, PPARGC1)",
                "Protein FosB (FOSB aka G0S3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Protein c-Fos (FOS aka G0S7)",
                "RelA-associated inhibitor (PPP1R13L aka IASPP, NKIP1, PPP1R13BL, RAI)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Steroid hormone receptor ERR1 (ESRRA aka ERR1, ESRL1, NR3B1)",
                "Steroid hormone receptor ERR2 (ESRRB aka ERRB2, ESRL2, NR3B2)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor AP-2-alpha (TFAP2A aka AP2TF, TFAP2)",
                "Transcription factor AP-2-beta (TFAP2B)",
                "Transcription factor AP-2-epsilon (TFAP2E)",
                "Transcription factor GATA-4 (GATA4)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor JunD (JUND)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor Sp1 (SP1 aka TSFP1)",
                "Transcription factor Sp3 (SP3)",
                "Transcription factor Sp5 (SP5)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "CREB1 (cAMP responsive element binding protein 1)",
            "NF-\u03baB (nuclear factor kappa-light-chain-enhancer of activated B cells)",
            "TP53 (tumor protein p53)",
            "MYC (MYC proto-oncogene, bHLH transcription factor)",
            "FOXO3 (forkhead box O3)",
            "HIF1A (hypoxia inducible factor 1 subunit alpha)",
            "PPARG (peroxisome proliferator activated receptor gamma)",
            "STAT3 (signal transducer and activator of transcription 3)",
            "NFKB1 (nuclear factor kappa B subunit 1)",
            "JUN (jun proto-oncogene, AP-1 transcription factor subunit)",
            "ESR1 (estrogen receptor 1)",
            "RELA (RELA proto-oncogene, NF-kB subunit)",
            "RUNX2 (runt related transcription factor 2)",
            "FOXP3 (forkhead box P3)",
            "SMAD3 (SMAD family member 3)",
            "GATA3 (GATA binding protein 3)",
            "NFATC1 (nuclear factor of activated T-cells 1)",
            "HNF4A (hepatocyte nuclear factor 4 alpha)",
            "SOX2 (SRY-box transcription factor 2)",
            "NANOG (Nanog homeobox)",
            "POU5F1 (POU class 5 homeobox 1)",
            "KLF4 (Kruppel like factor 4)",
            "MYB (MYB proto-oncogene, transcription factor)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "CREB1 (cAMP responsive element binding protein 1)",
                "TP53 (tumor protein p53)",
                "MYC (MYC proto-oncogene, bHLH transcription factor)",
                "FOXO3 (forkhead box O3)",
                "HIF1A (hypoxia inducible factor 1 subunit alpha)",
                "PPARG (peroxisome proliferator activated receptor gamma)",
                "NFKB1 (nuclear factor kappa B subunit 1)",
                "JUN (jun proto-oncogene, AP-1 transcription factor subunit)",
                "ESR1 (estrogen receptor 1)",
                "RELA (RELA proto-oncogene, NF-kB subunit)",
                "RUNX2 (runt related transcription factor 2)",
                "FOXP3 (forkhead box P3)",
                "SMAD3 (SMAD family member 3)",
                "GATA3 (GATA binding protein 3)",
                "NFATC1 (nuclear factor of activated T-cells 1)",
                "HNF4A (hepatocyte nuclear factor 4 alpha)",
                "SOX2 (SRY-box transcription factor 2)",
                "NANOG (Nanog homeobox)",
                "POU5F1 (POU class 5 homeobox 1)",
                "KLF4 (Kruppel like factor 4)",
                "MYB (MYB proto-oncogene, transcription factor)"
            ],
            "mismatches": [
                "NF-\u03baB (nuclear factor kappa-light-chain-enhancer of activated B cells)",
                "STAT3 (signal transducer and activator of transcription 3)"
            ],
            "true_referents": [
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 5 (CREB5 aka CREBPA)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Estrogen receptor beta (ESR2 aka ESTRB, NR3A2)",
                "Forkhead box protein I3 (FOXI3)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Forkhead box protein O3 (FOXO3 aka FKHRL1, FOXO3A)",
                "Forkhead box protein O6 (FOXO6)",
                "Forkhead box protein P1 (FOXP1 aka HSPC215)",
                "Forkhead box protein P3 (FOXP3 aka IPEX, JM2)",
                "Hepatocyte nuclear factor 1-alpha (HNF1A aka TCF1)",
                "Hepatocyte nuclear factor 3-alpha (FOXA1 aka HNF3A, TCF3A)",
                "Hepatocyte nuclear factor 4-alpha (HNF4A aka HNF4, NR2A1, TCF14)",
                "Homeobox protein NANOG (NANOG)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 3 (KLF3 aka BKLF)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Mothers against decapentaplegic homolog 3 (SMAD3 aka MADH3)",
                "Mothers against decapentaplegic homolog 5 (SMAD5 aka MADH5)",
                "Mothers against decapentaplegic homolog 9 (SMAD9 aka MADH6, MADH9, SMAD8)",
                "Myb-binding protein 1A (MYBBP1A aka P160)",
                "Myb-related protein B (MYBL2 aka BMYB)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "NANOG neighbor homeobox (NANOGNB)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1 aka NFAT2, NFATC)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2 aka NFAT1, NFATP)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4 aka NFAT3)",
                "POU domain, class 5, transcription factor 1 (POU5F1 aka OCT3, OCT4, OTF3)",
                "POU domain, class 6, transcription factor 1 (POU6F1 aka BRN5, MPOU, TCFB1)",
                "Peroxisome proliferator-activated receptor alpha (PPARA aka NR1C1, PPAR)",
                "Peroxisome proliferator-activated receptor gamma (PPARG aka NR1C3)",
                "Peroxisome proliferator-activated receptor gamma coactivator 1-beta (PPARGC1B aka PERC, PGC1, PGC1B, PPARGC1)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Putative POU domain, class 5, transcription factor 1B (POU5F1B aka OCT4PG1, OTF3C, OTF3P1, POU5F1P1, POU5FLC20, POU5FLC8)",
                "Putative homeobox protein NANOG2 (NANOGP1 aka NANOG2)",
                "RelA-associated inhibitor (PPP1R13L aka IASPP, NKIP1, PPP1R13BL, RAI)",
                "Runt-related transcription factor 1 (RUNX1 aka AML1, CBFA2)",
                "Runt-related transcription factor 2 (RUNX2 aka AML3, CBFA1, OSF2, PEBP2A)",
                "Runt-related transcription factor 3 (RUNX3 aka AML2, CBFA3, PEBP2A3)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A aka STAT5)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Steroid hormone receptor ERR1 (ESRRA aka ERR1, ESRL1, NR3B1)",
                "TP53-binding protein 1 (TP53BP1)",
                "Trans-acting T-cell-specific transcription factor GATA-3 (GATA3)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor JunD (JUND)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional activator Myb (MYB)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 21,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "BRCA1 (BRCA1)",
            "TP53 (TP53)",
            "KRAS (KRAS)",
            "EGFR (EGFR)",
            "MYC (MYC)",
            "NF-\u03baB (NFKB1)",
            "HIF1A (HIF1A)",
            "STAT3 (STAT3)",
            "NOTCH1 (NOTCH1)",
            "RUNX1 (RUNX1)",
            "GATA1 (GATA1)",
            "POU5F1 (POU5F1)",
            "SOX2 (SOX2)",
            "NANOG (NANOG)",
            "KLF4 (KLF4)",
            "c-FOS (FOS)",
            "c-JUN (JUN)",
            "CEBPA (CEBPA)",
            "PPARG (PPARG)",
            "MYOD1 (MYOD1)",
            "MYOG (MYOG)",
            "GATA4 (GATA4)",
            "NKX2-5 (NKX2-5)",
            "MEF2C (MEF2C)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1 (BRCA1)",
                "TP53 (TP53)",
                "MYC (MYC)",
                "HIF1A (HIF1A)",
                "STAT3 (STAT3)",
                "NOTCH1 (NOTCH1)",
                "POU5F1 (POU5F1)",
                "SOX2 (SOX2)",
                "NANOG (NANOG)",
                "KLF4 (KLF4)",
                "c-FOS (FOS)",
                "c-JUN (JUN)",
                "CEBPA (CEBPA)",
                "PPARG (PPARG)",
                "MYOD1 (MYOD1)",
                "MYOG (MYOG)",
                "GATA4 (GATA4)",
                "NKX2-5 (NKX2-5)",
                "MEF2C (MEF2C)"
            ],
            "mismatches": [
                "KRAS (KRAS)",
                "EGFR (EGFR)",
                "NF-\u03baB (NFKB1)",
                "RUNX1 (RUNX1)",
                "GATA1 (GATA1)"
            ],
            "true_referents": [
                "Androgen receptor (AR aka DHTR, NR3C4)",
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CCAAT/enhancer-binding protein alpha (CEBPA aka CEBP)",
                "CCAAT/enhancer-binding protein epsilon (CEBPE)",
                "CCAAT/enhancer-binding protein gamma (CEBPG)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "E3 ubiquitin-protein ligase DTX1 (DTX1)",
                "Endothelial differentiation-related factor 1 (EDF1)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Fos-related antigen 1 (FOSL1 aka FRA1)",
                "Homeobox protein CDX-1 (CDX1)",
                "Homeobox protein NANOG (NANOG)",
                "Homeobox protein Nkx-2.2 (NKX2-2 aka NKX2.2, NKX2B)",
                "Homeobox protein Nkx-2.5 (NKX2-5 aka CSX, NKX2.5, NKX2E)",
                "Homeobox protein Nkx-2.6 (NKX2-6 aka NKX2F)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 3 (KLF3 aka BKLF)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "MEF2-activating motif and SAP domain-containing transcriptional regulator (MAMSTR aka MASTR)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "Myoblast determination protein 1 (MYOD1 aka BHLHC1, MYF3, MYOD)",
                "Myocardin (MYOCD aka MYCD)",
                "Myocyte-specific enhancer factor 2A (MEF2A aka MEF2)",
                "Myocyte-specific enhancer factor 2C (MEF2C)",
                "Myogenin (MYOG aka BHLHC3, MYF4)",
                "Myoneurin (MYNN aka OSZF, ZBTB31, SBBIZ1)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "NANOG neighbor homeobox (NANOGNB)",
                "Neurogenic locus notch homolog protein 1 (NOTCH1 aka TAN1)",
                "Neurogenic locus notch homolog protein 2 (NOTCH2)",
                "Neurogenic locus notch homolog protein 4 (NOTCH4 aka INT3)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "POU domain, class 5, transcription factor 1 (POU5F1 aka OCT3, OCT4, OTF3)",
                "POU domain, class 6, transcription factor 1 (POU6F1 aka BRN5, MPOU, TCFB1)",
                "Peroxisome proliferator-activated receptor gamma (PPARG aka NR1C3)",
                "Peroxisome proliferator-activated receptor gamma coactivator 1-beta (PPARGC1B aka PERC, PGC1, PGC1B, PPARGC1)",
                "Peroxisome proliferator-activated receptor gamma coactivator-related protein 1 (PPRC1 aka KIAA0595)",
                "Pro-neuregulin-1, membrane-bound isoform (NRG1 aka GGF, HGL, HRGA, NDF, SMDF)",
                "Protein FosB (FOSB aka G0S3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Protein c-Fos (FOS aka G0S7)",
                "Putative POU domain, class 5, transcription factor 1B (POU5F1B aka OCT4PG1, OTF3C, OTF3P1, POU5F1P1, POU5FLC20, POU5FLC8)",
                "Putative homeobox protein NANOG2 (NANOGP1 aka NANOG2)",
                "Ras-related protein Rap-2c (RAP2C)",
                "Retinoic acid receptor RXR-alpha (RXRA aka NR2B1)",
                "Retinoic acid receptor alpha (RARA aka NR1B1)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor GATA-4 (GATA4)",
                "Transcription factor GATA-5 (GATA5)",
                "Transcription factor GATA-6 (GATA6)",
                "Transcription factor Jun (JUN)",
                "Transcription factor JunB (JUNB)",
                "Transcription factor JunD (JUND)",
                "Transcription factor LBX1 (LBX1 aka LBX1H)",
                "Transcription factor SOX-1 (SOX1)",
                "Transcription factor SOX-12 (SOX12 aka SOX22)",
                "Transcription factor SOX-2 (SOX2)",
                "Transcription factor p65 (RELA aka NFKB3)"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "E2F1 (E2F transcription factor 1)",
            "E2F2 (E2F transcription factor 2)",
            "E2F3 (E2F transcription factor 3)",
            "E2F4 (E2F transcription factor 4)",
            "E2F5 (E2F transcription factor 5)",
            "E2F6 (E2F transcription factor 6)",
            "E2F7 (E2F transcription factor 7)",
            "E2F8 (E2F transcription factor 8)",
            "E2F9 (E2F transcription factor 9)",
            "E2F transcription factor 1",
            "E2F transcription factor 2",
            "E2F transcription factor 3",
            "E2F transcription factor 4",
            "E2F transcription factor 5",
            "E2F transcription factor 6",
            "E2F transcription factor 7",
            "E2F transcription factor 8",
            "E2F transcription factor 9",
            "YY1 (Yin Yang 1)",
            "Yin Yang 1",
            "CREB (cAMP response element-binding protein)",
            "cAMP response element-binding protein",
            "NF-\u03baB (nuclear factor kappa B)",
            "nuclear factor kappa B",
            "STAT1 (signal transducer and activator of transcription 1)",
            "signal transducer and activator of transcription 1",
            "STAT3 (signal transducer and activator of transcription 3)",
            "signal transducer and activator of transcription 3",
            "STAT5 (signal transducer and activator of transcription 5)",
            "signal transducer and activator of transcription 5",
            "STAT6 (signal transducer and activator of transcription 6)",
            "signal transducer and activator of transcription 6",
            "p53 (tumor protein p53)",
            "tumor protein p53",
            "p63 (tumor protein p63)",
            "tumor protein p63",
            "p73 (tumor protein p73)",
            "tumor protein p73"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E2F1 (E2F transcription factor 1)",
                "E2F2 (E2F transcription factor 2)",
                "E2F3 (E2F transcription factor 3)",
                "E2F4 (E2F transcription factor 4)",
                "E2F5 (E2F transcription factor 5)",
                "E2F6 (E2F transcription factor 6)",
                "E2F7 (E2F transcription factor 7)",
                "E2F8 (E2F transcription factor 8)",
                "YY1 (Yin Yang 1)"
            ],
            "mismatches": [
                "E2F9 (E2F transcription factor 9)",
                "E2F transcription factor 1",
                "E2F transcription factor 2",
                "E2F transcription factor 3",
                "E2F transcription factor 4",
                "E2F transcription factor 5",
                "E2F transcription factor 6",
                "E2F transcription factor 7",
                "E2F transcription factor 8",
                "E2F transcription factor 9",
                "Yin Yang 1",
                "CREB (cAMP response element-binding protein)",
                "cAMP response element-binding protein",
                "NF-\u03baB (nuclear factor kappa B)",
                "nuclear factor kappa B",
                "STAT1 (signal transducer and activator of transcription 1)",
                "signal transducer and activator of transcription 1",
                "STAT3 (signal transducer and activator of transcription 3)",
                "signal transducer and activator of transcription 3",
                "STAT5 (signal transducer and activator of transcription 5)",
                "signal transducer and activator of transcription 5",
                "STAT6 (signal transducer and activator of transcription 6)",
                "signal transducer and activator of transcription 6",
                "p53 (tumor protein p53)",
                "tumor protein p53",
                "p63 (tumor protein p63)",
                "tumor protein p63",
                "p73 (tumor protein p73)",
                "tumor protein p73"
            ],
            "true_referents": [
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 5 (CREB5 aka CREBPA)",
                "Geminin (GMNN)",
                "Max dimerization protein 1 (MXD1 aka MAD)",
                "NF-kappa-B-repressing factor (NKRF aka ITBA4, NRF)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "RING1 and YY1-binding protein (RYBP aka DEDAF, YEAF1)",
                "Transcription factor 4 (TCF4 aka BHLHB19, ITF2, SEF2)",
                "Transcription factor 7 (TCF7 aka TCF1)",
                "Transcription factor E2F1 (E2F1 aka RBBP3)",
                "Transcription factor E2F2 (E2F2)",
                "Transcription factor E2F3 (E2F3 aka KIAA0075)",
                "Transcription factor E2F4 (E2F4)",
                "Transcription factor E2F5 (E2F5)",
                "Transcription factor E2F6 (E2F6)",
                "Transcription factor E2F7 (E2F7)",
                "Transcription factor E2F8 (E2F8)",
                "Transcription factor E4F1 (E4F1 aka E4F)",
                "Transcription factor YY2 (YY2 aka ZNF631)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "Transcriptional repressor protein YY1 (YY1 aka INO80S)",
                "Visual system homeobox 1 (VSX1 aka RINX)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 9,
            "FP": 29,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            "TP53 (TP53)",
            "MYC (MYC)",
            "NF-\u03baB1 (NFKB1)",
            "NF-\u03baB2 (NFKB2)",
            "p53 (TP53)",
            "c-Myc (MYC)",
            "RelA (NFKB1)",
            "RelB (NFKB2)",
            "NFATC1 (NFATC1)",
            "NFATC2 (NFATC2)",
            "NFATC3 (NFATC3)",
            "NFATC4 (NFATC4)",
            "STAT1 (STAT1)",
            "STAT2 (STAT2)",
            "STAT3 (STAT3)",
            "STAT4 (STAT4)",
            "STAT5A (STAT5A)",
            "STAT5B (STAT5B)",
            "STAT6 (STAT6)",
            "CREB1 (CREB1)",
            "CREBBP (CREBBP)",
            "EP300 (EP300)",
            "PCAF (PCAF)",
            "p300 (EP300)",
            "CBP (CREBBP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2)",
                "Cellular tumor antigen p53 (TP53)",
                "Myc proto-oncogene protein (MYC)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2)",
                "Nuclear factor of activated T-cells, cytoplasmic 3 (NFATC3)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4)",
                "Signal transducer and activator of transcription 1-alpha/beta (STAT1)",
                "Signal transducer and activator of transcription 2 (STAT2)",
                "Signal transducer and activator of transcription 3 (STAT3)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A)",
                "Signal transducer and activator of transcription 5B (STAT5B)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "CREB-binding protein (CREBBP)",
                "Histone acetyltransferase p300 (EP300)",
                "Histone acetyltransferase KAT2B (KAT2B)"
            ],
            "mismatches": [
                "RelA (NFKB1)",
                "RelB (NFKB2)"
            ],
            "true_referents": [
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "CREB-binding protein (CREBBP aka CBP)",
                "Cbp/p300-interacting transactivator 1 (CITED1 aka MSG1)",
                "Cbp/p300-interacting transactivator 2 (CITED2 aka MRG1)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Cyclic AMP-responsive element-binding protein 1 (CREB1)",
                "Cyclic AMP-responsive element-binding protein 3-like protein 3 (CREB3L3 aka CREBH, HYST1481)",
                "Cyclic AMP-responsive element-binding protein 5 (CREB5 aka CREBPA)",
                "EP300-interacting inhibitor of differentiation 1 (EID1 aka C15orf3, CRI1, RBP21, PNAS-22, PTD014)",
                "EP300-interacting inhibitor of differentiation 2B (EID2B aka EID3)",
                "Histone acetyltransferase KAT2B (KAT2B aka PCAF)",
                "Histone acetyltransferase p300 (EP300 aka P300)",
                "Lipopolysaccharide-induced tumor necrosis factor-alpha factor (LITAF aka PIG7, SIMPLE)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Nuclear factor of activated T-cells, cytoplasmic 1 (NFATC1 aka NFAT2, NFATC)",
                "Nuclear factor of activated T-cells, cytoplasmic 2 (NFATC2 aka NFAT1, NFATP)",
                "Nuclear factor of activated T-cells, cytoplasmic 3 (NFATC3 aka NFAT4)",
                "Nuclear factor of activated T-cells, cytoplasmic 4 (NFATC4 aka NFAT3)",
                "Protein L-Myc (MYCL aka BHLHE38, LMYC, MYCL1)",
                "Signal transducer and activator of transcription 1-alpha/beta (STAT1)",
                "Signal transducer and activator of transcription 2 (STAT2)",
                "Signal transducer and activator of transcription 3 (STAT3 aka APRF)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A aka STAT5)",
                "Signal transducer and activator of transcription 5B (STAT5B)",
                "Signal transducer and activator of transcription 6 (STAT6)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor MafF (MAFF)",
                "Transcription factor RelB (RELB)",
                "Transcription factor p65 (RELA aka NFKB3)",
                "cAMP-responsive element-binding protein-like 2 (CREBL2)"
            ],
            "TP": 19,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "transcription regulation gene",
        "domain": "biology",
        "response": [
            {
                "Referent": "BRCA1",
                "Canonical Name": "Breast cancer 1, early onset"
            },
            {
                "Referent": "p53",
                "Canonical Name": "Tumor protein p53"
            },
            {
                "Referent": "MyoD",
                "Canonical Name": "Myogenic differentiation 1"
            },
            {
                "Referent": "MYC",
                "Canonical Name": "MYC proto-oncogene, bHLH transcription factor"
            },
            {
                "Referent": "NF-\u03baB",
                "Canonical Name": "Nuclear factor kappa B"
            },
            {
                "Referent": "STAT3",
                "Canonical Name": "Signal transducer and activator of transcription 3"
            },
            {
                "Referent": "HIF1\u03b1",
                "Canonical Name": "Hypoxia-inducible factor 1, alpha subunit"
            },
            {
                "Referent": "FOXO1",
                "Canonical Name": "Forkhead box O1"
            },
            {
                "Referent": "FOXO3",
                "Canonical Name": "Forkhead box O3"
            },
            {
                "Referent": "FOXO4",
                "Canonical Name": "Forkhead box O4"
            },
            {
                "Referent": "FOXO6",
                "Canonical Name": "Forkhead box O6"
            },
            {
                "Referent": "FOXO7",
                "Canonical Name": "Forkhead box O7"
            },
            {
                "Referent": "KLF4",
                "Canonical Name": "Kruppel-like factor 4"
            },
            {
                "Referent": "KLF5",
                "Canonical Name": "Kruppel-like factor 5"
            },
            {
                "Referent": "KLF6",
                "Canonical Name": "Kruppel-like factor 6"
            },
            {
                "Referent": "KLF9",
                "Canonical Name": "Kruppel-like factor 9"
            },
            {
                "Referent": "KLF10",
                "Canonical Name": "Kruppel-like factor 10"
            },
            {
                "Referent": "KLF11",
                "Canonical Name": "Kruppel-like factor 11"
            },
            {
                "Referent": "KLF12",
                "Canonical Name": "Kruppel-like factor 12"
            },
            {
                "Referent": "KLF13",
                "Canonical Name": "Kruppel-like factor 13"
            },
            {
                "Referent": "KLF14",
                "Canonical Name": "Kruppel-like factor 14"
            },
            {
                "Referent": "KLF15",
                "Canonical Name": "Kruppel-like factor 15"
            },
            {
                "Referent": "KLF16",
                "Canonical Name": "Kruppel-like factor 16"
            },
            {
                "Referent": "KLF17",
                "Canonical Name": "Kruppel-like factor 17"
            },
            {
                "Referent": "KLF18",
                "Canonical Name": "Kruppel-like factor 18"
            },
            {
                "Referent": "KLF20",
                "Canonical Name": "Kruppel-like factor 20"
            },
            {
                "Referent": "KLF21",
                "Canonical Name": "Kruppel-like factor 21"
            },
            {
                "Referent": "KLF22",
                "Canonical Name": "Kruppel-like factor 22"
            },
            {
                "Referent": "KLF23",
                "Canonical Name": "Kruppel-like factor 23"
            },
            {
                "Referent": "KLF24",
                "Canonical Name": "Kruppel-like factor 24"
            },
            {
                "Referent": "KLF25",
                "Canonical Name": "Kruppel-like factor 25"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Forkhead box protein O6 (FOXO6)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Krueppel-like factor 5 (KLF5 aka BTEB2, CKLF, IKLF)",
                "Krueppel-like factor 6 (KLF6 aka BCD1, COPEB, CPBP, ST12)",
                "Krueppel-like factor 10 (KLF10 aka TIEG, TIEG1)",
                "Krueppel-like factor 11 (KLF11 aka FKLF, TIEG2)",
                "Krueppel-like factor 13 (KLF13 aka BTEB3, NSLP1)",
                "Krueppel-like factor 14 (KLF14 aka BTEB5)",
                "Krueppel-like factor 15 (KLF15 aka KKLF)",
                "Krueppel-like factor 16 (KLF16 aka BTEB4, NSLP2)",
                "Krueppel-like factor 17 (KLF17 aka ZNF393)"
            ],
            "mismatches": [
                "Myoblast determination protein 1 (MYOD1 aka BHLHC1, MYF3, MYOD)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Signal transducer and activator of transcription 3 (STAT3)",
                "Forkhead box protein O3 (FOXO3)",
                "Forkhead box protein O4 (FOXO4)",
                "Forkhead box protein O7 (FOXO7)",
                "Krueppel-like factor 9 (KLF9)",
                "Krueppel-like factor 12 (KLF12)",
                "Krueppel-like factor 18 (KLF18)",
                "Krueppel-like factor 20 (KLF20)",
                "Krueppel-like factor 21 (KLF21)",
                "Krueppel-like factor 22 (KLF22)",
                "Krueppel-like factor 23 (KLF23)",
                "Krueppel-like factor 24 (KLF24)",
                "Krueppel-like factor 25 (KLF25)"
            ],
            "true_referents": [
                "Breast cancer type 1 susceptibility protein (BRCA1 aka RNF53)",
                "Cellular tumor antigen p53 (TP53 aka P53)",
                "Estrogen receptor (ESR1 aka ESR, NR3A1)",
                "Estrogen receptor beta (ESR2 aka ESTRB, NR3A2)",
                "Forkhead box protein D4 (FOXD4 aka FKHL9, FOXD4A, FREAC5)",
                "Forkhead box protein D4-like 3 (FOXD4L3)",
                "Forkhead box protein D4-like 5 (FOXD4L5)",
                "Forkhead box protein D4-like 6 (FOXD4L6)",
                "Forkhead box protein I1 (FOXI1 aka FKHL10, FREAC6)",
                "Forkhead box protein I3 (FOXI3)",
                "Forkhead box protein O1 (FOXO1 aka FKHR, FOXO1A)",
                "Forkhead box protein O6 (FOXO6)",
                "Hypoxia-inducible factor 1-alpha (HIF1A aka BHLHE78, MOP1, PASD8)",
                "Hypoxia-inducible factor 1-alpha inhibitor (HIF1AN aka FIH1)",
                "Hypoxia-inducible factor 3-alpha (HIF3A aka BHLHE17, MOP7, PASD7)",
                "Krueppel-like factor 1 (KLF1 aka EKLF)",
                "Krueppel-like factor 10 (KLF10 aka TIEG, TIEG1)",
                "Krueppel-like factor 11 (KLF11 aka FKLF, TIEG2)",
                "Krueppel-like factor 13 (KLF13 aka BTEB3, NSLP1)",
                "Krueppel-like factor 14 (KLF14 aka BTEB5)",
                "Krueppel-like factor 15 (KLF15 aka KKLF)",
                "Krueppel-like factor 16 (KLF16 aka BTEB4, NSLP2)",
                "Krueppel-like factor 17 (KLF17 aka ZNF393)",
                "Krueppel-like factor 4 (KLF4 aka EZF, GKLF)",
                "Krueppel-like factor 5 (KLF5 aka BTEB2, CKLF, IKLF)",
                "Krueppel-like factor 6 (KLF6 aka BCD1, COPEB, CPBP, ST12)",
                "Krueppel-like factor 7 (KLF7 aka UKLF)",
                "Krueppel-like factor 8 (KLF8 aka BKLF3, ZNF741)",
                "Myc proto-oncogene protein (MYC aka BHLHE39)",
                "Myc-associated zinc finger protein (MAZ aka ZNF801)",
                "Myoblast determination protein 1 (MYOD1 aka BHLHC1, MYF3, MYOD)",
                "Myocyte-specific enhancer factor 2A (MEF2A aka MEF2)",
                "Myogenin (MYOG aka BHLHC3, MYF4)",
                "N-myc proto-oncogene protein (MYCN aka BHLHE37, NMYC)",
                "Nuclear factor NF-kappa-B p100 subunit (NFKB2 aka LYT10)",
                "Nuclear factor NF-kappa-B p105 subunit (NFKB1)",
                "Signal transducer and activator of transcription 1-alpha/beta (STAT1)",
                "Signal transducer and activator of transcription 4 (STAT4)",
                "Signal transducer and activator of transcription 5A (STAT5A aka STAT5)",
                "TP53-binding protein 1 (TP53BP1)",
                "Transcription factor p65 (RELA aka NFKB3)"
            ],
            "TP": 16,
            "FP": 15,
            "FN": 0
        }
    }
]