[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (hTERT)",
            "TERC (hTERC)",
            "DKC1",
            "TINF2",
            "WRAP53",
            "NOP10",
            "NHP2",
            "RTEL1",
            "ATR",
            "ATM",
            "TRF1",
            "TRF2",
            "POT1",
            "TPP1",
            "PINX1",
            "PARN",
            "TERF1",
            "TERF2",
            "SMG6",
            "CTC1",
            "SASP3",
            "SASP1",
            "SASP2",
            "NBS1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (hTERT)",
                "TERC (hTERC)",
                "DKC1",
                "TINF2",
                "WRAP53",
                "NOP10",
                "NHP2",
                "RTEL1",
                "ATR",
                "ATM",
                "TRF1",
                "TRF2",
                "POT1",
                "TPP1",
                "PINX1",
                "PARN",
                "TERF1",
                "TERF2",
                "SMG6",
                "CTC1",
                "SASP3",
                "SASP1",
                "SASP2",
                "NBS1"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM",
                "ATR",
                "CTC1",
                "DKC1",
                "NBS1",
                "NHP2",
                "NOP10",
                "PARN",
                "PINX1",
                "POT1",
                "RTEL1",
                "SASP1",
                "SASP2",
                "SASP3",
                "SMG6",
                "TERC (hTERC)",
                "TERF1",
                "TERF2",
                "TERT (hTERT)",
                "TINF2",
                "TPP1",
                "TRF1",
                "TRF2",
                "WRAP53"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (telomerase reverse transcriptase)",
            "TERC (telomerase RNA component)",
            "DKC1 (dyskerin)",
            "NOP10 (nucleolar protein 10)",
            "NHP2 (nucleolar protein 2)",
            "TCAB1 (telomerase Cajal body protein 1)",
            "TINF2 (TERC-interacting nuclear factor 2)",
            "WRAP53 (WD repeat-containing protein 53)",
            "POT1 (protection of telomeres 1)",
            "TPP1 (TIN2-interacting protein 1)",
            "TIN2 (TRF1-interacting nuclear factor 2)",
            "TRF1 (telomeric repeat-binding factor 1)",
            "TRF2 (telomeric repeat-binding factor 2)",
            "RTEL1 (regulator of telomere elongation helicase 1)",
            "ATRX (alpha thalassemia/mental retardation syndrome X-linked)",
            "DAXX (death-domain associated protein)",
            "PARN (poly(A) specific ribonuclease)",
            "FEN1 (flap endonuclease 1)",
            "BLM (Bloom syndrome protein)",
            "WRN (Werner syndrome protein)",
            "SIRT6 (Sirtuin 6)",
            "HMGA2 (high mobility group AT-hook 2)",
            "OBFC1 (OBF-1-like protein 1)",
            "ACD (adducin)",
            "CTC1 (CTC1 regulator of telomere elongation helicase 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (telomerase reverse transcriptase)",
                "TERC (telomerase RNA component)",
                "DKC1 (dyskerin)",
                "NOP10 (nucleolar protein 10)",
                "NHP2 (nucleolar protein 2)",
                "TCAB1 (telomerase Cajal body protein 1)",
                "TINF2 (TERC-interacting nuclear factor 2)",
                "WRAP53 (WD repeat-containing protein 53)",
                "POT1 (protection of telomeres 1)",
                "TPP1 (TIN2-interacting protein 1)",
                "TIN2 (TRF1-interacting nuclear factor 2)",
                "TRF1 (telomeric repeat-binding factor 1)",
                "TRF2 (telomeric repeat-binding factor 2)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "ATRX (alpha thalassemia/mental retardation syndrome X-linked)",
                "DAXX (death-domain associated protein)",
                "PARN (poly(A) specific ribonuclease)",
                "FEN1 (flap endonuclease 1)",
                "BLM (Bloom syndrome protein)",
                "WRN (Werner syndrome protein)",
                "SIRT6 (Sirtuin 6)",
                "HMGA2 (high mobility group AT-hook 2)",
                "OBFC1 (OBF-1-like protein 1)",
                "ACD (adducin)"
            ],
            "mismatches": [
                "CTC1 (CTC1 regulator of telomere elongation helicase 1)"
            ],
            "true_referents": [
                "ACD (adducin)",
                "ATRX (alpha thalassemia/mental retardation syndrome X-linked)",
                "BLM (Bloom syndrome protein)",
                "DAXX (death-domain associated protein)",
                "DKC1 (dyskerin)",
                "FEN1 (flap endonuclease 1)",
                "HMGA2 (high mobility group AT-hook 2)",
                "NHP2 (nucleolar protein 2)",
                "NOP10 (nucleolar protein 10)",
                "OBFC1 (OBF-1-like protein 1)",
                "PARN (poly(A) specific ribonuclease)",
                "POT1 (protection of telomeres 1)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "SIRT6 (Sirtuin 6)",
                "TCAB1 (telomerase Cajal body protein 1)",
                "TERC (telomerase RNA component)",
                "TERT (telomerase reverse transcriptase)",
                "TIN2 (TRF1-interacting nuclear factor 2)",
                "TINF2 (TERC-interacting nuclear factor 2)",
                "TPP1 (TIN2-interacting protein 1)",
                "TRF1 (telomeric repeat-binding factor 1)",
                "TRF2 (telomeric repeat-binding factor 2)",
                "WRAP53 (WD repeat-containing protein 53)",
                "WRN (Werner syndrome protein)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Telomerase RNA Component (TERC)",
            "Telomere Repeat Binding Factor 1 (TRF1)",
            "Telomere Repeat Binding Factor 2 (TRF2)",
            "Protection of Telomeres 1 (POT1)",
            "Telomere Repeat-Containing RNA (TERRA)",
            "Telomeric Repeat-Containing RNA Interacting Protein 1 (TERF2IP)",
            "Telomerase-Associated Protein 1 (TEP1)",
            "Telomere Dyskeratosis 1 (DKC1)",
            "Telomere Maintenance 1 (TEN1)",
            "Telomere Maintenance 2 (TEN2)",
            "Telomere Maintenance 3 (TEN3)",
            "Telomere Maintenance 4 (TEN4)",
            "Telomere Maintenance 5 (TEN5)",
            "Telomere Maintenance 6 (TEN6)",
            "Telomere Maintenance 7 (TEN7)",
            "Telomere Maintenance 8 (TEN8)",
            "Telomere Maintenance 9 (TEN9)",
            "Telomere Maintenance 10 (TEN10)",
            "Telomere Maintenance 11 (TEN11)",
            "Telomere Maintenance 12 (TEN12)",
            "Telomere Maintenance 13 (TEN13)",
            "Telomere Maintenance 14 (TEN14)",
            "Telomere Maintenance 15 (TEN15)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase RNA Component (TERC)",
                "Telomere Repeat Binding Factor 1 (TRF1)",
                "Telomere Repeat Binding Factor 2 (TRF2)",
                "Protection of Telomeres 1 (POT1)",
                "Telomere Repeat-Containing RNA (TERRA)",
                "Telomeric Repeat-Containing RNA Interacting Protein 1 (TERF2IP)",
                "Telomerase-Associated Protein 1 (TEP1)",
                "Telomere Dyskeratosis 1 (DKC1)",
                "Telomere Maintenance 1 (TEN1)",
                "Telomere Maintenance 2 (TEN2)",
                "Telomere Maintenance 3 (TEN3)",
                "Telomere Maintenance 4 (TEN4)",
                "Telomere Maintenance 5 (TEN5)",
                "Telomere Maintenance 6 (TEN6)",
                "Telomere Maintenance 7 (TEN7)",
                "Telomere Maintenance 8 (TEN8)",
                "Telomere Maintenance 9 (TEN9)",
                "Telomere Maintenance 10 (TEN10)",
                "Telomere Maintenance 11 (TEN11)",
                "Telomere Maintenance 12 (TEN12)",
                "Telomere Maintenance 13 (TEN13)",
                "Telomere Maintenance 14 (TEN14)",
                "Telomere Maintenance 15 (TEN15)"
            ],
            "mismatches": [],
            "true_referents": [
                "Protection of Telomeres 1 (POT1)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase-Associated Protein 1 (TEP1)",
                "Telomere Dyskeratosis 1 (DKC1)",
                "Telomere Maintenance 1 (TEN1)",
                "Telomere Maintenance 10 (TEN10)",
                "Telomere Maintenance 11 (TEN11)",
                "Telomere Maintenance 12 (TEN12)",
                "Telomere Maintenance 13 (TEN13)",
                "Telomere Maintenance 14 (TEN14)",
                "Telomere Maintenance 15 (TEN15)",
                "Telomere Maintenance 2 (TEN2)",
                "Telomere Maintenance 3 (TEN3)",
                "Telomere Maintenance 4 (TEN4)",
                "Telomere Maintenance 5 (TEN5)",
                "Telomere Maintenance 6 (TEN6)",
                "Telomere Maintenance 7 (TEN7)",
                "Telomere Maintenance 8 (TEN8)",
                "Telomere Maintenance 9 (TEN9)",
                "Telomere Repeat Binding Factor 1 (TRF1)",
                "Telomere Repeat Binding Factor 2 (TRF2)",
                "Telomere Repeat-Containing RNA (TERRA)",
                "Telomeric Repeat-Containing RNA Interacting Protein 1 (TERF2IP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Telomerase RNA Component (TERC)",
            "Dyskerin (DKC1)",
            "Telomerase-Associated Protein 1 (TEP1)",
            "Pontin (Pontin/REPT)",
            "Reptin (Pontin/REPT)",
            "TCAB1 (Telomerase Cajal Body Protein 1)",
            "PINX1 (PIM/Telomerase-Associated Protein 1)",
            "Shelterin Complex Subunit POT1 (POT1)",
            "Shelterin Complex Subunit TPP1 (TPP1)",
            "Shelterin Complex Subunit RAP1 (RAP1)",
            "Shelterin Complex Subunit TIN2 (TIN2)",
            "Shelterin Complex Subunit TRF1 (TRF1)",
            "Shelterin Complex Subunit TRF2 (TRF2)",
            "ATM (Ataxia Telangiectasia Mutated)",
            "ATR (Ataxia Telangiectasia and Rad3-related)",
            "Rad51 (Recombination Repair Gene RAD51)",
            "BRCA1 (Breast Cancer 1, Early Onset)",
            "BRCA2 (Breast Cancer 2, Early Onset)",
            "PARP1 (Poly (ADP-ribose) Polymerase 1)",
            "WRN (Werner Syndrome Protein)",
            "BLM (Bloom Syndrome Protein)",
            "RPA1 (Replication Protein A1)",
            "EST1 (Essential Telomere Maintenance 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase RNA Component (TERC)",
                "Dyskerin (DKC1)",
                "Telomerase-Associated Protein 1 (TEP1)",
                "Pontin (Pontin/REPT)",
                "Reptin (Pontin/REPT)",
                "TCAB1 (Telomerase Cajal Body Protein 1)",
                "PINX1 (PIM/Telomerase-Associated Protein 1)",
                "Shelterin Complex Subunit POT1 (POT1)",
                "Shelterin Complex Subunit TPP1 (TPP1)",
                "Shelterin Complex Subunit RAP1 (RAP1)",
                "Shelterin Complex Subunit TIN2 (TIN2)",
                "Shelterin Complex Subunit TRF1 (TRF1)",
                "Shelterin Complex Subunit TRF2 (TRF2)",
                "ATM (Ataxia Telangiectasia Mutated)",
                "ATR (Ataxia Telangiectasia and Rad3-related)",
                "Rad51 (Recombination Repair Gene RAD51)",
                "BRCA1 (Breast Cancer 1, Early Onset)",
                "BRCA2 (Breast Cancer 2, Early Onset)",
                "PARP1 (Poly (ADP-ribose) Polymerase 1)",
                "WRN (Werner Syndrome Protein)",
                "BLM (Bloom Syndrome Protein)",
                "RPA1 (Replication Protein A1)",
                "EST1 (Essential Telomere Maintenance 1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM (Ataxia Telangiectasia Mutated)",
                "ATR (Ataxia Telangiectasia and Rad3-related)",
                "BLM (Bloom Syndrome Protein)",
                "BRCA1 (Breast Cancer 1, Early Onset)",
                "BRCA2 (Breast Cancer 2, Early Onset)",
                "Dyskerin (DKC1)",
                "EST1 (Essential Telomere Maintenance 1)",
                "PARP1 (Poly (ADP-ribose) Polymerase 1)",
                "PINX1 (PIM/Telomerase-Associated Protein 1)",
                "Pontin (Pontin/REPT)",
                "RPA1 (Replication Protein A1)",
                "Rad51 (Recombination Repair Gene RAD51)",
                "Reptin (Pontin/REPT)",
                "Shelterin Complex Subunit POT1 (POT1)",
                "Shelterin Complex Subunit RAP1 (RAP1)",
                "Shelterin Complex Subunit TIN2 (TIN2)",
                "Shelterin Complex Subunit TPP1 (TPP1)",
                "Shelterin Complex Subunit TRF1 (TRF1)",
                "Shelterin Complex Subunit TRF2 (TRF2)",
                "TCAB1 (Telomerase Cajal Body Protein 1)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase-Associated Protein 1 (TEP1)",
                "WRN (Werner Syndrome Protein)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Telomerase RNA Component (TERC)",
            "Protection of Telomeres 1 (POT1)",
            "Telomeric Repeat Binding Factor 1 (TERF1)",
            "Telomeric Repeat Binding Factor 2 (TERF2)",
            "Repressor/Activator Protein 1 (RAP1)",
            "TIN2 Interacting Protein (TPP1)",
            "TRF1-Interacting Nuclear Factor 2 (TINF2)",
            "Nuclear Assembly Factor 1 (NAF1)",
            "Dyskerin (DKC1)",
            "NOP10 Ribonucleoprotein (NOP10)",
            "NHP2 Ribonucleoprotein (NHP2)",
            "GAR1 Ribonucleoprotein (GAR1)",
            "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
            "Tankyrase 1 (TNKS1)",
            "Tankyrase 2 (TNKS2)",
            "Apollo (APOLLO)",
            "RecQ Like Helicase 4 (RECQL4)",
            "Werner Syndrome RecQ Like Helicase (WRN)",
            "Bloom Syndrome RecQ Like Helicase (BLM)",
            "SMG1 Nonsense Mediated mRNA Decay Associated PI3K Related Kinase (SMG1)",
            "Polymerase (DNA Directed), Alpha 1 (POLA1)",
            "Polymerase (DNA Directed), Delta 1 (POLD1)",
            "Polymerase (DNA Directed), Epsilon 1 (POLE1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase RNA Component (TERC)",
                "Protection of Telomeres 1 (POT1)",
                "Telomeric Repeat Binding Factor 1 (TERF1)",
                "Telomeric Repeat Binding Factor 2 (TERF2)",
                "Repressor/Activator Protein 1 (RAP1)",
                "TIN2 Interacting Protein (TPP1)",
                "TRF1-Interacting Nuclear Factor 2 (TINF2)",
                "Nuclear Assembly Factor 1 (NAF1)",
                "Dyskerin (DKC1)",
                "NOP10 Ribonucleoprotein (NOP10)",
                "NHP2 Ribonucleoprotein (NHP2)",
                "GAR1 Ribonucleoprotein (GAR1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Apollo (APOLLO)",
                "RecQ Like Helicase 4 (RECQL4)",
                "Werner Syndrome RecQ Like Helicase (WRN)",
                "Bloom Syndrome RecQ Like Helicase (BLM)",
                "SMG1 Nonsense Mediated mRNA Decay Associated PI3K Related Kinase (SMG1)",
                "Polymerase (DNA Directed), Alpha 1 (POLA1)",
                "Polymerase (DNA Directed), Delta 1 (POLD1)",
                "Polymerase (DNA Directed), Epsilon 1 (POLE1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Apollo (APOLLO)",
                "Bloom Syndrome RecQ Like Helicase (BLM)",
                "Dyskerin (DKC1)",
                "GAR1 Ribonucleoprotein (GAR1)",
                "NHP2 Ribonucleoprotein (NHP2)",
                "NOP10 Ribonucleoprotein (NOP10)",
                "Nuclear Assembly Factor 1 (NAF1)",
                "Polymerase (DNA Directed), Alpha 1 (POLA1)",
                "Polymerase (DNA Directed), Delta 1 (POLD1)",
                "Polymerase (DNA Directed), Epsilon 1 (POLE1)",
                "Protection of Telomeres 1 (POT1)",
                "RecQ Like Helicase 4 (RECQL4)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Repressor/Activator Protein 1 (RAP1)",
                "SMG1 Nonsense Mediated mRNA Decay Associated PI3K Related Kinase (SMG1)",
                "TIN2 Interacting Protein (TPP1)",
                "TRF1-Interacting Nuclear Factor 2 (TINF2)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomeric Repeat Binding Factor 1 (TERF1)",
                "Telomeric Repeat Binding Factor 2 (TERF2)",
                "Werner Syndrome RecQ Like Helicase (WRN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (telomerase reverse transcriptase)",
            "TERC (telomerase RNA component)",
            "TP53 (tumor protein p53)",
            "ATM (ataxia telangiectasia mutated)",
            "ATR (ataxia telangiectasia and Rad3 related)",
            "WRN (Werner syndrome ATP-dependent helicase)",
            "BLM (Bloom syndrome protein)",
            "POT1 (protection of telomeres 1)",
            "TRF1 (telomeric repeat binding factor 1)",
            "TRF2 (telomeric repeat binding factor 2)",
            "TIN2 (TRF1-interacting nuclear protein 2)",
            "TINF2 (telomerase-interacting factor 2)",
            "RTEL1 (regulator of telomere elongation helicase 1)",
            "NBN (Nibrin)",
            "FANCJ (Fanconi anemia complementation group J)",
            "SIRT6 (sirtuin 6)",
            "SETX (senataxin)",
            "RPA1 (replication protein A1)",
            "MRE11 (meiotic recombination 11 homolog)",
            "H2AX (H2A histone family member X)",
            "LIG4 (DNA ligase 4)",
            "CST (CTC1-STN1-TEN1 complex)",
            "XPA (Xeroderma pigmentosum group A)",
            "XPD (Xeroderma pigmentosum group D)",
            "XPF (Xeroderma pigmentosum group F)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (telomerase reverse transcriptase)",
                "TERC (telomerase RNA component)",
                "TP53 (tumor protein p53)",
                "ATM (ataxia telangiectasia mutated)",
                "ATR (ataxia telangiectasia and Rad3 related)",
                "WRN (Werner syndrome ATP-dependent helicase)",
                "BLM (Bloom syndrome protein)",
                "POT1 (protection of telomeres 1)",
                "TRF1 (telomeric repeat binding factor 1)",
                "TRF2 (telomeric repeat binding factor 2)",
                "TIN2 (TRF1-interacting nuclear protein 2)",
                "TINF2 (telomerase-interacting factor 2)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "NBN (Nibrin)",
                "FANCJ (Fanconi anemia complementation group J)",
                "SIRT6 (sirtuin 6)",
                "SETX (senataxin)",
                "RPA1 (replication protein A1)",
                "MRE11 (meiotic recombination 11 homolog)",
                "H2AX (H2A histone family member X)",
                "LIG4 (DNA ligase 4)",
                "CST (CTC1-STN1-TEN1 complex)",
                "XPA (Xeroderma pigmentosum group A)",
                "XPD (Xeroderma pigmentosum group D)"
            ],
            "mismatches": [
                "XPF (Xeroderma pigmentosum group F)"
            ],
            "true_referents": [
                "ATM (ataxia telangiectasia mutated)",
                "ATR (ataxia telangiectasia and Rad3 related)",
                "BLM (Bloom syndrome protein)",
                "CST (CTC1-STN1-TEN1 complex)",
                "FANCJ (Fanconi anemia complementation group J)",
                "H2AX (H2A histone family member X)",
                "LIG4 (DNA ligase 4)",
                "MRE11 (meiotic recombination 11 homolog)",
                "NBN (Nibrin)",
                "POT1 (protection of telomeres 1)",
                "RPA1 (replication protein A1)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "SETX (senataxin)",
                "SIRT6 (sirtuin 6)",
                "TERC (telomerase RNA component)",
                "TERT (telomerase reverse transcriptase)",
                "TIN2 (TRF1-interacting nuclear protein 2)",
                "TINF2 (telomerase-interacting factor 2)",
                "TP53 (tumor protein p53)",
                "TRF1 (telomeric repeat binding factor 1)",
                "TRF2 (telomeric repeat binding factor 2)",
                "WRN (Werner syndrome ATP-dependent helicase)",
                "XPA (Xeroderma pigmentosum group A)",
                "XPD (Xeroderma pigmentosum group D)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase reverse transcriptase (TERT)",
            "Telomerase RNA component (TERC)",
            "Adrenocortical dysplasia homolog (ACD)",
            "Protection of telomeres 1 (POT1)",
            "Telomeric repeat binding factor 1 (TERF1)",
            "Telomeric repeat binding factor 2 (TERF2)",
            "Telomeric repeat binding factor 2-interacting protein 1 (TERF2IP)",
            "Regulator of telomere elongation helicase 1 (RTEL1)",
            "Telomerase Cajal body protein 1 (TCAB1)",
            "Dyskerin pseudouridine synthase 1 (DKC1)",
            "Nola1 (NOLA1)",
            "Nola2 (NOLA2)",
            "Nola3 (NOLA3)",
            "Nucleostemin (GNL3)",
            "Tankyrase 1 (TNKS1)",
            "Tankyrase 2 (TNKS2)",
            "Tin2 (TINF2)",
            "TPP1 (TPP1)",
            "CTC1 (CTC1)",
            "STN1 (STN1)",
            "TEN1 (TEN1)",
            "Zinc finger protein 676 (ZNF676)",
            "Zinc finger protein 687 (ZNF687)",
            "Zinc finger protein 827 (ZNF827)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase RNA component (TERC)",
                "Adrenocortical dysplasia homolog (ACD)",
                "Protection of telomeres 1 (POT1)",
                "Telomeric repeat binding factor 1 (TERF1)",
                "Telomeric repeat binding factor 2 (TERF2)",
                "Telomeric repeat binding factor 2-interacting protein 1 (TERF2IP)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Telomerase Cajal body protein 1 (TCAB1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "Nola1 (NOLA1)",
                "Nola2 (NOLA2)",
                "Nola3 (NOLA3)",
                "Nucleostemin (GNL3)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Tin2 (TINF2)",
                "TPP1 (TPP1)",
                "CTC1 (CTC1)",
                "STN1 (STN1)",
                "TEN1 (TEN1)",
                "Zinc finger protein 676 (ZNF676)",
                "Zinc finger protein 687 (ZNF687)",
                "Zinc finger protein 827 (ZNF827)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocortical dysplasia homolog (ACD)",
                "CTC1 (CTC1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "Nola1 (NOLA1)",
                "Nola2 (NOLA2)",
                "Nola3 (NOLA3)",
                "Nucleostemin (GNL3)",
                "Protection of telomeres 1 (POT1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "STN1 (STN1)",
                "TEN1 (TEN1)",
                "TPP1 (TPP1)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Telomerase Cajal body protein 1 (TCAB1)",
                "Telomerase RNA component (TERC)",
                "Telomerase reverse transcriptase (TERT)",
                "Telomeric repeat binding factor 1 (TERF1)",
                "Telomeric repeat binding factor 2 (TERF2)",
                "Telomeric repeat binding factor 2-interacting protein 1 (TERF2IP)",
                "Tin2 (TINF2)",
                "Zinc finger protein 676 (ZNF676)",
                "Zinc finger protein 687 (ZNF687)",
                "Zinc finger protein 827 (ZNF827)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (Telomerase Reverse Transcriptase)",
            "TERC (Telomerase RNA Component)",
            "TPP1 (Tripeptidyl Peptidase 1)",
            "POT1 (Protection of Telomeres 1)",
            "RTEL1 (Regulator of Telomere Elongation)",
            "TERF1 (Telomeric Repeat Binding Factor 1)",
            "TERF2 (Telomeric Repeat Binding Factor 2)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
            "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (Telomerase Reverse Transcriptase)",
                "TERC (Telomerase RNA Component)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "POT1 (Protection of Telomeres 1)",
                "RTEL1 (Regulator of Telomere Elongation)",
                "TERF1 (Telomeric Repeat Binding Factor 1)",
                "TERF2 (Telomeric Repeat Binding Factor 2)",
                "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)"
            ],
            "mismatches": [],
            "true_referents": [
                "POT1 (Protection of Telomeres 1)",
                "RTEL1 (Regulator of Telomere Elongation)",
                "TERC (Telomerase RNA Component)",
                "TERF1 (Telomeric Repeat Binding Factor 1)",
                "TERF2 (Telomeric Repeat Binding Factor 2)",
                "TERF2IP (Telomeric Repeat Factor 2 Interacting Protein)",
                "TERT (Telomerase Reverse Transcriptase)",
                "TPP1 (Tripeptidyl Peptidase 1)"
            ],
            "TP": 8,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "telomerase reverse transcriptase (TERT)",
            "telomerase RNA component (TERC)",
            "protection of telomeres 1 (POT1)",
            "telomeric repeat-binding factor 1 (TRF1)",
            "telomeric repeat-binding factor 2 (TRF2)",
            "TIN2 shelterin component (TINF2)",
            "adrenocorticotropic hormone binding protein (ACD)",
            "regulator of telomere elongation helicase 1 (RTEL1)",
            "Werner syndrome helicase (WRN)",
            "Bloom syndrome helicase (BLM)",
            "dyskerin pseudouridine synthase 1 (DKC1)",
            "NOP10 ribonucleoprotein component (NOP10)",
            "NHP2 ribonucleoprotein component (NHP2)",
            "CTC1 CST complex component (CTC1)",
            "STN1 CST complex component (STN1)",
            "TEN1 CST complex component (TEN1)",
            "poly(A)-specific ribonuclease (PARN)",
            "shelterin complex component 3 (TERF3)",
            "mammalian telomerase associated protein (MAST)",
            "telomere maintenance 1 (TM1)",
            "telomere maintenance 2 (TM2)",
            "shelterin component RAP1 (RAP1)",
            "shelterin component TRF2-interacting factor (TRF2IF)",
            "shelterin component POT1-interacting protein (PIP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "telomerase reverse transcriptase (TERT)",
                "telomerase RNA component (TERC)",
                "protection of telomeres 1 (POT1)",
                "telomeric repeat-binding factor 1 (TRF1)",
                "telomeric repeat-binding factor 2 (TRF2)",
                "TIN2 shelterin component (TINF2)",
                "adrenocorticotropic hormone binding protein (ACD)",
                "regulator of telomere elongation helicase 1 (RTEL1)",
                "Werner syndrome helicase (WRN)",
                "Bloom syndrome helicase (BLM)",
                "dyskerin pseudouridine synthase 1 (DKC1)",
                "NOP10 ribonucleoprotein component (NOP10)",
                "NHP2 ribonucleoprotein component (NHP2)",
                "CTC1 CST complex component (CTC1)",
                "STN1 CST complex component (STN1)",
                "TEN1 CST complex component (TEN1)",
                "poly(A)-specific ribonuclease (PARN)",
                "shelterin complex component 3 (TERF3)",
                "mammalian telomerase associated protein (MAST)",
                "telomere maintenance 1 (TM1)",
                "telomere maintenance 2 (TM2)",
                "shelterin component RAP1 (RAP1)",
                "shelterin component TRF2-interacting factor (TRF2IF)",
                "shelterin component POT1-interacting protein (PIP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Bloom syndrome helicase (BLM)",
                "CTC1 CST complex component (CTC1)",
                "NHP2 ribonucleoprotein component (NHP2)",
                "NOP10 ribonucleoprotein component (NOP10)",
                "STN1 CST complex component (STN1)",
                "TEN1 CST complex component (TEN1)",
                "TIN2 shelterin component (TINF2)",
                "Werner syndrome helicase (WRN)",
                "adrenocorticotropic hormone binding protein (ACD)",
                "dyskerin pseudouridine synthase 1 (DKC1)",
                "mammalian telomerase associated protein (MAST)",
                "poly(A)-specific ribonuclease (PARN)",
                "protection of telomeres 1 (POT1)",
                "regulator of telomere elongation helicase 1 (RTEL1)",
                "shelterin complex component 3 (TERF3)",
                "shelterin component POT1-interacting protein (PIP)",
                "shelterin component RAP1 (RAP1)",
                "shelterin component TRF2-interacting factor (TRF2IF)",
                "telomerase RNA component (TERC)",
                "telomerase reverse transcriptase (TERT)",
                "telomere maintenance 1 (TM1)",
                "telomere maintenance 2 (TM2)",
                "telomeric repeat-binding factor 1 (TRF1)",
                "telomeric repeat-binding factor 2 (TRF2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase reverse transcriptase (TERT)",
            "Telomerase RNA component (TERC)",
            "Protection of telomeres 1 (POT1)",
            "Telomeric repeat-binding factor 1 (TRF1)",
            "Telomeric repeat-binding factor 2 (TRF2)",
            "TRF1-interacting nuclear factor 2 (TINF2)",
            "Adrenocortical dysplasia protein homolog (ACD)",
            "TERF1-interacting nuclear factor 1 (PINX1)",
            "Regulator of telomere elongation helicase 1 (RTEL1)",
            "Telomere-associated protein RIF1 (RIF1)",
            "Telomere length regulation protein TEL2 homolog (TELO2)",
            "DNA repair protein RAD50 (RAD50)",
            "ATM serine/threonine kinase (ATM)",
            "Werner syndrome RecQ like helicase (WRN)",
            "Bloom syndrome RecQ like helicase (BLM)",
            "Poly(ADP-ribose) polymerase 1 (PARP1)",
            "Telomere capping protein 1 (TEP1)",
            "Tankyrase 1 (TNKS)",
            "Tankyrase 2 (TNKS2)",
            "Dyskeratosis congenita 1 (DKC1)",
            "Nuclear assembly factor 1 ribonucleoprotein (NAF1)",
            "NHP2 ribonucleoprotein (NHP2)",
            "NOP10 ribonucleoprotein (NOP10)",
            "Telomere maintenance 2 (TELO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase RNA component (TERC)",
                "Protection of telomeres 1 (POT1)",
                "Telomeric repeat-binding factor 1 (TRF1)",
                "Telomeric repeat-binding factor 2 (TRF2)",
                "TRF1-interacting nuclear factor 2 (TINF2)",
                "Adrenocortical dysplasia protein homolog (ACD)",
                "TERF1-interacting nuclear factor 1 (PINX1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Telomere-associated protein RIF1 (RIF1)",
                "Telomere length regulation protein TEL2 homolog (TELO2)",
                "DNA repair protein RAD50 (RAD50)",
                "ATM serine/threonine kinase (ATM)",
                "Werner syndrome RecQ like helicase (WRN)",
                "Bloom syndrome RecQ like helicase (BLM)",
                "Poly(ADP-ribose) polymerase 1 (PARP1)",
                "Telomere capping protein 1 (TEP1)",
                "Tankyrase 1 (TNKS)",
                "Tankyrase 2 (TNKS2)",
                "Dyskeratosis congenita 1 (DKC1)",
                "Nuclear assembly factor 1 ribonucleoprotein (NAF1)",
                "NHP2 ribonucleoprotein (NHP2)",
                "NOP10 ribonucleoprotein (NOP10)",
                "Telomere maintenance 2 (TELO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM serine/threonine kinase (ATM)",
                "Adrenocortical dysplasia protein homolog (ACD)",
                "Bloom syndrome RecQ like helicase (BLM)",
                "DNA repair protein RAD50 (RAD50)",
                "Dyskeratosis congenita 1 (DKC1)",
                "NHP2 ribonucleoprotein (NHP2)",
                "NOP10 ribonucleoprotein (NOP10)",
                "Nuclear assembly factor 1 ribonucleoprotein (NAF1)",
                "Poly(ADP-ribose) polymerase 1 (PARP1)",
                "Protection of telomeres 1 (POT1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "TERF1-interacting nuclear factor 1 (PINX1)",
                "TRF1-interacting nuclear factor 2 (TINF2)",
                "Tankyrase 1 (TNKS)",
                "Tankyrase 2 (TNKS2)",
                "Telomerase RNA component (TERC)",
                "Telomerase reverse transcriptase (TERT)",
                "Telomere capping protein 1 (TEP1)",
                "Telomere length regulation protein TEL2 homolog (TELO2)",
                "Telomere maintenance 2 (TELO2)",
                "Telomere-associated protein RIF1 (RIF1)",
                "Telomeric repeat-binding factor 1 (TRF1)",
                "Telomeric repeat-binding factor 2 (TRF2)",
                "Werner syndrome RecQ like helicase (WRN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Telomerase RNA Component (TERC)",
            "Dyskerin Pseudouridine Synthase 1 (DKC1)",
            "NHP2 Ribonucleoprotein (NHP2)",
            "NOP10 Ribonucleoprotein (NOP10)",
            "Telomerase Cajal Body Protein 1 (TCAB1)",
            "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
            "CST Complex Subunit Alpha (CTC1)",
            "CST Complex Subunit Beta (STN1)",
            "CST Complex Subunit Gamma (TEN1)",
            "Telomeric Repeat Binding Factor 1 (TERF1)",
            "Telomeric Repeat Binding Factor 2 (TERF2)",
            "TERF1 Interacting Nuclear Factor 2 (TINF2)",
            "Protection of Telomeres 1 (POT1)",
            "TPP1 (ACD)",
            "Repressor/Activator Protein 1 (RAP1)",
            "Telomere Length Regulation Protein TEL2 (TELO2)",
            "KU Autoantigen 70kDa (XRCC6)",
            "KU Autoantigen 80kDa (XRCC5)",
            "DNA-dependent Protein Kinase Catalytic Subunit (PRKDC)",
            "Poly(ADP-ribose) Polymerase 1 (PARP1)",
            "Flap Endonuclease 1 (FEN1)",
            "DNA Replication Helicase/Nuclease 2 (DNA2)",
            "Werner Syndrome RecQ Like Helicase (WRN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase RNA Component (TERC)",
                "Dyskerin Pseudouridine Synthase 1 (DKC1)",
                "NHP2 Ribonucleoprotein (NHP2)",
                "NOP10 Ribonucleoprotein (NOP10)",
                "Telomerase Cajal Body Protein 1 (TCAB1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "CST Complex Subunit Alpha (CTC1)",
                "CST Complex Subunit Beta (STN1)",
                "CST Complex Subunit Gamma (TEN1)",
                "Telomeric Repeat Binding Factor 1 (TERF1)",
                "Telomeric Repeat Binding Factor 2 (TERF2)",
                "TERF1 Interacting Nuclear Factor 2 (TINF2)",
                "Protection of Telomeres 1 (POT1)",
                "TPP1 (ACD)",
                "Repressor/Activator Protein 1 (RAP1)",
                "Telomere Length Regulation Protein TEL2 (TELO2)",
                "KU Autoantigen 70kDa (XRCC6)",
                "KU Autoantigen 80kDa (XRCC5)",
                "DNA-dependent Protein Kinase Catalytic Subunit (PRKDC)",
                "Poly(ADP-ribose) Polymerase 1 (PARP1)",
                "Flap Endonuclease 1 (FEN1)",
                "DNA Replication Helicase/Nuclease 2 (DNA2)",
                "Werner Syndrome RecQ Like Helicase (WRN)"
            ],
            "mismatches": [],
            "true_referents": [
                "CST Complex Subunit Alpha (CTC1)",
                "CST Complex Subunit Beta (STN1)",
                "CST Complex Subunit Gamma (TEN1)",
                "DNA Replication Helicase/Nuclease 2 (DNA2)",
                "DNA-dependent Protein Kinase Catalytic Subunit (PRKDC)",
                "Dyskerin Pseudouridine Synthase 1 (DKC1)",
                "Flap Endonuclease 1 (FEN1)",
                "KU Autoantigen 70kDa (XRCC6)",
                "KU Autoantigen 80kDa (XRCC5)",
                "NHP2 Ribonucleoprotein (NHP2)",
                "NOP10 Ribonucleoprotein (NOP10)",
                "Poly(ADP-ribose) Polymerase 1 (PARP1)",
                "Protection of Telomeres 1 (POT1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Repressor/Activator Protein 1 (RAP1)",
                "TERF1 Interacting Nuclear Factor 2 (TINF2)",
                "TPP1 (ACD)",
                "Telomerase Cajal Body Protein 1 (TCAB1)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomere Length Regulation Protein TEL2 (TELO2)",
                "Telomeric Repeat Binding Factor 1 (TERF1)",
                "Telomeric Repeat Binding Factor 2 (TERF2)",
                "Werner Syndrome RecQ Like Helicase (WRN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase reverse transcriptase (TERT)",
            "Telomerase RNA component (TERC)",
            "Protection of telomeres 1 (POT1)",
            "Repressor activator protein 1 (RAP1)",
            "TRF1-interacting nuclear protein 2 (TIN2)",
            "TRF1-interacting nuclear factor 2 (TINF2)",
            "Adrenocortical dysplasia protein homolog (ACD)",
            "Regulator of telomere elongation helicase 1 (RTEL1)",
            "CST telomere replication complex component 1 (CTC1)",
            "Telomeric repeat binding factor 1 (TERF1)",
            "Telomeric repeat binding factor 2 (TERF2)",
            "Telomeric repeat binding factor 2 interacting protein 1 (TERF2IP)",
            "WD repeat containing antisense to TP53 (WRAP53)",
            "Shelterin complex subunit POT1 (POT1)",
            "Shelterin complex subunit TRF1 (TERF1)",
            "Shelterin complex subunit TRF2 (TERF2)",
            "Shelterin complex subunit RAP1 (TERF2IP)",
            "Shelterin complex subunit TIN2 (TINF2)",
            "Shelterin complex subunit TPP1 (ACD)",
            "Poly(A)-specific ribonuclease (PARN)",
            "Nucleolar protein 10 (NOL10)",
            "NAF1 nucleosome assembly protein (NAF1)",
            "Dyskerin pseudouridine synthase 1 (DKC1)",
            "Non-structural maintenance of chromosomes element 1 homolog (NBSL1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase RNA component (TERC)",
                "Protection of telomeres 1 (POT1)",
                "Repressor activator protein 1 (RAP1)",
                "TRF1-interacting nuclear protein 2 (TIN2)",
                "TRF1-interacting nuclear factor 2 (TINF2)",
                "Adrenocortical dysplasia protein homolog (ACD)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "CST telomere replication complex component 1 (CTC1)",
                "Telomeric repeat binding factor 1 (TERF1)",
                "Telomeric repeat binding factor 2 (TERF2)",
                "Telomeric repeat binding factor 2 interacting protein 1 (TERF2IP)",
                "WD repeat containing antisense to TP53 (WRAP53)",
                "Shelterin complex subunit POT1 (POT1)",
                "Shelterin complex subunit TRF1 (TERF1)",
                "Shelterin complex subunit TRF2 (TERF2)",
                "Shelterin complex subunit RAP1 (TERF2IP)",
                "Shelterin complex subunit TIN2 (TINF2)",
                "Shelterin complex subunit TPP1 (ACD)",
                "Poly(A)-specific ribonuclease (PARN)",
                "Nucleolar protein 10 (NOL10)",
                "NAF1 nucleosome assembly protein (NAF1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "Non-structural maintenance of chromosomes element 1 homolog (NBSL1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocortical dysplasia protein homolog (ACD)",
                "CST telomere replication complex component 1 (CTC1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "NAF1 nucleosome assembly protein (NAF1)",
                "Non-structural maintenance of chromosomes element 1 homolog (NBSL1)",
                "Nucleolar protein 10 (NOL10)",
                "Poly(A)-specific ribonuclease (PARN)",
                "Protection of telomeres 1 (POT1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Repressor activator protein 1 (RAP1)",
                "Shelterin complex subunit POT1 (POT1)",
                "Shelterin complex subunit RAP1 (TERF2IP)",
                "Shelterin complex subunit TIN2 (TINF2)",
                "Shelterin complex subunit TPP1 (ACD)",
                "Shelterin complex subunit TRF1 (TERF1)",
                "Shelterin complex subunit TRF2 (TERF2)",
                "TRF1-interacting nuclear factor 2 (TINF2)",
                "TRF1-interacting nuclear protein 2 (TIN2)",
                "Telomerase RNA component (TERC)",
                "Telomerase reverse transcriptase (TERT)",
                "Telomeric repeat binding factor 1 (TERF1)",
                "Telomeric repeat binding factor 2 (TERF2)",
                "Telomeric repeat binding factor 2 interacting protein 1 (TERF2IP)",
                "WD repeat containing antisense to TP53 (WRAP53)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Telomerase RNA Component (TERC)",
            "Telomeric Repeat Binding Factor 1 (TRF1)",
            "Telomeric Repeat Binding Factor 2 (TRF2)",
            "Protection of Telomeres 1 (POT1)",
            "Tripeptidyl Peptidase 1 (TPP1)",
            "Adrenocortical Dysplasia Homolog (ACDP1)",
            "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
            "Tankyrase 1 (TNKS1)",
            "Tankyrase 2 (TNKS2)",
            "Shelterin Complex Subunit TIN2 (TINF2)",
            "Shelterin Complex Subunit RAP1 (TERF2IP)",
            "Shelterin Complex Subunit TPP1 (ACD)",
            "Shelterin Complex Subunit TRF1 Interacting Nuclear Factor 2 (TINF2)",
            "Chromatin Remodeling Factor ATRX (ATRX)",
            "Chromatin Remodeling Factor DAXX (DAXX)",
            "Poly(ADP-Ribose) Polymerase 1 (PARP1)",
            "Poly(ADP-Ribose) Polymerase 2 (PARP2)",
            "Ku70 (XRCC6)",
            "Ku80 (XRCC5)",
            "DNA-Dependent Protein Kinase Catalytic Subunit (PRKDC)",
            "MRE11 Homolog, Double-Strand Break Repair Nuclease (MRE11)",
            "Nijmegen Breakage Syndrome 1 (NBN)",
            "RAD50 Double-Strand Break Repair Protein (RAD50)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase RNA Component (TERC)",
                "Telomeric Repeat Binding Factor 1 (TRF1)",
                "Telomeric Repeat Binding Factor 2 (TRF2)",
                "Protection of Telomeres 1 (POT1)",
                "Tripeptidyl Peptidase 1 (TPP1)",
                "Adrenocortical Dysplasia Homolog (ACDP1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Shelterin Complex Subunit TIN2 (TINF2)",
                "Shelterin Complex Subunit RAP1 (TERF2IP)",
                "Shelterin Complex Subunit TPP1 (ACD)",
                "Shelterin Complex Subunit TRF1 Interacting Nuclear Factor 2 (TINF2)",
                "Chromatin Remodeling Factor ATRX (ATRX)",
                "Chromatin Remodeling Factor DAXX (DAXX)",
                "Poly(ADP-Ribose) Polymerase 1 (PARP1)",
                "Poly(ADP-Ribose) Polymerase 2 (PARP2)",
                "Ku70 (XRCC6)",
                "Ku80 (XRCC5)",
                "DNA-Dependent Protein Kinase Catalytic Subunit (PRKDC)",
                "MRE11 Homolog, Double-Strand Break Repair Nuclease (MRE11)",
                "Nijmegen Breakage Syndrome 1 (NBN)",
                "RAD50 Double-Strand Break Repair Protein (RAD50)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocortical Dysplasia Homolog (ACDP1)",
                "Chromatin Remodeling Factor ATRX (ATRX)",
                "Chromatin Remodeling Factor DAXX (DAXX)",
                "DNA-Dependent Protein Kinase Catalytic Subunit (PRKDC)",
                "Ku70 (XRCC6)",
                "Ku80 (XRCC5)",
                "MRE11 Homolog, Double-Strand Break Repair Nuclease (MRE11)",
                "Nijmegen Breakage Syndrome 1 (NBN)",
                "Poly(ADP-Ribose) Polymerase 1 (PARP1)",
                "Poly(ADP-Ribose) Polymerase 2 (PARP2)",
                "Protection of Telomeres 1 (POT1)",
                "RAD50 Double-Strand Break Repair Protein (RAD50)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Shelterin Complex Subunit RAP1 (TERF2IP)",
                "Shelterin Complex Subunit TIN2 (TINF2)",
                "Shelterin Complex Subunit TPP1 (ACD)",
                "Shelterin Complex Subunit TRF1 Interacting Nuclear Factor 2 (TINF2)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomeric Repeat Binding Factor 1 (TRF1)",
                "Telomeric Repeat Binding Factor 2 (TRF2)",
                "Tripeptidyl Peptidase 1 (TPP1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (Telomerase Reverse Transcriptase) (TERT)",
            "TLC1 (Telomerase RNA Component) (TLC1)",
            "EST2 (EST2, telomerase catalytic subunit) (EST2)",
            "Dicer (Dicer, ribonuclease III) (Dicer)",
            "TRF1 (Telomeric Repeat Factor 1) (TRF1)",
            "TRF2 (Telomeric Repeat Factor 2) (TRF2)",
            "Rap1 (Rap1, telomere-binding protein) (Rap1)",
            "Pot1 (Protection of Telomeres 1) (Pot1)",
            "TPP1 (Telomerase-associated protein 1) (TPP1)",
            "OBFC1 (OB fold-containing protein 1) (OBFC1)",
            "EST1 (EST1, telomerase-associated protein) (EST1)",
            "Cdc13 (Cdc13, telomere-binding protein) (Cdc13)",
            "Stn1 (Stn1, telomere-binding protein) (Stn1)",
            "Ten1 (Ten1, telomere-binding protein) (Ten1)",
            "Taz1 (Taz1, telomere-binding protein) (Taz1)",
            "Mre11 (Mre11, double-strand break repair protein) (Mre11)",
            "Nbs1 (Nijmegen breakage syndrome 1) (Nbs1)",
            "Rad50 (Rad50, double-strand break repair protein) (Rad50)",
            "ATM (Ataxia-telangiectasia mutated) (ATM)",
            "BRCA1 (Breast cancer 1, early onset) (BRCA1)",
            "BRCA2 (Breast cancer 2, early onset) (BRCA2)",
            "FANCD2 (Fanconi anemia, complementation group D2) (FANCD2)",
            "FANCI (Fanconi anemia, complementation group I) (FANCI)",
            "BLM (Bloom syndrome protein) (BLM)",
            "WRN (Werner syndrome protein) (WRN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (Telomerase Reverse Transcriptase) (TERT)",
                "TLC1 (Telomerase RNA Component) (TLC1)",
                "EST2 (EST2, telomerase catalytic subunit) (EST2)",
                "Dicer (Dicer, ribonuclease III) (Dicer)",
                "TRF1 (Telomeric Repeat Factor 1) (TRF1)",
                "TRF2 (Telomeric Repeat Factor 2) (TRF2)",
                "Rap1 (Rap1, telomere-binding protein) (Rap1)",
                "Pot1 (Protection of Telomeres 1) (Pot1)",
                "TPP1 (Telomerase-associated protein 1) (TPP1)",
                "OBFC1 (OB fold-containing protein 1) (OBFC1)",
                "EST1 (EST1, telomerase-associated protein) (EST1)",
                "Cdc13 (Cdc13, telomere-binding protein) (Cdc13)",
                "Stn1 (Stn1, telomere-binding protein) (Stn1)",
                "Ten1 (Ten1, telomere-binding protein) (Ten1)",
                "Taz1 (Taz1, telomere-binding protein) (Taz1)",
                "Mre11 (Mre11, double-strand break repair protein) (Mre11)",
                "Nbs1 (Nijmegen breakage syndrome 1) (Nbs1)",
                "Rad50 (Rad50, double-strand break repair protein) (Rad50)",
                "ATM (Ataxia-telangiectasia mutated) (ATM)",
                "BRCA1 (Breast cancer 1, early onset) (BRCA1)",
                "BRCA2 (Breast cancer 2, early onset) (BRCA2)",
                "FANCD2 (Fanconi anemia, complementation group D2) (FANCD2)",
                "FANCI (Fanconi anemia, complementation group I) (FANCI)",
                "BLM (Bloom syndrome protein) (BLM)"
            ],
            "mismatches": [
                "WRN (Werner syndrome protein) (WRN)"
            ],
            "true_referents": [
                "ATM (Ataxia-telangiectasia mutated) (ATM)",
                "BLM (Bloom syndrome protein) (BLM)",
                "BRCA1 (Breast cancer 1, early onset) (BRCA1)",
                "BRCA2 (Breast cancer 2, early onset) (BRCA2)",
                "Cdc13 (Cdc13, telomere-binding protein) (Cdc13)",
                "Dicer (Dicer, ribonuclease III) (Dicer)",
                "EST1 (EST1, telomerase-associated protein) (EST1)",
                "EST2 (EST2, telomerase catalytic subunit) (EST2)",
                "FANCD2 (Fanconi anemia, complementation group D2) (FANCD2)",
                "FANCI (Fanconi anemia, complementation group I) (FANCI)",
                "Mre11 (Mre11, double-strand break repair protein) (Mre11)",
                "Nbs1 (Nijmegen breakage syndrome 1) (Nbs1)",
                "OBFC1 (OB fold-containing protein 1) (OBFC1)",
                "Pot1 (Protection of Telomeres 1) (Pot1)",
                "Rad50 (Rad50, double-strand break repair protein) (Rad50)",
                "Rap1 (Rap1, telomere-binding protein) (Rap1)",
                "Stn1 (Stn1, telomere-binding protein) (Stn1)",
                "TERT (Telomerase Reverse Transcriptase) (TERT)",
                "TLC1 (Telomerase RNA Component) (TLC1)",
                "TPP1 (Telomerase-associated protein 1) (TPP1)",
                "TRF1 (Telomeric Repeat Factor 1) (TRF1)",
                "TRF2 (Telomeric Repeat Factor 2) (TRF2)",
                "Taz1 (Taz1, telomere-binding protein) (Taz1)",
                "Ten1 (Ten1, telomere-binding protein) (Ten1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Telomerase RNA Component (TERC)",
            "Protection of Telomeres 1 (POT1)",
            "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
            "Telomere Repeat Binding Factor 1 (TERF1)",
            "Telomere Repeat Binding Factor 2 (TERF2)",
            "ATR-X syndrome, alpha-thalassemia/mental retardation syndrome X-linked (ATRX)",
            "DNase I Hypersensitive Sites 6-8 (DHX36)",
            "Polymerase Alpha (POLA1)",
            "Replication Factor C Subunit 1 (RFC1)",
            "Replication Factor C Subunit 2 (RFC2)",
            "Replication Factor C Subunit 3 (RFC3)",
            "Replication Factor C Subunit 4 (RFC4)",
            "Replication Factor C Subunit 5 (RFC5)",
            "DNA Polymerase Delta Subunit 1 (POLD1)",
            "DNA Polymerase Delta Subunit 2 (POLD2)",
            "DNA Polymerase Delta Subunit 3 (POLD3)",
            "DNA Polymerase Delta Subunit 4 (POLD4)",
            "DNA Polymerase Epsilon Subunit 1 (POLE1)",
            "DNA Polymerase Epsilon Subunit 2 (POLE2)",
            "DNA Polymerase Epsilon Subunit 3 (POLE3)",
            "DNA Polymerase Epsilon Subunit 4 (POLE4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomerase RNA Component (TERC)",
                "Protection of Telomeres 1 (POT1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Telomere Repeat Binding Factor 1 (TERF1)",
                "Telomere Repeat Binding Factor 2 (TERF2)",
                "ATR-X syndrome, alpha-thalassemia/mental retardation syndrome X-linked (ATRX)",
                "DNase I Hypersensitive Sites 6-8 (DHX36)",
                "Polymerase Alpha (POLA1)",
                "Replication Factor C Subunit 1 (RFC1)",
                "Replication Factor C Subunit 2 (RFC2)",
                "Replication Factor C Subunit 3 (RFC3)",
                "Replication Factor C Subunit 4 (RFC4)",
                "Replication Factor C Subunit 5 (RFC5)",
                "DNA Polymerase Delta Subunit 1 (POLD1)",
                "DNA Polymerase Delta Subunit 2 (POLD2)",
                "DNA Polymerase Delta Subunit 3 (POLD3)",
                "DNA Polymerase Delta Subunit 4 (POLD4)",
                "DNA Polymerase Epsilon Subunit 1 (POLE1)",
                "DNA Polymerase Epsilon Subunit 2 (POLE2)",
                "DNA Polymerase Epsilon Subunit 3 (POLE3)",
                "DNA Polymerase Epsilon Subunit 4 (POLE4)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATR-X syndrome, alpha-thalassemia/mental retardation syndrome X-linked (ATRX)",
                "DNA Polymerase Delta Subunit 1 (POLD1)",
                "DNA Polymerase Delta Subunit 2 (POLD2)",
                "DNA Polymerase Delta Subunit 3 (POLD3)",
                "DNA Polymerase Delta Subunit 4 (POLD4)",
                "DNA Polymerase Epsilon Subunit 1 (POLE1)",
                "DNA Polymerase Epsilon Subunit 2 (POLE2)",
                "DNA Polymerase Epsilon Subunit 3 (POLE3)",
                "DNA Polymerase Epsilon Subunit 4 (POLE4)",
                "DNase I Hypersensitive Sites 6-8 (DHX36)",
                "Polymerase Alpha (POLA1)",
                "Protection of Telomeres 1 (POT1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "Replication Factor C Subunit 1 (RFC1)",
                "Replication Factor C Subunit 2 (RFC2)",
                "Replication Factor C Subunit 3 (RFC3)",
                "Replication Factor C Subunit 4 (RFC4)",
                "Replication Factor C Subunit 5 (RFC5)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomere Repeat Binding Factor 1 (TERF1)",
                "Telomere Repeat Binding Factor 2 (TERF2)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            {
                "Term": "BLM",
                "Abbreviation": "BLM"
            },
            {
                "Term": "Cdc13",
                "Abbreviation": "CDC13"
            },
            {
                "Term": "Est1",
                "Abbreviation": "EST1"
            },
            {
                "Term": "Est2",
                "Abbreviation": "EST2"
            },
            {
                "Term": "Est3",
                "Abbreviation": "EST3"
            },
            {
                "Term": "Est4",
                "Abbreviation": "EST4"
            },
            {
                "Term": "Est5",
                "Abbreviation": "EST5"
            },
            {
                "Term": "Est6",
                "Abbreviation": "EST6"
            },
            {
                "Term": "Est7",
                "Abbreviation": "EST7"
            },
            {
                "Term": "Est8",
                "Abbreviation": "EST8"
            },
            {
                "Term": "Est9",
                "Abbreviation": "EST9"
            },
            {
                "Term": "Est10",
                "Abbreviation": "EST10"
            },
            {
                "Term": "Est11",
                "Abbreviation": "EST11"
            },
            {
                "Term": "Est12",
                "Abbreviation": "EST12"
            },
            {
                "Term": "Est13",
                "Abbreviation": "EST13"
            },
            {
                "Term": "Est14",
                "Abbreviation": "EST14"
            },
            {
                "Term": "Est15",
                "Abbreviation": "EST15"
            },
            {
                "Term": "Est16",
                "Abbreviation": "EST16"
            },
            {
                "Term": "Est17",
                "Abbreviation": "EST17"
            },
            {
                "Term": "Est18",
                "Abbreviation": "EST18"
            },
            {
                "Term": "Est19",
                "Abbreviation": "EST19"
            },
            {
                "Term": "Est20",
                "Abbreviation": "EST20"
            },
            {
                "Term": "Est21",
                "Abbreviation": "EST21"
            },
            {
                "Term": "Est22",
                "Abbreviation": "EST22"
            },
            {
                "Term": "Est23",
                "Abbreviation": "EST23"
            },
            {
                "Term": "Est24",
                "Abbreviation": "EST24"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BLM",
                "Cdc13",
                "Est1",
                "Est2",
                "Est3",
                "Est4",
                "Est5",
                "Est6",
                "Est7",
                "Est8",
                "Est9",
                "Est10",
                "Est11",
                "Est12",
                "Est13",
                "Est14",
                "Est15",
                "Est16",
                "Est17",
                "Est18",
                "Est19",
                "Est20",
                "Est21",
                "Est22"
            ],
            "mismatches": [
                "Est23",
                "Est24"
            ],
            "true_referents": [
                "{\"Term\": \"BLM\", \"Abbreviation\": \"BLM\"}",
                "{\"Term\": \"Cdc13\", \"Abbreviation\": \"CDC13\"}",
                "{\"Term\": \"Est1\", \"Abbreviation\": \"EST1\"}",
                "{\"Term\": \"Est10\", \"Abbreviation\": \"EST10\"}",
                "{\"Term\": \"Est11\", \"Abbreviation\": \"EST11\"}",
                "{\"Term\": \"Est12\", \"Abbreviation\": \"EST12\"}",
                "{\"Term\": \"Est13\", \"Abbreviation\": \"EST13\"}",
                "{\"Term\": \"Est14\", \"Abbreviation\": \"EST14\"}",
                "{\"Term\": \"Est15\", \"Abbreviation\": \"EST15\"}",
                "{\"Term\": \"Est16\", \"Abbreviation\": \"EST16\"}",
                "{\"Term\": \"Est17\", \"Abbreviation\": \"EST17\"}",
                "{\"Term\": \"Est18\", \"Abbreviation\": \"EST18\"}",
                "{\"Term\": \"Est19\", \"Abbreviation\": \"EST19\"}",
                "{\"Term\": \"Est2\", \"Abbreviation\": \"EST2\"}",
                "{\"Term\": \"Est20\", \"Abbreviation\": \"EST20\"}",
                "{\"Term\": \"Est21\", \"Abbreviation\": \"EST21\"}",
                "{\"Term\": \"Est22\", \"Abbreviation\": \"EST22\"}",
                "{\"Term\": \"Est3\", \"Abbreviation\": \"EST3\"}",
                "{\"Term\": \"Est4\", \"Abbreviation\": \"EST4\"}",
                "{\"Term\": \"Est5\", \"Abbreviation\": \"EST5\"}",
                "{\"Term\": \"Est6\", \"Abbreviation\": \"EST6\"}",
                "{\"Term\": \"Est7\", \"Abbreviation\": \"EST7\"}",
                "{\"Term\": \"Est8\", \"Abbreviation\": \"EST8\"}",
                "{\"Term\": \"Est9\", \"Abbreviation\": \"EST9\"}"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    }
]