[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (TER)",
            "TERC (TR)",
            "DKC1",
            "NHP2",
            "NOP10",
            "TCAB1",
            "TINF2",
            "POT1",
            "RTEL1",
            "PARN",
            "WRAP53",
            "STN1",
            "TERT (hTERT)",
            "NOPP140",
            "POTIP1",
            "TINF2 (TERF2IP)",
            "POTIP2",
            "NHP2L1",
            "TCAB1 (TCAB1)",
            "TINF2 (TERF2)",
            "WRAP53 (TCAB1)",
            "RMI1",
            "RMI2",
            "TERRA"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (TER)",
                "TERC (TR)",
                "DKC1",
                "NHP2",
                "NOP10",
                "TCAB1",
                "TINF2",
                "POT1",
                "RTEL1",
                "PARN",
                "WRAP53",
                "STN1",
                "TERT (hTERT)",
                "NOPP140",
                "POTIP1",
                "TINF2 (TERF2IP)",
                "POTIP2",
                "NHP2L1",
                "TCAB1 (TCAB1)",
                "TINF2 (TERF2)",
                "WRAP53 (TCAB1)",
                "RMI1",
                "RMI2",
                "TERRA"
            ],
            "mismatches": [],
            "true_referents": [
                "DKC1",
                "NHP2",
                "NHP2L1",
                "NOP10",
                "NOPP140",
                "PARN",
                "POT1",
                "POTIP1",
                "POTIP2",
                "RMI1",
                "RMI2",
                "RTEL1",
                "STN1",
                "TCAB1",
                "TCAB1 (TCAB1)",
                "TERC (TR)",
                "TERRA",
                "TERT (TER)",
                "TERT (hTERT)",
                "TINF2",
                "TINF2 (TERF2)",
                "TINF2 (TERF2IP)",
                "WRAP53",
                "WRAP53 (TCAB1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (telomerase reverse transcriptase)",
            "TERC (telomerase RNA component)",
            "DKC1 (dyskerin)",
            "NOP10 (nucleolar protein 10)",
            "NHP2 (nucleolar protein 2)",
            "TCAB1 (telomerase Cajal body protein 1)",
            "TINF2 (TRF1-interacting nuclear factor 2)",
            "TPP1 (TIN2-interacting protein 1)",
            "POT1 (protection of telomeres 1)",
            "TRF1 (telomeric repeat-binding factor 1)",
            "TRF2 (telomeric repeat-binding factor 2)",
            "RTEL1 (regulator of telomere elongation helicase 1)",
            "ACD (ATRX-DAXX chromatin remodeling complex)",
            "ATRX (alpha thalassemia/mental retardation syndrome X-linked)",
            "DAXX (death-domain associated protein)",
            "WRAP53 (WRAP53 beta)",
            "Rap1 (repressor/activator protein 1)",
            "STN1 (single-stranded DNA-binding protein 1)",
            "TERF2IP (TERF2 interacting protein)",
            "NOP56 (nucleolar protein 56)",
            "NOP58 (nucleolar protein 58)",
            "TIN2 (TRF1-interacting nuclear protein 2)",
            "POT1B (protection of telomeres 1B)",
            "POT1C (protection of telomeres 1C)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (telomerase reverse transcriptase)",
                "TERC (telomerase RNA component)",
                "DKC1 (dyskerin)",
                "NOP10 (nucleolar protein 10)",
                "NHP2 (nucleolar protein 2)",
                "TCAB1 (telomerase Cajal body protein 1)",
                "TINF2 (TRF1-interacting nuclear factor 2)",
                "TPP1 (TIN2-interacting protein 1)",
                "POT1 (protection of telomeres 1)",
                "TRF1 (telomeric repeat-binding factor 1)",
                "TRF2 (telomeric repeat-binding factor 2)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "ACD (ATRX-DAXX chromatin remodeling complex)",
                "ATRX (alpha thalassemia/mental retardation syndrome X-linked)",
                "DAXX (death-domain associated protein)",
                "WRAP53 (WRAP53 beta)",
                "Rap1 (repressor/activator protein 1)",
                "STN1 (single-stranded DNA-binding protein 1)",
                "TERF2IP (TERF2 interacting protein)",
                "NOP56 (nucleolar protein 56)",
                "NOP58 (nucleolar protein 58)",
                "TIN2 (TRF1-interacting nuclear protein 2)",
                "POT1B (protection of telomeres 1B)",
                "POT1C (protection of telomeres 1C)"
            ],
            "mismatches": [],
            "true_referents": [
                "ACD (ATRX-DAXX chromatin remodeling complex)",
                "ATRX (alpha thalassemia/mental retardation syndrome X-linked)",
                "DAXX (death-domain associated protein)",
                "DKC1 (dyskerin)",
                "NHP2 (nucleolar protein 2)",
                "NOP10 (nucleolar protein 10)",
                "NOP56 (nucleolar protein 56)",
                "NOP58 (nucleolar protein 58)",
                "POT1 (protection of telomeres 1)",
                "POT1B (protection of telomeres 1B)",
                "POT1C (protection of telomeres 1C)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "Rap1 (repressor/activator protein 1)",
                "STN1 (single-stranded DNA-binding protein 1)",
                "TCAB1 (telomerase Cajal body protein 1)",
                "TERC (telomerase RNA component)",
                "TERF2IP (TERF2 interacting protein)",
                "TERT (telomerase reverse transcriptase)",
                "TIN2 (TRF1-interacting nuclear protein 2)",
                "TINF2 (TRF1-interacting nuclear factor 2)",
                "TPP1 (TIN2-interacting protein 1)",
                "TRF1 (telomeric repeat-binding factor 1)",
                "TRF2 (telomeric repeat-binding factor 2)",
                "WRAP53 (WRAP53 beta)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (Telomerase Reverse Transcriptase)",
            "TERC (Telomerase RNA Component)",
            "DCK1 (Dyskerin)",
            "TIN2 (TRF1-Interacting Nuclear Factor 2)",
            "POT1 (Protection of Telomeres 1)",
            "TPP1 (Tripeptidyl Peptidase 1)",
            "RAP1 (Repressor Activator Protein 1)",
            "TRF1 (Telomeric Repeat-Binding Factor 1)",
            "TRF2 (Telomeric Repeat-Binding Factor 2)",
            "TNKS1 (Tankyrase 1)",
            "TNKS2 (Tankyrase 2)",
            "MRN Complex (MRE11, RAD50, NBS1)",
            "RTEL1 (Regulator of Telomere Length 1)",
            "RTL1 (Regulator of Telomere Length 1)",
            "WRN (Werner Syndrome RecQ Like Helicase)",
            "BLM (Bloom Syndrome RecQ Like Helicase)",
            "XRCC3 (X-ray Repair Cross Complementing 3)",
            "RAD51 (RAD51 Recombinase)",
            "RAD52 (RAD52 Homolog)",
            "RAD54 (RAD54 Like)",
            "XRCC1 (X-ray Repair Cross Complementing 1)",
            "XRCC2 (X-ray Repair Cross Complementing 2)",
            "XRCC4 (X-ray Repair Cross Complementing 4)",
            "XRCC5 (X-ray Repair Cross Complementing 5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (Telomerase Reverse Transcriptase)",
                "TERC (Telomerase RNA Component)",
                "DCK1 (Dyskerin)",
                "TIN2 (TRF1-Interacting Nuclear Factor 2)",
                "POT1 (Protection of Telomeres 1)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "RAP1 (Repressor Activator Protein 1)",
                "TRF1 (Telomeric Repeat-Binding Factor 1)",
                "TRF2 (Telomeric Repeat-Binding Factor 2)",
                "TNKS1 (Tankyrase 1)",
                "TNKS2 (Tankyrase 2)",
                "MRN Complex (MRE11, RAD50, NBS1)",
                "RTEL1 (Regulator of Telomere Length 1)",
                "RTL1 (Regulator of Telomere Length 1)",
                "WRN (Werner Syndrome RecQ Like Helicase)",
                "BLM (Bloom Syndrome RecQ Like Helicase)",
                "XRCC3 (X-ray Repair Cross Complementing 3)",
                "RAD51 (RAD51 Recombinase)",
                "RAD52 (RAD52 Homolog)",
                "RAD54 (RAD54 Like)",
                "XRCC1 (X-ray Repair Cross Complementing 1)",
                "XRCC2 (X-ray Repair Cross Complementing 2)",
                "XRCC4 (X-ray Repair Cross Complementing 4)",
                "XRCC5 (X-ray Repair Cross Complementing 5)"
            ],
            "mismatches": [],
            "true_referents": [
                "BLM (Bloom Syndrome RecQ Like Helicase)",
                "DCK1 (Dyskerin)",
                "MRN Complex (MRE11, RAD50, NBS1)",
                "POT1 (Protection of Telomeres 1)",
                "RAD51 (RAD51 Recombinase)",
                "RAD52 (RAD52 Homolog)",
                "RAD54 (RAD54 Like)",
                "RAP1 (Repressor Activator Protein 1)",
                "RTEL1 (Regulator of Telomere Length 1)",
                "RTL1 (Regulator of Telomere Length 1)",
                "TERC (Telomerase RNA Component)",
                "TERT (Telomerase Reverse Transcriptase)",
                "TIN2 (TRF1-Interacting Nuclear Factor 2)",
                "TNKS1 (Tankyrase 1)",
                "TNKS2 (Tankyrase 2)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "TRF1 (Telomeric Repeat-Binding Factor 1)",
                "TRF2 (Telomeric Repeat-Binding Factor 2)",
                "WRN (Werner Syndrome RecQ Like Helicase)",
                "XRCC1 (X-ray Repair Cross Complementing 1)",
                "XRCC2 (X-ray Repair Cross Complementing 2)",
                "XRCC3 (X-ray Repair Cross Complementing 3)",
                "XRCC4 (X-ray Repair Cross Complementing 4)",
                "XRCC5 (X-ray Repair Cross Complementing 5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (hTERT)",
            "TERC (hTR)",
            "POT1",
            "TPP1",
            "RAP1",
            "TIN2",
            "TRF1",
            "TRF2",
            "Shelterin complex",
            "Dyskerin (DKC1)",
            "TCAB1",
            "NOP10",
            "NHP2",
            "EST1",
            "SMG9",
            "PINX1",
            "MAD2",
            "BubR1",
            "ATM",
            "ATR",
            "WRN",
            "BLM",
            "Ku70/Ku80 heterodimer",
            "PARP1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (hTERT)",
                "TERC (hTR)",
                "POT1",
                "TPP1",
                "RAP1",
                "TIN2",
                "TRF1",
                "TRF2",
                "Shelterin complex",
                "Dyskerin (DKC1)",
                "TCAB1",
                "NOP10",
                "NHP2",
                "EST1",
                "SMG9",
                "PINX1",
                "MAD2",
                "BubR1",
                "ATM",
                "ATR",
                "WRN",
                "BLM",
                "Ku70/Ku80 heterodimer",
                "PARP1"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM",
                "ATR",
                "BLM",
                "BubR1",
                "Dyskerin (DKC1)",
                "EST1",
                "Ku70/Ku80 heterodimer",
                "MAD2",
                "NHP2",
                "NOP10",
                "PARP1",
                "PINX1",
                "POT1",
                "RAP1",
                "SMG9",
                "Shelterin complex",
                "TCAB1",
                "TERC (hTR)",
                "TERT (hTERT)",
                "TIN2",
                "TPP1",
                "TRF1",
                "TRF2",
                "WRN"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase reverse transcriptase (TERT)",
            "Telomerase RNA component (TERC)",
            "Protection of telomeres protein 1 (POT1)",
            "Telomere repeat-binding factor 1 (TERF1/TRF1)",
            "Telomere repeat-binding factor 2 (TERF2/TRF2)",
            "Repressor/activator protein 1 (RAP1)",
            "Telomeric repeat-binding factor 2-interacting protein 1 (TERF2IP/RAP1)",
            "TIN2 interacting protein (TPP1/ACD)",
            "TRF1-interacting nuclear factor 2 (TINF2/TIN2)",
            "Tankyrase 1 (TNKS1)",
            "Tankyrase 2 (TNKS2)",
            "Pin2/TRF1-interacting telomerase inhibitor 1 (PINX1)",
            "Nuclear assembly factor 1 (NAF1)",
            "Nucleolar protein 7 (NOP7)",
            "NOP10 ribonucleoprotein (NOP10)",
            "GAR1 ribonucleoprotein homolog (GAR1)",
            "Dyskerin pseudouridine synthase 1 (DKC1)",
            "NHP2 ribonucleoprotein (NHP2)",
            "Telomeric zinc finger-associated protein (TZAP)",
            "Apollo (APOLLO/WRNIP1)",
            "CST complex subunit STN1 (STN1)",
            "CST complex subunit CTC1 (CTC1)",
            "CST complex subunit TEN1 (TEN1)",
            "Regulator of telomere elongation helicase 1 (RTEL1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase RNA component (TERC)",
                "Protection of telomeres protein 1 (POT1)",
                "Telomere repeat-binding factor 1 (TERF1/TRF1)",
                "Telomere repeat-binding factor 2 (TERF2/TRF2)",
                "Repressor/activator protein 1 (RAP1)",
                "Telomeric repeat-binding factor 2-interacting protein 1 (TERF2IP/RAP1)",
                "TIN2 interacting protein (TPP1/ACD)",
                "TRF1-interacting nuclear factor 2 (TINF2/TIN2)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Pin2/TRF1-interacting telomerase inhibitor 1 (PINX1)",
                "Nuclear assembly factor 1 (NAF1)",
                "Nucleolar protein 7 (NOP7)",
                "NOP10 ribonucleoprotein (NOP10)",
                "GAR1 ribonucleoprotein homolog (GAR1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "NHP2 ribonucleoprotein (NHP2)",
                "Telomeric zinc finger-associated protein (TZAP)",
                "Apollo (APOLLO/WRNIP1)",
                "CST complex subunit STN1 (STN1)",
                "CST complex subunit CTC1 (CTC1)",
                "CST complex subunit TEN1 (TEN1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Apollo (APOLLO/WRNIP1)",
                "CST complex subunit CTC1 (CTC1)",
                "CST complex subunit STN1 (STN1)",
                "CST complex subunit TEN1 (TEN1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "GAR1 ribonucleoprotein homolog (GAR1)",
                "NHP2 ribonucleoprotein (NHP2)",
                "NOP10 ribonucleoprotein (NOP10)",
                "Nuclear assembly factor 1 (NAF1)",
                "Nucleolar protein 7 (NOP7)",
                "Pin2/TRF1-interacting telomerase inhibitor 1 (PINX1)",
                "Protection of telomeres protein 1 (POT1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Repressor/activator protein 1 (RAP1)",
                "TIN2 interacting protein (TPP1/ACD)",
                "TRF1-interacting nuclear factor 2 (TINF2/TIN2)",
                "Tankyrase 1 (TNKS1)",
                "Tankyrase 2 (TNKS2)",
                "Telomerase RNA component (TERC)",
                "Telomerase reverse transcriptase (TERT)",
                "Telomere repeat-binding factor 1 (TERF1/TRF1)",
                "Telomere repeat-binding factor 2 (TERF2/TRF2)",
                "Telomeric repeat-binding factor 2-interacting protein 1 (TERF2IP/RAP1)",
                "Telomeric zinc finger-associated protein (TZAP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (telomerase reverse transcriptase)",
            "TERC (telomerase RNA component)",
            "POT1 (protection of telomeres 1)",
            "TRF1 (telomeric repeat binding factor 1)",
            "TRF2 (telomeric repeat binding factor 2)",
            "TIN2 (TRF1-interacting nuclear protein 2)",
            "TPP1 (TIN2-interacting protein 1)",
            "WRAP53 (WD repeat and phosphoinositide-interacting protein 53)",
            "RTEL1 (regulator of telomere elongation helicase 1)",
            "BLM (Bloom syndrome protein)",
            "DAXX (death-domain associated protein)",
            "FANCJ (Fanconi anemia complementation group J)",
            "NHP2 (nuclear RNA helicase 2)",
            "NOP10 (nucleolar protein 10)",
            "MRE11 (meiotic recombination 11 homolog)",
            "ATM (ataxia telangiectasia mutated)",
            "ATR (ataxia telangiectasia and Rad3 related)",
            "TP53 (tumor protein p53)",
            "RAD51 (radiation sensitive 51)",
            "SMC6 (structural maintenance of chromosomes 6)",
            "CST complex (composed of CTC1, STN1, and TEN1)",
            "TINF2 (telomeric repeat-binding factor 2-interacting factor 2)",
            "POT1B (protection of telomeres 1B)",
            "TERRA (telomeric repeat-containing RNA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (telomerase reverse transcriptase)",
                "TERC (telomerase RNA component)",
                "POT1 (protection of telomeres 1)",
                "TRF1 (telomeric repeat binding factor 1)",
                "TRF2 (telomeric repeat binding factor 2)",
                "TIN2 (TRF1-interacting nuclear protein 2)",
                "TPP1 (TIN2-interacting protein 1)",
                "WRAP53 (WD repeat and phosphoinositide-interacting protein 53)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "BLM (Bloom syndrome protein)",
                "DAXX (death-domain associated protein)",
                "FANCJ (Fanconi anemia complementation group J)",
                "NHP2 (nuclear RNA helicase 2)",
                "NOP10 (nucleolar protein 10)",
                "MRE11 (meiotic recombination 11 homolog)",
                "ATM (ataxia telangiectasia mutated)",
                "ATR (ataxia telangiectasia and Rad3 related)",
                "TP53 (tumor protein p53)",
                "RAD51 (radiation sensitive 51)",
                "SMC6 (structural maintenance of chromosomes 6)",
                "CST complex (composed of CTC1, STN1, and TEN1)",
                "TINF2 (telomeric repeat-binding factor 2-interacting factor 2)",
                "POT1B (protection of telomeres 1B)",
                "TERRA (telomeric repeat-containing RNA)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM (ataxia telangiectasia mutated)",
                "ATR (ataxia telangiectasia and Rad3 related)",
                "BLM (Bloom syndrome protein)",
                "CST complex (composed of CTC1, STN1, and TEN1)",
                "DAXX (death-domain associated protein)",
                "FANCJ (Fanconi anemia complementation group J)",
                "MRE11 (meiotic recombination 11 homolog)",
                "NHP2 (nuclear RNA helicase 2)",
                "NOP10 (nucleolar protein 10)",
                "POT1 (protection of telomeres 1)",
                "POT1B (protection of telomeres 1B)",
                "RAD51 (radiation sensitive 51)",
                "RTEL1 (regulator of telomere elongation helicase 1)",
                "SMC6 (structural maintenance of chromosomes 6)",
                "TERC (telomerase RNA component)",
                "TERRA (telomeric repeat-containing RNA)",
                "TERT (telomerase reverse transcriptase)",
                "TIN2 (TRF1-interacting nuclear protein 2)",
                "TINF2 (telomeric repeat-binding factor 2-interacting factor 2)",
                "TP53 (tumor protein p53)",
                "TPP1 (TIN2-interacting protein 1)",
                "TRF1 (telomeric repeat binding factor 1)",
                "TRF2 (telomeric repeat binding factor 2)",
                "WRAP53 (WD repeat and phosphoinositide-interacting protein 53)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase reverse transcriptase (TERT)",
            "Protection of telomeres 1 (POT1)",
            "Telomeric repeat-binding factor 1 (TRF1)",
            "Telomeric repeat-binding factor 2 (TRF2)",
            "Telomerase RNA Component (TERC)",
            "Adrenocortical dysplasia protein homolog (ACD)",
            "Protection of telomeres 1B (POT1B)",
            "Rap1-interacting factor 1 homolog (RIF1)",
            "Telomere length regulation protein (TEN1)",
            "Stn1, CST complex subunit (STN1)",
            "Ctc1, CST complex subunit (CTC1)",
            "Telomerase Cajal body protein 1 (TCAB1)",
            "Dyskerin pseudouridine synthase 1 (DKC1)",
            "NHP2 ribonucleoprotein (NHP2)",
            "Nucleolar protein 10 (NOP10)",
            "Gar1 ribonucleoprotein (GAR1)",
            "Telomerase-associated protein 1 (TEP1)",
            "Telomere-associated protein RIF1 (RIF1)",
            "Telomere maintenance 2 (WRAP53)",
            "Regulator of telomere elongation helicase 1 (RTEL1)",
            "Telomeric repeat-binding factor 2-interacting protein 1 (TERF2IP)",
            "PinX1 (PINX1)",
            "Telomeric overhang-binding protein (TEBP)",
            "Telomere-specific endonuclease 1 (TEN1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase reverse transcriptase (TERT)",
                "Protection of telomeres 1 (POT1)",
                "Telomeric repeat-binding factor 1 (TRF1)",
                "Telomeric repeat-binding factor 2 (TRF2)",
                "Telomerase RNA Component (TERC)",
                "Adrenocortical dysplasia protein homolog (ACD)",
                "Protection of telomeres 1B (POT1B)",
                "Rap1-interacting factor 1 homolog (RIF1)",
                "Telomere length regulation protein (TEN1)",
                "Stn1, CST complex subunit (STN1)",
                "Ctc1, CST complex subunit (CTC1)",
                "Telomerase Cajal body protein 1 (TCAB1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "NHP2 ribonucleoprotein (NHP2)",
                "Nucleolar protein 10 (NOP10)",
                "Gar1 ribonucleoprotein (GAR1)",
                "Telomerase-associated protein 1 (TEP1)",
                "Telomere-associated protein RIF1 (RIF1)",
                "Telomere maintenance 2 (WRAP53)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Telomeric repeat-binding factor 2-interacting protein 1 (TERF2IP)",
                "PinX1 (PINX1)",
                "Telomeric overhang-binding protein (TEBP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocortical dysplasia protein homolog (ACD)",
                "Ctc1, CST complex subunit (CTC1)",
                "Dyskerin pseudouridine synthase 1 (DKC1)",
                "Gar1 ribonucleoprotein (GAR1)",
                "NHP2 ribonucleoprotein (NHP2)",
                "Nucleolar protein 10 (NOP10)",
                "PinX1 (PINX1)",
                "Protection of telomeres 1 (POT1)",
                "Protection of telomeres 1B (POT1B)",
                "Rap1-interacting factor 1 homolog (RIF1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Stn1, CST complex subunit (STN1)",
                "Telomerase Cajal body protein 1 (TCAB1)",
                "Telomerase RNA Component (TERC)",
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase-associated protein 1 (TEP1)",
                "Telomere length regulation protein (TEN1)",
                "Telomere maintenance 2 (WRAP53)",
                "Telomere-associated protein RIF1 (RIF1)",
                "Telomere-specific endonuclease 1 (TEN1)",
                "Telomeric overhang-binding protein (TEBP)",
                "Telomeric repeat-binding factor 1 (TRF1)",
                "Telomeric repeat-binding factor 2 (TRF2)",
                "Telomeric repeat-binding factor 2-interacting protein 1 (TERF2IP)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TP53 (p53)",
            "TERT (telomerase reverse transcriptase)",
            "TERC (telomerase RNA component)",
            "TERF1 (telomeric repeat binding factor 1)",
            "TERF2 (telomeric repeat binding factor 2)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
            "TERF2IP (telomeric repeat binding factor 2 interacting protein)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TP53 (p53)",
                "TERT (telomerase reverse transcriptase)",
                "TERC (telomerase RNA component)",
                "TERF1 (telomeric repeat binding factor 1)",
                "TERF2 (telomeric repeat binding factor 2)",
                "TERF2IP (telomeric repeat binding factor 2 interacting protein)"
            ],
            "mismatches": [],
            "true_referents": [
                "TERC (telomerase RNA component)",
                "TERF1 (telomeric repeat binding factor 1)",
                "TERF2 (telomeric repeat binding factor 2)",
                "TERF2IP (telomeric repeat binding factor 2 interacting protein)",
                "TERT (telomerase reverse transcriptase)",
                "TP53 (p53)"
            ],
            "TP": 6,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (Telomerase Reverse Transcriptase)",
            "TERC (Telomerase RNA Component)",
            "DKC1 (Dyskerin)",
            "NOP10",
            "NHP2",
            "GAR1",
            "TINF2 (TERF1-Interacting Nuclear Factor 2)",
            "POT1 (Protection of Telomeres 1)",
            "ACD (TPP1)",
            "TERF1 (Telomeric Repeat-Binding Factor 1)",
            "TERF2 (Telomeric Repeat-Binding Factor 2)",
            "TERF2IP (TERF2-Interacting Protein, RAP1)",
            "CTC1",
            "STN1",
            "TEN1",
            "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
            "WRN (Werner Syndrome Helicase)",
            "BLM (Bloom Syndrome Helicase)",
            "ATM (Ataxia Telangiectasia Mutated)",
            "ATR (ATM and Rad3-Related)",
            "SLX4",
            "RPA1 (Replication Protein A1)",
            "RPA2 (Replication Protein A2)",
            "RPA3 (Replication Protein A3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (Telomerase Reverse Transcriptase)",
                "TERC (Telomerase RNA Component)",
                "DKC1 (Dyskerin)",
                "NOP10",
                "NHP2",
                "GAR1",
                "TINF2 (TERF1-Interacting Nuclear Factor 2)",
                "POT1 (Protection of Telomeres 1)",
                "ACD (TPP1)",
                "TERF1 (Telomeric Repeat-Binding Factor 1)",
                "TERF2 (Telomeric Repeat-Binding Factor 2)",
                "TERF2IP (TERF2-Interacting Protein, RAP1)",
                "CTC1",
                "STN1",
                "TEN1",
                "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
                "WRN (Werner Syndrome Helicase)",
                "BLM (Bloom Syndrome Helicase)",
                "ATM (Ataxia Telangiectasia Mutated)",
                "ATR (ATM and Rad3-Related)",
                "SLX4",
                "RPA1 (Replication Protein A1)",
                "RPA2 (Replication Protein A2)",
                "RPA3 (Replication Protein A3)"
            ],
            "mismatches": [],
            "true_referents": [
                "ACD (TPP1)",
                "ATM (Ataxia Telangiectasia Mutated)",
                "ATR (ATM and Rad3-Related)",
                "BLM (Bloom Syndrome Helicase)",
                "CTC1",
                "DKC1 (Dyskerin)",
                "GAR1",
                "NHP2",
                "NOP10",
                "POT1 (Protection of Telomeres 1)",
                "RPA1 (Replication Protein A1)",
                "RPA2 (Replication Protein A2)",
                "RPA3 (Replication Protein A3)",
                "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
                "SLX4",
                "STN1",
                "TEN1",
                "TERC (Telomerase RNA Component)",
                "TERF1 (Telomeric Repeat-Binding Factor 1)",
                "TERF2 (Telomeric Repeat-Binding Factor 2)",
                "TERF2IP (TERF2-Interacting Protein, RAP1)",
                "TERT (Telomerase Reverse Transcriptase)",
                "TINF2 (TERF1-Interacting Nuclear Factor 2)",
                "WRN (Werner Syndrome Helicase)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase Reverse Transcriptase (TERT)",
            "Protection of Telomeres 1 (POT1)",
            "Telomeric Repeat Binding Factor 1 (TERF1)",
            "Telomeric Repeat Binding Factor 2 (TERF2)",
            "TERF1 Interacting Nuclear Factor 2 (TINF2)",
            "ACD Shelterin Complex Subunit And Telomerase Recruitment Factor (ACD)",
            "Telomeric Repeat Binding Factor 2 Interacting Protein (TERF2IP)",
            "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
            "CST Telomere Replication Complex Component 1 (CTC1)",
            "STN1 Subunit Of CST Complex (STN1)",
            "TEN1 Subunit Of CST Complex (TEN1)",
            "Telomere Maintenance 2 (TELO2)",
            "Telomere Length Regulation Protein TEL2 Homolog (TTI1)",
            "Telomere Length Regulation Protein TEL2 Homolog (TTI2)",
            "Dyskeratosis Congenita 1 (DKC1)",
            "NHP2 Ribonucleoprotein (NHP2)",
            "NOP10 Ribonucleoprotein (NOP10)",
            "GAR1 Ribonucleoprotein (GAR1)",
            "Telomerase RNA Component (TERC)",
            "TNKS Tankyrase 1 (TNKS)",
            "TNKS2 Tankyrase 2 (TNKS2)",
            "Werner Syndrome RecQ Like Helicase (WRN)",
            "Bloom Syndrome RecQ Like Helicase (BLM)",
            "ATM Serine/Threonine Kinase (ATM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase Reverse Transcriptase (TERT)",
                "Protection of Telomeres 1 (POT1)",
                "Telomeric Repeat Binding Factor 1 (TERF1)",
                "Telomeric Repeat Binding Factor 2 (TERF2)",
                "TERF1 Interacting Nuclear Factor 2 (TINF2)",
                "ACD Shelterin Complex Subunit And Telomerase Recruitment Factor (ACD)",
                "Telomeric Repeat Binding Factor 2 Interacting Protein (TERF2IP)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "CST Telomere Replication Complex Component 1 (CTC1)",
                "STN1 Subunit Of CST Complex (STN1)",
                "TEN1 Subunit Of CST Complex (TEN1)",
                "Telomere Maintenance 2 (TELO2)",
                "Telomere Length Regulation Protein TEL2 Homolog (TTI1)",
                "Telomere Length Regulation Protein TEL2 Homolog (TTI2)",
                "Dyskeratosis Congenita 1 (DKC1)",
                "NHP2 Ribonucleoprotein (NHP2)",
                "NOP10 Ribonucleoprotein (NOP10)",
                "GAR1 Ribonucleoprotein (GAR1)",
                "Telomerase RNA Component (TERC)",
                "TNKS Tankyrase 1 (TNKS)",
                "TNKS2 Tankyrase 2 (TNKS2)",
                "Werner Syndrome RecQ Like Helicase (WRN)",
                "Bloom Syndrome RecQ Like Helicase (BLM)",
                "ATM Serine/Threonine Kinase (ATM)"
            ],
            "mismatches": [],
            "true_referents": [
                "ACD Shelterin Complex Subunit And Telomerase Recruitment Factor (ACD)",
                "ATM Serine/Threonine Kinase (ATM)",
                "Bloom Syndrome RecQ Like Helicase (BLM)",
                "CST Telomere Replication Complex Component 1 (CTC1)",
                "Dyskeratosis Congenita 1 (DKC1)",
                "GAR1 Ribonucleoprotein (GAR1)",
                "NHP2 Ribonucleoprotein (NHP2)",
                "NOP10 Ribonucleoprotein (NOP10)",
                "Protection of Telomeres 1 (POT1)",
                "Regulator of Telomere Elongation Helicase 1 (RTEL1)",
                "STN1 Subunit Of CST Complex (STN1)",
                "TEN1 Subunit Of CST Complex (TEN1)",
                "TERF1 Interacting Nuclear Factor 2 (TINF2)",
                "TNKS Tankyrase 1 (TNKS)",
                "TNKS2 Tankyrase 2 (TNKS2)",
                "Telomerase RNA Component (TERC)",
                "Telomerase Reverse Transcriptase (TERT)",
                "Telomere Length Regulation Protein TEL2 Homolog (TTI1)",
                "Telomere Length Regulation Protein TEL2 Homolog (TTI2)",
                "Telomere Maintenance 2 (TELO2)",
                "Telomeric Repeat Binding Factor 1 (TERF1)",
                "Telomeric Repeat Binding Factor 2 (TERF2)",
                "Telomeric Repeat Binding Factor 2 Interacting Protein (TERF2IP)",
                "Werner Syndrome RecQ Like Helicase (WRN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERC (Telomerase RNA Component)",
            "TERT (Telomerase Reverse Transcriptase)",
            "TERF1 (Telomeric Repeat Binding Factor 1)",
            "TERF2 (Telomeric Repeat Binding Factor 2)",
            "TINF2 (TERF1 Interacting Nuclear Factor 2)",
            "ACD (Adrenocortical Dysplasia Homolog)",
            "POT1 (Protection of Telomeres 1)",
            "TPP1 (Tripeptidyl Peptidase 1)",
            "TERF2IP (TERF2 Interacting Protein)",
            "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
            "PARN (Poly(A)-Specific Ribonuclease)",
            "NOP10 (NOP10 Ribonucleoprotein)",
            "NHP2 (NHP2 Ribonucleoprotein)",
            "DKC1 (Dyskerin Pseudouridine Synthase 1)",
            "WRAP53 (WD Repeat Containing Antisense to TP53)",
            "HNRNPA1 (Heterogeneous Nuclear Ribonucleoprotein A1)",
            "HNRNPA2B1 (Heterogeneous Nuclear Ribonucleoprotein A2/B1)",
            "TCAB1 (Telomerase Cajal Body Protein 1)",
            "NAF1 (Nuclear Assembly Factor 1 Ribonucleoprotein)",
            "PINX1 (PIN2/TERF1 Interacting Telomerase Inhibitor 1)",
            "MCRS1 (Microspherule Protein 1)",
            "RPA1 (Replication Protein A1)",
            "STN1 (STN1 Subunit of CST Complex)",
            "CTC1 (CTS Telomere Maintenance Complex Component 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERC (Telomerase RNA Component)",
                "TERT (Telomerase Reverse Transcriptase)",
                "TERF1 (Telomeric Repeat Binding Factor 1)",
                "TERF2 (Telomeric Repeat Binding Factor 2)",
                "TINF2 (TERF1 Interacting Nuclear Factor 2)",
                "ACD (Adrenocortical Dysplasia Homolog)",
                "POT1 (Protection of Telomeres 1)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "TERF2IP (TERF2 Interacting Protein)",
                "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
                "PARN (Poly(A)-Specific Ribonuclease)",
                "NOP10 (NOP10 Ribonucleoprotein)",
                "NHP2 (NHP2 Ribonucleoprotein)",
                "DKC1 (Dyskerin Pseudouridine Synthase 1)",
                "WRAP53 (WD Repeat Containing Antisense to TP53)",
                "HNRNPA1 (Heterogeneous Nuclear Ribonucleoprotein A1)",
                "HNRNPA2B1 (Heterogeneous Nuclear Ribonucleoprotein A2/B1)",
                "TCAB1 (Telomerase Cajal Body Protein 1)",
                "NAF1 (Nuclear Assembly Factor 1 Ribonucleoprotein)",
                "PINX1 (PIN2/TERF1 Interacting Telomerase Inhibitor 1)",
                "MCRS1 (Microspherule Protein 1)",
                "RPA1 (Replication Protein A1)",
                "STN1 (STN1 Subunit of CST Complex)",
                "CTC1 (CTS Telomere Maintenance Complex Component 1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ACD (Adrenocortical Dysplasia Homolog)",
                "CTC1 (CTS Telomere Maintenance Complex Component 1)",
                "DKC1 (Dyskerin Pseudouridine Synthase 1)",
                "HNRNPA1 (Heterogeneous Nuclear Ribonucleoprotein A1)",
                "HNRNPA2B1 (Heterogeneous Nuclear Ribonucleoprotein A2/B1)",
                "MCRS1 (Microspherule Protein 1)",
                "NAF1 (Nuclear Assembly Factor 1 Ribonucleoprotein)",
                "NHP2 (NHP2 Ribonucleoprotein)",
                "NOP10 (NOP10 Ribonucleoprotein)",
                "PARN (Poly(A)-Specific Ribonuclease)",
                "PINX1 (PIN2/TERF1 Interacting Telomerase Inhibitor 1)",
                "POT1 (Protection of Telomeres 1)",
                "RPA1 (Replication Protein A1)",
                "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
                "STN1 (STN1 Subunit of CST Complex)",
                "TCAB1 (Telomerase Cajal Body Protein 1)",
                "TERC (Telomerase RNA Component)",
                "TERF1 (Telomeric Repeat Binding Factor 1)",
                "TERF2 (Telomeric Repeat Binding Factor 2)",
                "TERF2IP (TERF2 Interacting Protein)",
                "TERT (Telomerase Reverse Transcriptase)",
                "TINF2 (TERF1 Interacting Nuclear Factor 2)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "WRAP53 (WD Repeat Containing Antisense to TP53)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "Telomerase reverse transcriptase (TERT)",
            "Telomerase-associated protein 1 (TEP1)",
            "Protection of telomeres 1 (POT1)",
            "Repressor activator protein 1 (RAP1)",
            "TRF1-interacting nuclear protein 2 (TIN2)",
            "TRF1-interacting protein 2 (TINF2)",
            "TRF1-interacting protein 1 (TINF1)",
            "Telomeric repeat binding factor 1 (TERF1)",
            "Telomeric repeat binding factor 2 (TERF2)",
            "Telomeric repeat binding factor 2 interacting protein 1 (TERF2IP)",
            "Regulator of telomere elongation helicase 1 (RTEL1)",
            "Shelterin complex subunit POT1 (POT1)",
            "Shelterin complex subunit TRF1 (TERF1)",
            "Shelterin complex subunit TRF2 (TERF2)",
            "Shelterin complex subunit RAP1 (TERF2IP)",
            "Shelterin complex subunit TIN2 (TINF2)",
            "Shelterin complex subunit TPP1 (ACD)",
            "Shelterin complex subunit TNKS1BP1 (TNKS1BP1)",
            "Shelterin complex subunit TNKS2 (TNKS2)",
            "CST telomere replication complex subunit CTC1 (CTC1)",
            "CST telomere replication complex subunit STN1 (OBFC1)",
            "CST telomere replication complex subunit TEN1 (TINF2)",
            "Telomere elongation helicase (RTEL1)",
            "Telomere length regulation protein TEL2 (TELO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase-associated protein 1 (TEP1)",
                "Protection of telomeres 1 (POT1)",
                "Repressor activator protein 1 (RAP1)",
                "TRF1-interacting nuclear protein 2 (TIN2)",
                "TRF1-interacting protein 2 (TINF2)",
                "TRF1-interacting protein 1 (TINF1)",
                "Telomeric repeat binding factor 1 (TERF1)",
                "Telomeric repeat binding factor 2 (TERF2)",
                "Telomeric repeat binding factor 2 interacting protein 1 (TERF2IP)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Shelterin complex subunit POT1 (POT1)",
                "Shelterin complex subunit TRF1 (TERF1)",
                "Shelterin complex subunit TRF2 (TERF2)",
                "Shelterin complex subunit RAP1 (TERF2IP)",
                "Shelterin complex subunit TIN2 (TINF2)",
                "Shelterin complex subunit TPP1 (ACD)",
                "Shelterin complex subunit TNKS1BP1 (TNKS1BP1)",
                "Shelterin complex subunit TNKS2 (TNKS2)",
                "CST telomere replication complex subunit CTC1 (CTC1)",
                "CST telomere replication complex subunit STN1 (OBFC1)",
                "CST telomere replication complex subunit TEN1 (TINF2)",
                "Telomere elongation helicase (RTEL1)",
                "Telomere length regulation protein TEL2 (TELO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "CST telomere replication complex subunit CTC1 (CTC1)",
                "CST telomere replication complex subunit STN1 (OBFC1)",
                "CST telomere replication complex subunit TEN1 (TINF2)",
                "Protection of telomeres 1 (POT1)",
                "Regulator of telomere elongation helicase 1 (RTEL1)",
                "Repressor activator protein 1 (RAP1)",
                "Shelterin complex subunit POT1 (POT1)",
                "Shelterin complex subunit RAP1 (TERF2IP)",
                "Shelterin complex subunit TIN2 (TINF2)",
                "Shelterin complex subunit TNKS1BP1 (TNKS1BP1)",
                "Shelterin complex subunit TNKS2 (TNKS2)",
                "Shelterin complex subunit TPP1 (ACD)",
                "Shelterin complex subunit TRF1 (TERF1)",
                "Shelterin complex subunit TRF2 (TERF2)",
                "TRF1-interacting nuclear protein 2 (TIN2)",
                "TRF1-interacting protein 1 (TINF1)",
                "TRF1-interacting protein 2 (TINF2)",
                "Telomerase reverse transcriptase (TERT)",
                "Telomerase-associated protein 1 (TEP1)",
                "Telomere elongation helicase (RTEL1)",
                "Telomere length regulation protein TEL2 (TELO2)",
                "Telomeric repeat binding factor 1 (TERF1)",
                "Telomeric repeat binding factor 2 (TERF2)",
                "Telomeric repeat binding factor 2 interacting protein 1 (TERF2IP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (Telomerase Reverse Transcriptase)",
            "TERC (Telomerase RNA Component)",
            "POT1 (Protection of Telomeres 1)",
            "TIN2 (TRF1-Interacting Nuclear Factor 2)",
            "TPP1 (Tripeptidyl Peptidase 1)",
            "RAP1 (Repressor/Activator Protein 1)",
            "TRF1 (Telomeric Repeat-Binding Factor 1)",
            "TRF2 (Telomeric Repeat-Binding Factor 2)",
            "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
            "TNKS (Tankyrase)",
            "TNKS2 (Tankyrase 2)",
            "NOP10 (Nucleolar Protein 10)",
            "NHP2 (Non-Histone Chromosome Protein 2)",
            "GAR1 (Glycine-Arginine-Rich Protein 1)",
            "DKC1 (Dyskeratosis Congenita 1, Dyskerin)",
            "WRAP53 (WD Repeat-Containing Antisense to TP53)",
            "PINX1 (PIN2/TERF1-Interacting, Telomerase Inhibitor 1)",
            "PTOP (POT1 and TIN2 Organizing Protein)",
            "AKTIP (AKT-Interacting Protein)",
            "TCAB1 (Telomerase Cajal Body Protein 1)",
            "PARN (Poly(A)-Specific Ribonuclease)",
            "RTEL1-LIKE (Regulator of Telomere Elongation Helicase 1-Like)",
            "OBFC1 (Oligonucleotide/Oligosaccharide-Binding Fold Containing 1)",
            "TINF2 (TERF1-Interacting Nuclear Factor 2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (Telomerase Reverse Transcriptase)",
                "TERC (Telomerase RNA Component)",
                "POT1 (Protection of Telomeres 1)",
                "TIN2 (TRF1-Interacting Nuclear Factor 2)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "RAP1 (Repressor/Activator Protein 1)",
                "TRF1 (Telomeric Repeat-Binding Factor 1)",
                "TRF2 (Telomeric Repeat-Binding Factor 2)",
                "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
                "TNKS (Tankyrase)",
                "TNKS2 (Tankyrase 2)",
                "NOP10 (Nucleolar Protein 10)",
                "NHP2 (Non-Histone Chromosome Protein 2)",
                "GAR1 (Glycine-Arginine-Rich Protein 1)",
                "DKC1 (Dyskeratosis Congenita 1, Dyskerin)",
                "WRAP53 (WD Repeat-Containing Antisense to TP53)",
                "PINX1 (PIN2/TERF1-Interacting, Telomerase Inhibitor 1)",
                "PTOP (POT1 and TIN2 Organizing Protein)",
                "AKTIP (AKT-Interacting Protein)",
                "TCAB1 (Telomerase Cajal Body Protein 1)",
                "PARN (Poly(A)-Specific Ribonuclease)",
                "RTEL1-LIKE (Regulator of Telomere Elongation Helicase 1-Like)",
                "OBFC1 (Oligonucleotide/Oligosaccharide-Binding Fold Containing 1)",
                "TINF2 (TERF1-Interacting Nuclear Factor 2)"
            ],
            "mismatches": [],
            "true_referents": [
                "AKTIP (AKT-Interacting Protein)",
                "DKC1 (Dyskeratosis Congenita 1, Dyskerin)",
                "GAR1 (Glycine-Arginine-Rich Protein 1)",
                "NHP2 (Non-Histone Chromosome Protein 2)",
                "NOP10 (Nucleolar Protein 10)",
                "OBFC1 (Oligonucleotide/Oligosaccharide-Binding Fold Containing 1)",
                "PARN (Poly(A)-Specific Ribonuclease)",
                "PINX1 (PIN2/TERF1-Interacting, Telomerase Inhibitor 1)",
                "POT1 (Protection of Telomeres 1)",
                "PTOP (POT1 and TIN2 Organizing Protein)",
                "RAP1 (Repressor/Activator Protein 1)",
                "RTEL1 (Regulator of Telomere Elongation Helicase 1)",
                "RTEL1-LIKE (Regulator of Telomere Elongation Helicase 1-Like)",
                "TCAB1 (Telomerase Cajal Body Protein 1)",
                "TERC (Telomerase RNA Component)",
                "TERT (Telomerase Reverse Transcriptase)",
                "TIN2 (TRF1-Interacting Nuclear Factor 2)",
                "TINF2 (TERF1-Interacting Nuclear Factor 2)",
                "TNKS (Tankyrase)",
                "TNKS2 (Tankyrase 2)",
                "TPP1 (Tripeptidyl Peptidase 1)",
                "TRF1 (Telomeric Repeat-Binding Factor 1)",
                "TRF2 (Telomeric Repeat-Binding Factor 2)",
                "WRAP53 (WD Repeat-Containing Antisense to TP53)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERT (Telomerase Reverse Transcriptase) gene (TERT)",
            "TERC (Telomerase RNA Component) gene (TERC)",
            "TRF1 (Telomere Repeat Factor 1) gene",
            "TRF2 (Telomere Repeat Factor 2) gene",
            "Rap1 (Rapidly Accelerated Fibrosarcoma 1) gene",
            "Pot1 (Protection of Telomeres 1) gene",
            "Pot1b (Protection of Telomeres 1B) gene",
            "TPP1 (Telomerase-associated Protein 1) gene",
            "EST1 (Est1) gene",
            "EST2 (Est2) gene",
            "MRE11 (Meiotic Recombination 11) gene",
            "NBS1 (Nijmegen Breakage Syndrome 1) gene",
            "ATM (Ataxia-Telangiectasia Mutated) gene",
            "ATR (Ataxia-Telangiectasia and Rad3-related) gene",
            "RPA1 (Replication Protein A 1) gene",
            "RPA2 (Replication Protein A 2) gene",
            "RPA3 (Replication Protein A 3) gene",
            "BRCA1 (Breast Cancer 1) gene",
            "BRCA2 (Breast Cancer 2) gene",
            "BLM (Bloom Syndrome) gene",
            "WRN (Werner Syndrome) gene",
            "Ku70 (Ku Autoantigen 70) gene",
            "Ku80 (Ku Autoantigen 80) gene",
            "DNA-PKcs (DNA-dependent Protein Kinase catalytic subunit) gene"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERT (Telomerase Reverse Transcriptase) gene (TERT)",
                "TERC (Telomerase RNA Component) gene (TERC)",
                "TRF1 (Telomere Repeat Factor 1) gene",
                "TRF2 (Telomere Repeat Factor 2) gene",
                "Rap1 (Rapidly Accelerated Fibrosarcoma 1) gene",
                "Pot1 (Protection of Telomeres 1) gene",
                "Pot1b (Protection of Telomeres 1B) gene",
                "TPP1 (Telomerase-associated Protein 1) gene",
                "EST1 (Est1) gene",
                "EST2 (Est2) gene",
                "MRE11 (Meiotic Recombination 11) gene",
                "NBS1 (Nijmegen Breakage Syndrome 1) gene",
                "ATM (Ataxia-Telangiectasia Mutated) gene",
                "ATR (Ataxia-Telangiectasia and Rad3-related) gene",
                "RPA1 (Replication Protein A 1) gene",
                "RPA2 (Replication Protein A 2) gene",
                "RPA3 (Replication Protein A 3) gene",
                "BRCA1 (Breast Cancer 1) gene",
                "BRCA2 (Breast Cancer 2) gene",
                "BLM (Bloom Syndrome) gene",
                "WRN (Werner Syndrome) gene",
                "Ku70 (Ku Autoantigen 70) gene",
                "Ku80 (Ku Autoantigen 80) gene",
                "DNA-PKcs (DNA-dependent Protein Kinase catalytic subunit) gene"
            ],
            "mismatches": [],
            "true_referents": [
                "ATM (Ataxia-Telangiectasia Mutated) gene",
                "ATR (Ataxia-Telangiectasia and Rad3-related) gene",
                "BLM (Bloom Syndrome) gene",
                "BRCA1 (Breast Cancer 1) gene",
                "BRCA2 (Breast Cancer 2) gene",
                "DNA-PKcs (DNA-dependent Protein Kinase catalytic subunit) gene",
                "EST1 (Est1) gene",
                "EST2 (Est2) gene",
                "Ku70 (Ku Autoantigen 70) gene",
                "Ku80 (Ku Autoantigen 80) gene",
                "MRE11 (Meiotic Recombination 11) gene",
                "NBS1 (Nijmegen Breakage Syndrome 1) gene",
                "Pot1 (Protection of Telomeres 1) gene",
                "Pot1b (Protection of Telomeres 1B) gene",
                "RPA1 (Replication Protein A 1) gene",
                "RPA2 (Replication Protein A 2) gene",
                "RPA3 (Replication Protein A 3) gene",
                "Rap1 (Rapidly Accelerated Fibrosarcoma 1) gene",
                "TERC (Telomerase RNA Component) gene (TERC)",
                "TERT (Telomerase Reverse Transcriptase) gene (TERT)",
                "TPP1 (Telomerase-associated Protein 1) gene",
                "TRF1 (Telomere Repeat Factor 1) gene",
                "TRF2 (Telomere Repeat Factor 2) gene",
                "WRN (Werner Syndrome) gene"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            "TERF1 (TERF1)",
            "TERF2 (TERF2)",
            "POT1 (POT1)",
            "TNKS (TNKS)",
            "RTEL1 (RTEL1)",
            "CTC1 (CTC1)",
            "STN1 (STN1)",
            "ZNF827 (ZNF827)",
            "Apollo (DUT-NUP98)",
            "RTEL1-TNKS (RTEL1-TNKS)",
            "TRF1 (TRF1)",
            "TRF2 (TRF2)",
            "TPP1 (TPP1)",
            "POT1-TPP1 (POT1-TPP1)",
            "DNase-like protein (DNase-like)",
            "Apollo-DUT (Apollo-DUT)",
            "TNKS- RTEL1 (TNKS- RTEL1)",
            "Ctc1-Stn1-Ten1 (CST)",
            "Ten1 (Ten1)",
            "Stn1 (Stn1)",
            "Ctc1 (Ctc1)",
            "Rap1 (Rap1)",
            "Pif1 (Pif1)",
            "TINF2 (TINF2)",
            "DCLRE1C (DCLRE1C)",
            "ATM (ATM)",
            "ATR (ATR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "TERF1 (TERF1)",
                "TERF2 (TERF2)",
                "POT1 (POT1)",
                "TNKS (TNKS)",
                "RTEL1 (RTEL1)",
                "CTC1 (CTC1)",
                "STN1 (STN1)",
                "ZNF827 (ZNF827)",
                "Apollo (DUT-NUP98)",
                "RTEL1-TNKS (RTEL1-TNKS)",
                "TRF1 (TRF1)",
                "TRF2 (TRF2)",
                "TPP1 (TPP1)",
                "POT1-TPP1 (POT1-TPP1)",
                "DNase-like protein (DNase-like)",
                "Apollo-DUT (Apollo-DUT)",
                "TNKS- RTEL1 (TNKS- RTEL1)",
                "Ctc1-Stn1-Ten1 (CST)",
                "Ten1 (Ten1)",
                "Stn1 (Stn1)",
                "Ctc1 (Ctc1)",
                "Rap1 (Rap1)",
                "Pif1 (Pif1)",
                "TINF2 (TINF2)"
            ],
            "mismatches": [
                "DCLRE1C (DCLRE1C)",
                "ATM (ATM)",
                "ATR (ATR)"
            ],
            "true_referents": [
                "Apollo (DUT-NUP98)",
                "Apollo-DUT (Apollo-DUT)",
                "CTC1 (CTC1)",
                "Ctc1 (Ctc1)",
                "Ctc1-Stn1-Ten1 (CST)",
                "DNase-like protein (DNase-like)",
                "POT1 (POT1)",
                "POT1-TPP1 (POT1-TPP1)",
                "Pif1 (Pif1)",
                "RTEL1 (RTEL1)",
                "RTEL1-TNKS (RTEL1-TNKS)",
                "Rap1 (Rap1)",
                "STN1 (STN1)",
                "Stn1 (Stn1)",
                "TERF1 (TERF1)",
                "TERF2 (TERF2)",
                "TINF2 (TINF2)",
                "TNKS (TNKS)",
                "TNKS- RTEL1 (TNKS- RTEL1)",
                "TPP1 (TPP1)",
                "TRF1 (TRF1)",
                "TRF2 (TRF2)",
                "Ten1 (Ten1)",
                "ZNF827 (ZNF827)"
            ],
            "TP": 24,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "telomere maintenance gene",
        "domain": "biology",
        "response": [
            {
                "Referent": "BRCA1",
                "Canonical name": "breast cancer type 1 susceptibility protein"
            },
            {
                "Referent": "ATM",
                "Canonical name": "ataxia-telangiectasia mutated"
            },
            {
                "Referent": "RAD50",
                "Canonical name": "RAD50 protein"
            },
            {
                "Referent": "NBS1",
                "Canonical name": "Nijmegen breakage syndrome 1 protein"
            },
            {
                "Referent": "RAD52",
                "Canonical name": "RAD52 protein"
            },
            {
                "Referent": "MRE11A",
                "Canonical name": "meiotic recombination 11 homolog A protein"
            },
            {
                "Referent": "RAD51",
                "Canonical name": "RAD51 recombinase"
            },
            {
                "Referent": "TP53",
                "Canonical name": "tumor protein p53"
            },
            {
                "Referent": "BLM",
                "Canonical name": "bloom syndrome protein"
            },
            {
                "Referent": "WRN",
                "Canonical name": "Werner syndrome-like protein"
            },
            {
                "Referent": "POT1",
                "Canonical name": "protection of telomeres 1 protein"
            },
            {
                "Referent": "TPP1",
                "Canonical name": "TPP1 protein"
            },
            {
                "Referent": "PARP1",
                "Canonical name": "poly (ADP-ribose) polymerase family member 1"
            },
            {
                "Referent": "RAP1",
                "Canonical name": "repressor activator protein 1"
            },
            {
                "Referent": "FANCJ",
                "Canonical name": "Fanconi anemia complementation group J protein"
            },
            {
                "Referent": "RAD54L",
                "Canonical name": "RAD54L protein"
            },
            {
                "Referent": "XRCC6",
                "Canonical name": "X-ray repair cross-complementing protein 6"
            },
            {
                "Referent": "MRE11B",
                "Canonical name": "meiotic recombination 11 homolog B protein"
            },
            {
                "Referent": "XRCC5",
                "Canonical name": "X-ray repair cross-complementing protein 5"
            },
            {
                "Referent": "XRCC7",
                "Canonical name": "X-ray repair cross-complementing protein 7"
            },
            {
                "Referent": "RAD54B",
                "Canonical name": "RAD54B protein"
            },
            {
                "Referent": "RAD51C",
                "Canonical name": "RAD51C recombinase"
            },
            {
                "Referent": "RAD51D",
                "Canonical name": "RAD51D recombinase"
            },
            {
                "Referent": "RAD52B",
                "Canonical name": "RAD52B protein"
            },
            {
                "Referent": "RAD52L1",
                "Canonical name": "RAD52 homolog 1"
            },
            {
                "Referent": "RAD52L2",
                "Canonical name": "RAD52 homolog 2"
            },
            {
                "Referent": "RAD54L2",
                "Canonical name": "RAD54L2 protein"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BRCA1",
                "ATM",
                "RAD50",
                "NBS1",
                "RAD52",
                "MRE11A",
                "RAD51",
                "TP53",
                "BLM",
                "WRN",
                "POT1",
                "TPP1",
                "PARP1",
                "RAP1",
                "FANCJ",
                "RAD54L",
                "XRCC6",
                "MRE11B",
                "XRCC5",
                "XRCC7",
                "RAD54B",
                "RAD51C",
                "RAD51D",
                "RAD52B"
            ],
            "mismatches": [
                "RAD52L1",
                "RAD52L2",
                "RAD54L2"
            ],
            "true_referents": [
                "{\"Referent\": \"ATM\", \"Canonical name\": \"ataxia-telangiectasia mutated\"}",
                "{\"Referent\": \"BLM\", \"Canonical name\": \"bloom syndrome protein\"}",
                "{\"Referent\": \"BRCA1\", \"Canonical name\": \"breast cancer type 1 susceptibility protein\"}",
                "{\"Referent\": \"FANCJ\", \"Canonical name\": \"Fanconi anemia complementation group J protein\"}",
                "{\"Referent\": \"MRE11A\", \"Canonical name\": \"meiotic recombination 11 homolog A protein\"}",
                "{\"Referent\": \"MRE11B\", \"Canonical name\": \"meiotic recombination 11 homolog B protein\"}",
                "{\"Referent\": \"NBS1\", \"Canonical name\": \"Nijmegen breakage syndrome 1 protein\"}",
                "{\"Referent\": \"PARP1\", \"Canonical name\": \"poly (ADP-ribose) polymerase family member 1\"}",
                "{\"Referent\": \"POT1\", \"Canonical name\": \"protection of telomeres 1 protein\"}",
                "{\"Referent\": \"RAD50\", \"Canonical name\": \"RAD50 protein\"}",
                "{\"Referent\": \"RAD51\", \"Canonical name\": \"RAD51 recombinase\"}",
                "{\"Referent\": \"RAD51C\", \"Canonical name\": \"RAD51C recombinase\"}",
                "{\"Referent\": \"RAD51D\", \"Canonical name\": \"RAD51D recombinase\"}",
                "{\"Referent\": \"RAD52\", \"Canonical name\": \"RAD52 protein\"}",
                "{\"Referent\": \"RAD52B\", \"Canonical name\": \"RAD52B protein\"}",
                "{\"Referent\": \"RAD54B\", \"Canonical name\": \"RAD54B protein\"}",
                "{\"Referent\": \"RAD54L\", \"Canonical name\": \"RAD54L protein\"}",
                "{\"Referent\": \"RAP1\", \"Canonical name\": \"repressor activator protein 1\"}",
                "{\"Referent\": \"TP53\", \"Canonical name\": \"tumor protein p53\"}",
                "{\"Referent\": \"TPP1\", \"Canonical name\": \"TPP1 protein\"}",
                "{\"Referent\": \"WRN\", \"Canonical name\": \"Werner syndrome-like protein\"}",
                "{\"Referent\": \"XRCC5\", \"Canonical name\": \"X-ray repair cross-complementing protein 5\"}",
                "{\"Referent\": \"XRCC6\", \"Canonical name\": \"X-ray repair cross-complementing protein 6\"}",
                "{\"Referent\": \"XRCC7\", \"Canonical name\": \"X-ray repair cross-complementing protein 7\"}"
            ],
            "TP": 24,
            "FP": 3,
            "FN": 0
        }
    }
]