[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "eIF4E (eIF4E)",
            "eIF4G (eIF4G)",
            "eIF4A (eIF4A)",
            "eIF2B (eIF2B)",
            "eIF5 (eIF5)",
            "PABP (PABP)",
            "eIF3 (eIF3)",
            "eIF1 (eIF1)",
            "eIF6 (eIF6)",
            "eIF4B (eIF4B)",
            "eIF1A (eIF1A)",
            "p97 (p97)",
            "eIF2C (eIF2C)",
            "p38 (p38)",
            "eIF2 (eIF2)",
            "p28 (p28)",
            "p72 (p72)",
            "p220 (p220)",
            "p48 (p48)",
            "p62 (p62)",
            "p110 (p110)",
            "p40 (p40)",
            "p13 (p13)",
            "p22 (p22)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "eIF4E (eIF4E)",
                "eIF4G (eIF4G)",
                "eIF4A (eIF4A)",
                "eIF2B (eIF2B)",
                "eIF5 (eIF5)",
                "PABP (PABP)",
                "eIF3 (eIF3)",
                "eIF1 (eIF1)",
                "eIF6 (eIF6)",
                "eIF4B (eIF4B)",
                "eIF1A (eIF1A)",
                "p97 (p97)",
                "eIF2C (eIF2C)",
                "p38 (p38)",
                "eIF2 (eIF2)",
                "p28 (p28)",
                "p72 (p72)",
                "p220 (p220)",
                "p48 (p48)",
                "p62 (p62)",
                "p110 (p110)",
                "p40 (p40)",
                "p13 (p13)",
                "p22 (p22)"
            ],
            "mismatches": [],
            "true_referents": [
                "PABP (PABP)",
                "eIF1 (eIF1)",
                "eIF1A (eIF1A)",
                "eIF2 (eIF2)",
                "eIF2B (eIF2B)",
                "eIF2C (eIF2C)",
                "eIF3 (eIF3)",
                "eIF4A (eIF4A)",
                "eIF4B (eIF4B)",
                "eIF4E (eIF4E)",
                "eIF4G (eIF4G)",
                "eIF5 (eIF5)",
                "eIF6 (eIF6)",
                "p110 (p110)",
                "p13 (p13)",
                "p22 (p22)",
                "p220 (p220)",
                "p28 (p28)",
                "p38 (p38)",
                "p40 (p40)",
                "p48 (p48)",
                "p62 (p62)",
                "p72 (p72)",
                "p97 (p97)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic Initiation Factor 2 (eIF2)",
            "Eukaryotic Initiation Factor 4E (eIF4E)",
            "Eukaryotic Initiation Factor 4G (eIF4G)",
            "Eukaryotic Initiation Factor 4A (eIF4A)",
            "Eukaryotic Initiation Factor 3 (eIF3)",
            "Poly(A)-Binding Protein (PABP)",
            "Eukaryotic Initiation Factor 5A (eIF5A)",
            "Eukaryotic Initiation Factor 1A (eIF1A)",
            "Eukaryotic Initiation Factor 2B (eIF2B)",
            "Eukaryotic Initiation Factor 5 (eIF5)",
            "Eukaryotic Initiation Factor 6 (eIF6)",
            "Eukaryotic Initiation Factor 1 (eIF1)",
            "Eukaryotic Initiation Factor 2A (eIF2A)",
            "Eukaryotic Initiation Factor 3 Subunit 3 (eIF3S3)",
            "Eukaryotic Initiation Factor 3 Subunit 5 (eIF3S5)",
            "Eukaryotic Initiation Factor 3 Subunit 7 (eIF3S7)",
            "Eukaryotic Initiation Factor 3 Subunit 9 (eIF3S9)",
            "Eukaryotic Initiation Factor 3 Subunit 11 (eIF3S11)",
            "Eukaryotic Initiation Factor 4E-Binding Protein 1 (4E-BP1)",
            "Eukaryotic Initiation Factor 4E-Binding Protein 2 (4E-BP2)",
            "Eukaryotic Initiation Factor 4E-Binding Protein 3 (4E-BP3)",
            "S6 Kinase (S6K)",
            "Ribosomal Protein S6 (RPS6)",
            "Eukaryotic Initiation Factor 4B (eIF4B)",
            "Eukaryotic Initiation Factor 4H (eIF4H)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic Initiation Factor 2 (eIF2)",
                "Eukaryotic Initiation Factor 4E (eIF4E)",
                "Eukaryotic Initiation Factor 4G (eIF4G)",
                "Eukaryotic Initiation Factor 4A (eIF4A)",
                "Eukaryotic Initiation Factor 3 (eIF3)",
                "Poly(A)-Binding Protein (PABP)",
                "Eukaryotic Initiation Factor 5A (eIF5A)",
                "Eukaryotic Initiation Factor 1A (eIF1A)",
                "Eukaryotic Initiation Factor 2B (eIF2B)",
                "Eukaryotic Initiation Factor 5 (eIF5)",
                "Eukaryotic Initiation Factor 6 (eIF6)",
                "Eukaryotic Initiation Factor 1 (eIF1)",
                "Eukaryotic Initiation Factor 2A (eIF2A)",
                "Eukaryotic Initiation Factor 3 Subunit 3 (eIF3S3)",
                "Eukaryotic Initiation Factor 3 Subunit 5 (eIF3S5)",
                "Eukaryotic Initiation Factor 3 Subunit 7 (eIF3S7)",
                "Eukaryotic Initiation Factor 3 Subunit 9 (eIF3S9)",
                "Eukaryotic Initiation Factor 3 Subunit 11 (eIF3S11)",
                "Eukaryotic Initiation Factor 4E-Binding Protein 1 (4E-BP1)",
                "Eukaryotic Initiation Factor 4E-Binding Protein 2 (4E-BP2)",
                "Eukaryotic Initiation Factor 4E-Binding Protein 3 (4E-BP3)",
                "S6 Kinase (S6K)",
                "Ribosomal Protein S6 (RPS6)",
                "Eukaryotic Initiation Factor 4B (eIF4B)"
            ],
            "mismatches": [
                "Eukaryotic Initiation Factor 4H (eIF4H)"
            ],
            "true_referents": [
                "Eukaryotic Initiation Factor 1 (eIF1)",
                "Eukaryotic Initiation Factor 1A (eIF1A)",
                "Eukaryotic Initiation Factor 2 (eIF2)",
                "Eukaryotic Initiation Factor 2A (eIF2A)",
                "Eukaryotic Initiation Factor 2B (eIF2B)",
                "Eukaryotic Initiation Factor 3 (eIF3)",
                "Eukaryotic Initiation Factor 3 Subunit 11 (eIF3S11)",
                "Eukaryotic Initiation Factor 3 Subunit 3 (eIF3S3)",
                "Eukaryotic Initiation Factor 3 Subunit 5 (eIF3S5)",
                "Eukaryotic Initiation Factor 3 Subunit 7 (eIF3S7)",
                "Eukaryotic Initiation Factor 3 Subunit 9 (eIF3S9)",
                "Eukaryotic Initiation Factor 4A (eIF4A)",
                "Eukaryotic Initiation Factor 4B (eIF4B)",
                "Eukaryotic Initiation Factor 4E (eIF4E)",
                "Eukaryotic Initiation Factor 4E-Binding Protein 1 (4E-BP1)",
                "Eukaryotic Initiation Factor 4E-Binding Protein 2 (4E-BP2)",
                "Eukaryotic Initiation Factor 4E-Binding Protein 3 (4E-BP3)",
                "Eukaryotic Initiation Factor 4G (eIF4G)",
                "Eukaryotic Initiation Factor 5 (eIF5)",
                "Eukaryotic Initiation Factor 5A (eIF5A)",
                "Eukaryotic Initiation Factor 6 (eIF6)",
                "Poly(A)-Binding Protein (PABP)",
                "Ribosomal Protein S6 (RPS6)",
                "S6 Kinase (S6K)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic initiation factor 2 (eIF2)",
            "Eukaryotic initiation factor 2B (eIF2B)",
            "Eukaryotic initiation factor 4E (eIF4E)",
            "Eukaryotic initiation factor 4G (eIF4G)",
            "Eukaryotic initiation factor 4B (eIF4B)",
            "Eukaryotic initiation factor 3 (eIF3)",
            "Eukaryotic initiation factor 5 (eIF5)",
            "Eukaryotic initiation factor 5B (eIF5B)",
            "Eukaryotic initiation factor 1 (eIF1)",
            "Eukaryotic initiation factor 1A (eIF1A)",
            "Eukaryotic initiation factor 6 (eIF6)",
            "Elongation factor 1 alpha (EF1A)",
            "Elongation factor 2 (EF2)",
            "Elongation factor 4 (EF4)",
            "Elongation factor 5 (EF5)",
            "Elongation factor 3 (EF3)",
            "Ribosomal protein S6 kinase (S6K)",
            "Eukaryotic release factor 1 (eRF1)",
            "Eukaryotic release factor 3 (eRF3)",
            "Programmed cell death protein 4 (PDCD4)",
            "4E-BP1 (EIF4EBP1)",
            "4E-BP2 (EIF4EBP2)",
            "4E-BP3 (EIF4EBP3)",
            "PABP (Poly(A)-binding protein)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic initiation factor 2 (eIF2)",
                "Eukaryotic initiation factor 2B (eIF2B)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic initiation factor 4G (eIF4G)",
                "Eukaryotic initiation factor 4B (eIF4B)",
                "Eukaryotic initiation factor 3 (eIF3)",
                "Eukaryotic initiation factor 5 (eIF5)",
                "Eukaryotic initiation factor 5B (eIF5B)",
                "Eukaryotic initiation factor 1 (eIF1)",
                "Eukaryotic initiation factor 1A (eIF1A)",
                "Eukaryotic initiation factor 6 (eIF6)",
                "Elongation factor 1 alpha (EF1A)",
                "Elongation factor 2 (EF2)",
                "Elongation factor 4 (EF4)",
                "Elongation factor 5 (EF5)",
                "Elongation factor 3 (EF3)",
                "Ribosomal protein S6 kinase (S6K)",
                "Eukaryotic release factor 1 (eRF1)",
                "Eukaryotic release factor 3 (eRF3)",
                "Programmed cell death protein 4 (PDCD4)",
                "4E-BP1 (EIF4EBP1)",
                "4E-BP2 (EIF4EBP2)",
                "4E-BP3 (EIF4EBP3)",
                "PABP (Poly(A)-binding protein)"
            ],
            "mismatches": [],
            "true_referents": [
                "4E-BP1 (EIF4EBP1)",
                "4E-BP2 (EIF4EBP2)",
                "4E-BP3 (EIF4EBP3)",
                "Elongation factor 1 alpha (EF1A)",
                "Elongation factor 2 (EF2)",
                "Elongation factor 3 (EF3)",
                "Elongation factor 4 (EF4)",
                "Elongation factor 5 (EF5)",
                "Eukaryotic initiation factor 1 (eIF1)",
                "Eukaryotic initiation factor 1A (eIF1A)",
                "Eukaryotic initiation factor 2 (eIF2)",
                "Eukaryotic initiation factor 2B (eIF2B)",
                "Eukaryotic initiation factor 3 (eIF3)",
                "Eukaryotic initiation factor 4B (eIF4B)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic initiation factor 4G (eIF4G)",
                "Eukaryotic initiation factor 5 (eIF5)",
                "Eukaryotic initiation factor 5B (eIF5B)",
                "Eukaryotic initiation factor 6 (eIF6)",
                "Eukaryotic release factor 1 (eRF1)",
                "Eukaryotic release factor 3 (eRF3)",
                "PABP (Poly(A)-binding protein)",
                "Programmed cell death protein 4 (PDCD4)",
                "Ribosomal protein S6 kinase (S6K)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "eIF4E (eIF4E)",
            "eIF4G (eIF4G)",
            "eIF3 (eIF3)",
            "eIF2 (eIF2)",
            "eIF2\u03b1 kinase 1 (PKR)",
            "Hemin-regulated inhibitor kinase (HRI)",
            "GCN2 (GCN2)",
            "PERK (PERK)",
            "4E-BP1 (4E-BP1)",
            "MNK1/2 (MNK1/2)",
            "S6K1 (S6K1)",
            "PTEN-induced kinase 1 (PINK1)",
            "Ribosomal protein S6 kinase beta-1 (S6K\u03b21)",
            "eIF5B (eIF5B)",
            "Decapping protein DCP1 (DCP1)",
            "Lazarus (LAZ3L)",
            "TIA-1 (TIA-1)",
            "TTP (TTP)",
            "AUF1 (AUF1)",
            "HuR (HuR)",
            "eIF6 (eIF6)",
            "eIF1 (eIF1)",
            "eIF1A (eIF1A)",
            "eEF1A (eEF1A)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "eIF4E (eIF4E)",
                "eIF4G (eIF4G)",
                "eIF3 (eIF3)",
                "eIF2 (eIF2)",
                "eIF2\u03b1 kinase 1 (PKR)",
                "Hemin-regulated inhibitor kinase (HRI)",
                "GCN2 (GCN2)",
                "PERK (PERK)",
                "4E-BP1 (4E-BP1)",
                "MNK1/2 (MNK1/2)",
                "S6K1 (S6K1)",
                "PTEN-induced kinase 1 (PINK1)",
                "Ribosomal protein S6 kinase beta-1 (S6K\u03b21)",
                "eIF5B (eIF5B)",
                "Decapping protein DCP1 (DCP1)",
                "Lazarus (LAZ3L)",
                "TIA-1 (TIA-1)",
                "TTP (TTP)",
                "AUF1 (AUF1)",
                "HuR (HuR)",
                "eIF6 (eIF6)",
                "eIF1 (eIF1)",
                "eIF1A (eIF1A)",
                "eEF1A (eEF1A)"
            ],
            "mismatches": [],
            "true_referents": [
                "4E-BP1 (4E-BP1)",
                "AUF1 (AUF1)",
                "Decapping protein DCP1 (DCP1)",
                "GCN2 (GCN2)",
                "Hemin-regulated inhibitor kinase (HRI)",
                "HuR (HuR)",
                "Lazarus (LAZ3L)",
                "MNK1/2 (MNK1/2)",
                "PERK (PERK)",
                "PTEN-induced kinase 1 (PINK1)",
                "Ribosomal protein S6 kinase beta-1 (S6K\u03b21)",
                "S6K1 (S6K1)",
                "TIA-1 (TIA-1)",
                "TTP (TTP)",
                "eEF1A (eEF1A)",
                "eIF1 (eIF1)",
                "eIF1A (eIF1A)",
                "eIF2 (eIF2)",
                "eIF2\u03b1 kinase 1 (PKR)",
                "eIF3 (eIF3)",
                "eIF4E (eIF4E)",
                "eIF4G (eIF4G)",
                "eIF5B (eIF5B)",
                "eIF6 (eIF6)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic Initiation Factor 4E (eIF4E)",
            "Eukaryotic Initiation Factor 2 (eIF2)",
            "Eukaryotic Initiation Factor 3 (eIF3)",
            "Eukaryotic Initiation Factor 4G (eIF4G)",
            "Eukaryotic Initiation Factor 5 (eIF5)",
            "Eukaryotic Initiation Factor 1 (eIF1)",
            "Eukaryotic Initiation Factor 1A (eIF1A)",
            "Eukaryotic Initiation Factor 4A (eIF4A)",
            "Eukaryotic Initiation Factor 5B (eIF5B)",
            "Eukaryotic Initiation Factor 4B (eIF4B)",
            "Eukaryotic Elongation Factor 1A (eEF1A)",
            "Eukaryotic Elongation Factor 2 (eEF2)",
            "Eukaryotic Release Factor 1 (eRF1)",
            "Eukaryotic Release Factor 3 (eRF3)",
            "Ribosomal Protein S6 Kinase (S6K)",
            "Protein Kinase R (PKR)",
            "Mammalian Target of Rapamycin (mTOR)",
            "Ribosomal Protein S6 (rpS6)",
            "Ribosomal Protein L13a (RPL13A)",
            "Ribosomal Protein L26 (RPL26)",
            "Ribosomal Protein S3 (RPS3)",
            "Ribosomal Protein S5 (RPS5)",
            "Ribosomal Protein S10 (RPS10)",
            "Ribosomal Protein L7 (RPL7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic Initiation Factor 4E (eIF4E)",
                "Eukaryotic Initiation Factor 2 (eIF2)",
                "Eukaryotic Initiation Factor 3 (eIF3)",
                "Eukaryotic Initiation Factor 4G (eIF4G)",
                "Eukaryotic Initiation Factor 5 (eIF5)",
                "Eukaryotic Initiation Factor 1 (eIF1)",
                "Eukaryotic Initiation Factor 1A (eIF1A)",
                "Eukaryotic Initiation Factor 4A (eIF4A)",
                "Eukaryotic Initiation Factor 5B (eIF5B)",
                "Eukaryotic Initiation Factor 4B (eIF4B)",
                "Eukaryotic Elongation Factor 1A (eEF1A)",
                "Eukaryotic Elongation Factor 2 (eEF2)",
                "Eukaryotic Release Factor 1 (eRF1)",
                "Eukaryotic Release Factor 3 (eRF3)",
                "Ribosomal Protein S6 Kinase (S6K)",
                "Protein Kinase R (PKR)",
                "Mammalian Target of Rapamycin (mTOR)",
                "Ribosomal Protein S6 (rpS6)",
                "Ribosomal Protein L13a (RPL13A)",
                "Ribosomal Protein L26 (RPL26)",
                "Ribosomal Protein S3 (RPS3)",
                "Ribosomal Protein S5 (RPS5)",
                "Ribosomal Protein S10 (RPS10)",
                "Ribosomal Protein L7 (RPL7)"
            ],
            "mismatches": [],
            "true_referents": [
                "Eukaryotic Elongation Factor 1A (eEF1A)",
                "Eukaryotic Elongation Factor 2 (eEF2)",
                "Eukaryotic Initiation Factor 1 (eIF1)",
                "Eukaryotic Initiation Factor 1A (eIF1A)",
                "Eukaryotic Initiation Factor 2 (eIF2)",
                "Eukaryotic Initiation Factor 3 (eIF3)",
                "Eukaryotic Initiation Factor 4A (eIF4A)",
                "Eukaryotic Initiation Factor 4B (eIF4B)",
                "Eukaryotic Initiation Factor 4E (eIF4E)",
                "Eukaryotic Initiation Factor 4G (eIF4G)",
                "Eukaryotic Initiation Factor 5 (eIF5)",
                "Eukaryotic Initiation Factor 5B (eIF5B)",
                "Eukaryotic Release Factor 1 (eRF1)",
                "Eukaryotic Release Factor 3 (eRF3)",
                "Mammalian Target of Rapamycin (mTOR)",
                "Protein Kinase R (PKR)",
                "Ribosomal Protein L13a (RPL13A)",
                "Ribosomal Protein L26 (RPL26)",
                "Ribosomal Protein L7 (RPL7)",
                "Ribosomal Protein S10 (RPS10)",
                "Ribosomal Protein S3 (RPS3)",
                "Ribosomal Protein S5 (RPS5)",
                "Ribosomal Protein S6 (rpS6)",
                "Ribosomal Protein S6 Kinase (S6K)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "eIF4E (eukaryotic translation initiation factor 4E)",
            "eIF4G (eukaryotic translation initiation factor 4G)",
            "eIF3 (eukaryotic translation initiation factor 3)",
            "eIF2 (eukaryotic translation initiation factor 2)",
            "eIF5 (eukaryotic translation initiation factor 5)",
            "eIF5A (eukaryotic translation initiation factor 5A)",
            "eIF1 (eukaryotic translation initiation factor 1)",
            "eIF1A (eukaryotic translation initiation factor 1A)",
            "eIF2B (eukaryotic translation initiation factor 2B)",
            "eIF4A (eukaryotic translation initiation factor 4A)",
            "eIF4B (eukaryotic translation initiation factor 4B)",
            "eIF4H (eukaryotic translation initiation factor 4H)",
            "eIF2D (eukaryotic translation initiation factor 2D)",
            "MTOR (mechanistic target of rapamycin)",
            "S6K1 (ribosomal protein S6 kinase beta-1)",
            "4E-BP1 (eukaryotic translation initiation factor 4E-binding protein 1)",
            "CPEB (cytoplasmic polyadenylation element-binding protein)",
            "GCN2 (general control nonderepressible 2 kinase)",
            "PKR (protein kinase R)",
            "eEF1A (eukaryotic elongation factor 1 alpha)",
            "eEF2 (eukaryotic elongation factor 2)",
            "Raptor (regulatory-associated protein of mTOR)",
            "Rictor (rapamycin-insensitive companion of mTOR)",
            "CUGBP1 (CUG-binding protein 1)",
            "FMRP (Fragile X mental retardation protein)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "eIF4E (eukaryotic translation initiation factor 4E)",
                "eIF4G (eukaryotic translation initiation factor 4G)",
                "eIF3 (eukaryotic translation initiation factor 3)",
                "eIF2 (eukaryotic translation initiation factor 2)",
                "eIF5 (eukaryotic translation initiation factor 5)",
                "eIF5A (eukaryotic translation initiation factor 5A)",
                "eIF1 (eukaryotic translation initiation factor 1)",
                "eIF1A (eukaryotic translation initiation factor 1A)",
                "eIF2B (eukaryotic translation initiation factor 2B)",
                "eIF4A (eukaryotic translation initiation factor 4A)",
                "eIF4B (eukaryotic translation initiation factor 4B)",
                "eIF4H (eukaryotic translation initiation factor 4H)",
                "eIF2D (eukaryotic translation initiation factor 2D)",
                "MTOR (mechanistic target of rapamycin)",
                "S6K1 (ribosomal protein S6 kinase beta-1)",
                "4E-BP1 (eukaryotic translation initiation factor 4E-binding protein 1)",
                "CPEB (cytoplasmic polyadenylation element-binding protein)",
                "GCN2 (general control nonderepressible 2 kinase)",
                "PKR (protein kinase R)",
                "eEF1A (eukaryotic elongation factor 1 alpha)",
                "eEF2 (eukaryotic elongation factor 2)",
                "Raptor (regulatory-associated protein of mTOR)",
                "Rictor (rapamycin-insensitive companion of mTOR)",
                "CUGBP1 (CUG-binding protein 1)"
            ],
            "mismatches": [
                "FMRP (Fragile X mental retardation protein)"
            ],
            "true_referents": [
                "4E-BP1 (eukaryotic translation initiation factor 4E-binding protein 1)",
                "CPEB (cytoplasmic polyadenylation element-binding protein)",
                "CUGBP1 (CUG-binding protein 1)",
                "GCN2 (general control nonderepressible 2 kinase)",
                "MTOR (mechanistic target of rapamycin)",
                "PKR (protein kinase R)",
                "Raptor (regulatory-associated protein of mTOR)",
                "Rictor (rapamycin-insensitive companion of mTOR)",
                "S6K1 (ribosomal protein S6 kinase beta-1)",
                "eEF1A (eukaryotic elongation factor 1 alpha)",
                "eEF2 (eukaryotic elongation factor 2)",
                "eIF1 (eukaryotic translation initiation factor 1)",
                "eIF1A (eukaryotic translation initiation factor 1A)",
                "eIF2 (eukaryotic translation initiation factor 2)",
                "eIF2B (eukaryotic translation initiation factor 2B)",
                "eIF2D (eukaryotic translation initiation factor 2D)",
                "eIF3 (eukaryotic translation initiation factor 3)",
                "eIF4A (eukaryotic translation initiation factor 4A)",
                "eIF4B (eukaryotic translation initiation factor 4B)",
                "eIF4E (eukaryotic translation initiation factor 4E)",
                "eIF4G (eukaryotic translation initiation factor 4G)",
                "eIF4H (eukaryotic translation initiation factor 4H)",
                "eIF5 (eukaryotic translation initiation factor 5)",
                "eIF5A (eukaryotic translation initiation factor 5A)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "eukaryotic initiation factor 4E (eIF4E)",
            "eukaryotic initiation factor 4G (eIF4G)",
            "eukaryotic initiation factor 2 (eIF2)",
            "eukaryotic initiation factor 5 (eIF5)",
            "eukaryotic initiation factor 3 (eIF3)",
            "eukaryotic elongation factor 1 (eEF1)",
            "eukaryotic elongation factor 2 (eEF2)",
            "eukaryotic peptide chain release factor 1 (eRF1)",
            "eukaryotic peptide chain release factor 3 (eRF3)",
            "poly(A)-binding protein (PABP)",
            "eukaryotic translation initiation factor 4A (eIF4A)",
            "eukaryotic translation initiation factor 4B (eIF4B)",
            "eukaryotic translation initiation factor 4H (eIF4H)",
            "eukaryotic translation initiation factor 5A (eIF5A)",
            "eukaryotic translation initiation factor 5B (eIF5B)",
            "eukaryotic translation initiation factor 6 (eIF6)",
            "eukaryotic translation initiation factor 1 (eIF1)",
            "eukaryotic translation initiation factor 1A (eIF1A)",
            "eukaryotic translation initiation factor 2B (eIF2B)",
            "eukaryotic translation initiation factor 2C (eIF2C)",
            "eukaryotic translation initiation factor 2D (eIF2D)",
            "eukaryotic translation initiation factor 3A (eIF3A)",
            "eukaryotic translation initiation factor 3B (eIF3B)",
            "eukaryotic translation initiation factor 3C (eIF3C)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "eukaryotic initiation factor 4E (eIF4E)",
                "eukaryotic initiation factor 4G (eIF4G)",
                "eukaryotic initiation factor 2 (eIF2)",
                "eukaryotic initiation factor 5 (eIF5)",
                "eukaryotic initiation factor 3 (eIF3)",
                "eukaryotic elongation factor 1 (eEF1)",
                "eukaryotic elongation factor 2 (eEF2)",
                "eukaryotic peptide chain release factor 1 (eRF1)",
                "eukaryotic peptide chain release factor 3 (eRF3)",
                "poly(A)-binding protein (PABP)",
                "eukaryotic translation initiation factor 4A (eIF4A)",
                "eukaryotic translation initiation factor 4B (eIF4B)",
                "eukaryotic translation initiation factor 4H (eIF4H)",
                "eukaryotic translation initiation factor 5A (eIF5A)",
                "eukaryotic translation initiation factor 5B (eIF5B)",
                "eukaryotic translation initiation factor 6 (eIF6)",
                "eukaryotic translation initiation factor 1 (eIF1)",
                "eukaryotic translation initiation factor 1A (eIF1A)",
                "eukaryotic translation initiation factor 2B (eIF2B)",
                "eukaryotic translation initiation factor 2C (eIF2C)",
                "eukaryotic translation initiation factor 2D (eIF2D)",
                "eukaryotic translation initiation factor 3A (eIF3A)",
                "eukaryotic translation initiation factor 3B (eIF3B)",
                "eukaryotic translation initiation factor 3C (eIF3C)"
            ],
            "mismatches": [],
            "true_referents": [
                "eukaryotic elongation factor 1 (eEF1)",
                "eukaryotic elongation factor 2 (eEF2)",
                "eukaryotic initiation factor 2 (eIF2)",
                "eukaryotic initiation factor 3 (eIF3)",
                "eukaryotic initiation factor 4E (eIF4E)",
                "eukaryotic initiation factor 4G (eIF4G)",
                "eukaryotic initiation factor 5 (eIF5)",
                "eukaryotic peptide chain release factor 1 (eRF1)",
                "eukaryotic peptide chain release factor 3 (eRF3)",
                "eukaryotic translation initiation factor 1 (eIF1)",
                "eukaryotic translation initiation factor 1A (eIF1A)",
                "eukaryotic translation initiation factor 2B (eIF2B)",
                "eukaryotic translation initiation factor 2C (eIF2C)",
                "eukaryotic translation initiation factor 2D (eIF2D)",
                "eukaryotic translation initiation factor 3A (eIF3A)",
                "eukaryotic translation initiation factor 3B (eIF3B)",
                "eukaryotic translation initiation factor 3C (eIF3C)",
                "eukaryotic translation initiation factor 4A (eIF4A)",
                "eukaryotic translation initiation factor 4B (eIF4B)",
                "eukaryotic translation initiation factor 4H (eIF4H)",
                "eukaryotic translation initiation factor 5A (eIF5A)",
                "eukaryotic translation initiation factor 5B (eIF5B)",
                "eukaryotic translation initiation factor 6 (eIF6)",
                "poly(A)-binding protein (PABP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Protein A (PA)",
            "Protein B (PB)",
            "Protein C (PC)",
            "Protein D (PD)",
            "Protein E (PE)",
            "Protein F (PF)",
            "Protein G (PG)",
            "Protein H (PH)",
            "Protein I (PI)",
            "Protein J (PJ)",
            "Protein K (PK)",
            "Protein L (PL)",
            "Protein M (PM)",
            "Protein N (PN)",
            "Protein O (PO)",
            "Protein P (PP)",
            "Protein Q (PQ)",
            "Protein R (PR)",
            "Protein S (PS)",
            "Protein T (PT)",
            "Protein U (PU)",
            "Protein V (PV)",
            "Protein W (PW)",
            "Protein X (PX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Protein A (PA)",
                "Protein B (PB)",
                "Protein C (PC)",
                "Protein D (PD)",
                "Protein E (PE)",
                "Protein F (PF)",
                "Protein G (PG)",
                "Protein H (PH)",
                "Protein I (PI)",
                "Protein J (PJ)",
                "Protein K (PK)",
                "Protein L (PL)",
                "Protein M (PM)",
                "Protein N (PN)",
                "Protein O (PO)",
                "Protein P (PP)",
                "Protein Q (PQ)",
                "Protein R (PR)",
                "Protein S (PS)",
                "Protein T (PT)",
                "Protein U (PU)",
                "Protein V (PV)",
                "Protein W (PW)",
                "Protein X (PX)"
            ],
            "mismatches": [],
            "true_referents": [
                "Protein A (PA)",
                "Protein B (PB)",
                "Protein C (PC)",
                "Protein D (PD)",
                "Protein E (PE)",
                "Protein F (PF)",
                "Protein G (PG)",
                "Protein H (PH)",
                "Protein I (PI)",
                "Protein J (PJ)",
                "Protein K (PK)",
                "Protein L (PL)",
                "Protein M (PM)",
                "Protein N (PN)",
                "Protein O (PO)",
                "Protein P (PP)",
                "Protein Q (PQ)",
                "Protein R (PR)",
                "Protein S (PS)",
                "Protein T (PT)",
                "Protein U (PU)",
                "Protein V (PV)",
                "Protein W (PW)",
                "Protein X (PX)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic initiation factor 4E (eIF4E)",
            "Eukaryotic initiation factor 4A (eIF4A)",
            "Eukaryotic initiation factor 4G (eIF4G)",
            "Eukaryotic initiation factor 2 alpha (eIF2\u03b1)",
            "Eukaryotic initiation factor 3 (eIF3)",
            "Eukaryotic elongation factor 1 alpha (eEF1A)",
            "Eukaryotic elongation factor 2 (eEF2)",
            "4E-Binding protein 1 (4E-BP1)",
            "Mechanistic target of rapamycin (mTOR)",
            "Ribosomal protein S6 kinase beta-1 (S6K1)",
            "Eukaryotic initiation factor 5 (eIF5)",
            "Eukaryotic initiation factor 6 (eIF6)",
            "Receptor for activated C kinase 1 (RACK1)",
            "Fragile X mental retardation protein (FMRP)",
            "Transcription initiation factor TIF1A",
            "Programmed cell death protein 4 (PDCD4)",
            "DEAD-box helicase 6 (DDX6)",
            "La-related protein 1 (LARP1)",
            "GRB10 interacting GYF protein 2 (GIGYF2)",
            "Eukaryotic initiation factor 1 (eIF1)",
            "Eukaryotic initiation factor 2B (eIF2B)",
            "Eukaryotic initiation factor 3 subunit F (eIF3F)",
            "Eukaryotic initiation factor 3 subunit H (eIF3H)",
            "Eukaryotic initiation factor 4B (eIF4B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic initiation factor 4A (eIF4A)",
                "Eukaryotic initiation factor 4G (eIF4G)",
                "Eukaryotic initiation factor 2 alpha (eIF2\u03b1)",
                "Eukaryotic initiation factor 3 (eIF3)",
                "Eukaryotic elongation factor 1 alpha (eEF1A)",
                "Eukaryotic elongation factor 2 (eEF2)",
                "4E-Binding protein 1 (4E-BP1)",
                "Mechanistic target of rapamycin (mTOR)",
                "Ribosomal protein S6 kinase beta-1 (S6K1)",
                "Eukaryotic initiation factor 5 (eIF5)",
                "Eukaryotic initiation factor 6 (eIF6)",
                "Receptor for activated C kinase 1 (RACK1)",
                "Fragile X mental retardation protein (FMRP)",
                "Transcription initiation factor TIF1A",
                "Programmed cell death protein 4 (PDCD4)",
                "DEAD-box helicase 6 (DDX6)",
                "La-related protein 1 (LARP1)",
                "GRB10 interacting GYF protein 2 (GIGYF2)",
                "Eukaryotic initiation factor 1 (eIF1)",
                "Eukaryotic initiation factor 2B (eIF2B)",
                "Eukaryotic initiation factor 3 subunit F (eIF3F)",
                "Eukaryotic initiation factor 3 subunit H (eIF3H)",
                "Eukaryotic initiation factor 4B (eIF4B)"
            ],
            "mismatches": [],
            "true_referents": [
                "4E-Binding protein 1 (4E-BP1)",
                "DEAD-box helicase 6 (DDX6)",
                "Eukaryotic elongation factor 1 alpha (eEF1A)",
                "Eukaryotic elongation factor 2 (eEF2)",
                "Eukaryotic initiation factor 1 (eIF1)",
                "Eukaryotic initiation factor 2 alpha (eIF2\u03b1)",
                "Eukaryotic initiation factor 2B (eIF2B)",
                "Eukaryotic initiation factor 3 (eIF3)",
                "Eukaryotic initiation factor 3 subunit F (eIF3F)",
                "Eukaryotic initiation factor 3 subunit H (eIF3H)",
                "Eukaryotic initiation factor 4A (eIF4A)",
                "Eukaryotic initiation factor 4B (eIF4B)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic initiation factor 4G (eIF4G)",
                "Eukaryotic initiation factor 5 (eIF5)",
                "Eukaryotic initiation factor 6 (eIF6)",
                "Fragile X mental retardation protein (FMRP)",
                "GRB10 interacting GYF protein 2 (GIGYF2)",
                "La-related protein 1 (LARP1)",
                "Mechanistic target of rapamycin (mTOR)",
                "Programmed cell death protein 4 (PDCD4)",
                "Receptor for activated C kinase 1 (RACK1)",
                "Ribosomal protein S6 kinase beta-1 (S6K1)",
                "Transcription initiation factor TIF1A"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic initiation factor 2 (eIF2)",
            "Eukaryotic initiation factor 4E (eIF4E)",
            "Eukaryotic elongation factor 1A (eEF1A)",
            "Eukaryotic elongation factor 2 (eEF2)",
            "Eukaryotic release factor 1 (eRF1)",
            "Poly(A)-binding protein (PABP)",
            "GCN2 protein kinase",
            "PERK protein kinase",
            "4E-BP1 (eIF4E-binding protein 1)",
            "mTOR (mammalian target of rapamycin)",
            "S6 kinase",
            "Fragile X mental retardation protein (FMRP)",
            "Cytoplasmic polyadenylation element-binding protein (CPEB)",
            "Pumilio",
            "Staufen",
            "Argonaute proteins",
            "RISC (RNA-induced silencing complex)",
            "Smaug",
            "Bicoid",
            "Nanos",
            "Bruno",
            "IRP1 (Iron regulatory protein 1)",
            "IRP2 (Iron regulatory protein 2)",
            "FMRP-associated mRNP complex"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic initiation factor 2 (eIF2)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic elongation factor 1A (eEF1A)",
                "Eukaryotic elongation factor 2 (eEF2)",
                "Eukaryotic release factor 1 (eRF1)",
                "Poly(A)-binding protein (PABP)",
                "GCN2 protein kinase",
                "PERK protein kinase",
                "4E-BP1 (eIF4E-binding protein 1)",
                "mTOR (mammalian target of rapamycin)",
                "S6 kinase",
                "Fragile X mental retardation protein (FMRP)",
                "Cytoplasmic polyadenylation element-binding protein (CPEB)",
                "Pumilio",
                "Staufen",
                "Argonaute proteins",
                "RISC (RNA-induced silencing complex)",
                "Smaug",
                "Bicoid",
                "Nanos",
                "Bruno",
                "IRP1 (Iron regulatory protein 1)",
                "IRP2 (Iron regulatory protein 2)",
                "FMRP-associated mRNP complex"
            ],
            "mismatches": [],
            "true_referents": [
                "4E-BP1 (eIF4E-binding protein 1)",
                "Argonaute proteins",
                "Bicoid",
                "Bruno",
                "Cytoplasmic polyadenylation element-binding protein (CPEB)",
                "Eukaryotic elongation factor 1A (eEF1A)",
                "Eukaryotic elongation factor 2 (eEF2)",
                "Eukaryotic initiation factor 2 (eIF2)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic release factor 1 (eRF1)",
                "FMRP-associated mRNP complex",
                "Fragile X mental retardation protein (FMRP)",
                "GCN2 protein kinase",
                "IRP1 (Iron regulatory protein 1)",
                "IRP2 (Iron regulatory protein 2)",
                "Nanos",
                "PERK protein kinase",
                "Poly(A)-binding protein (PABP)",
                "Pumilio",
                "RISC (RNA-induced silencing complex)",
                "S6 kinase",
                "Smaug",
                "Staufen",
                "mTOR (mammalian target of rapamycin)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic initiation factor 2 (eIF2)",
            "Eukaryotic initiation factor 4E (eIF4E)",
            "Eukaryotic initiation factor 4G (eIF4G)",
            "Eukaryotic initiation factor 4A (eIF4A)",
            "Eukaryotic initiation factor 4B (eIF4B)",
            "Eukaryotic initiation factor 4H (eIF4H)",
            "Eukaryotic elongation factor 1A (eEF1A)",
            "Eukaryotic elongation factor 1B (eEF1B)",
            "Eukaryotic elongation factor 2 (eEF2)",
            "Eukaryotic release factor 1 (eRF1)",
            "Eukaryotic release factor 3 (eRF3)",
            "Poly(A)-binding protein (PABP)",
            "Ribosomal protein S6 kinase (S6K)",
            "Eukaryotic translation initiation factor 2-alpha kinase 1 (EIF2AK1)",
            "Eukaryotic translation initiation factor 2-alpha kinase 2 (EIF2AK2)",
            "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
            "Eukaryotic translation initiation factor 2-alpha kinase 4 (EIF2AK4)",
            "Eukaryotic translation initiation factor 4E-binding protein 1 (4E-BP1)",
            "Eukaryotic translation initiation factor 4E-binding protein 2 (4E-BP2)",
            "Eukaryotic translation initiation factor 4E-binding protein 3 (4E-BP3)",
            "Eukaryotic translation initiation factor 4E transporter (4E-T)",
            "Eukaryotic translation initiation factor 5 (eIF5)",
            "Eukaryotic translation initiation factor 5A (eIF5A)",
            "Eukaryotic translation initiation factor 5B (eIF5B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic initiation factor 2 (eIF2)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic initiation factor 4G (eIF4G)",
                "Eukaryotic initiation factor 4A (eIF4A)",
                "Eukaryotic initiation factor 4B (eIF4B)",
                "Eukaryotic initiation factor 4H (eIF4H)",
                "Eukaryotic elongation factor 1A (eEF1A)",
                "Eukaryotic elongation factor 1B (eEF1B)",
                "Eukaryotic elongation factor 2 (eEF2)",
                "Eukaryotic release factor 1 (eRF1)",
                "Eukaryotic release factor 3 (eRF3)",
                "Poly(A)-binding protein (PABP)",
                "Ribosomal protein S6 kinase (S6K)",
                "Eukaryotic translation initiation factor 2-alpha kinase 1 (EIF2AK1)",
                "Eukaryotic translation initiation factor 2-alpha kinase 2 (EIF2AK2)",
                "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
                "Eukaryotic translation initiation factor 2-alpha kinase 4 (EIF2AK4)",
                "Eukaryotic translation initiation factor 4E-binding protein 1 (4E-BP1)",
                "Eukaryotic translation initiation factor 4E-binding protein 2 (4E-BP2)",
                "Eukaryotic translation initiation factor 4E-binding protein 3 (4E-BP3)",
                "Eukaryotic translation initiation factor 4E transporter (4E-T)",
                "Eukaryotic translation initiation factor 5 (eIF5)",
                "Eukaryotic translation initiation factor 5A (eIF5A)",
                "Eukaryotic translation initiation factor 5B (eIF5B)"
            ],
            "mismatches": [],
            "true_referents": [
                "Eukaryotic elongation factor 1A (eEF1A)",
                "Eukaryotic elongation factor 1B (eEF1B)",
                "Eukaryotic elongation factor 2 (eEF2)",
                "Eukaryotic initiation factor 2 (eIF2)",
                "Eukaryotic initiation factor 4A (eIF4A)",
                "Eukaryotic initiation factor 4B (eIF4B)",
                "Eukaryotic initiation factor 4E (eIF4E)",
                "Eukaryotic initiation factor 4G (eIF4G)",
                "Eukaryotic initiation factor 4H (eIF4H)",
                "Eukaryotic release factor 1 (eRF1)",
                "Eukaryotic release factor 3 (eRF3)",
                "Eukaryotic translation initiation factor 2-alpha kinase 1 (EIF2AK1)",
                "Eukaryotic translation initiation factor 2-alpha kinase 2 (EIF2AK2)",
                "Eukaryotic translation initiation factor 2-alpha kinase 3 (EIF2AK3)",
                "Eukaryotic translation initiation factor 2-alpha kinase 4 (EIF2AK4)",
                "Eukaryotic translation initiation factor 4E transporter (4E-T)",
                "Eukaryotic translation initiation factor 4E-binding protein 1 (4E-BP1)",
                "Eukaryotic translation initiation factor 4E-binding protein 2 (4E-BP2)",
                "Eukaryotic translation initiation factor 4E-binding protein 3 (4E-BP3)",
                "Eukaryotic translation initiation factor 5 (eIF5)",
                "Eukaryotic translation initiation factor 5A (eIF5A)",
                "Eukaryotic translation initiation factor 5B (eIF5B)",
                "Poly(A)-binding protein (PABP)",
                "Ribosomal protein S6 kinase (S6K)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic translation initiation factor 4E (eIF4E)",
            "Eukaryotic translation initiation factor 4G (eIF4G)",
            "Eukaryotic translation initiation factor 4A (eIF4A)",
            "Eukaryotic translation initiation factor 4B (eIF4B)",
            "Poly(A)-binding protein (PABP)",
            "Eukaryotic translation initiation factor 2 (eIF2)",
            "Eukaryotic translation initiation factor 3 (eIF3)",
            "Eukaryotic translation initiation factor 5 (eIF5)",
            "Eukaryotic translation initiation factor 5B (eIF5B)",
            "Eukaryotic translation initiation factor 1 (eIF1)",
            "Eukaryotic translation initiation factor 1A (eIF1A)",
            "Eukaryotic translation initiation factor 6 (eIF6)",
            "Mammalian target of rapamycin (mTOR)",
            "S6 kinase 1 (S6K1)",
            "4E-binding protein 1 (4E-BP1)",
            "Programmed cell death 4 (PDCD4)",
            "Tristetraprolin (TTP)",
            "HuR protein",
            "Fragile X mental retardation protein (FMRP)",
            "Cytoplasmic polyadenylation element binding protein (CPEB)",
            "Upstream of N-Ras (Unr)",
            "Musashi RNA-binding protein",
            "Pumilio homology domain family member 1 (PUM1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic translation initiation factor 4E (eIF4E)",
                "Eukaryotic translation initiation factor 4G (eIF4G)",
                "Eukaryotic translation initiation factor 4A (eIF4A)",
                "Eukaryotic translation initiation factor 4B (eIF4B)",
                "Poly(A)-binding protein (PABP)",
                "Eukaryotic translation initiation factor 2 (eIF2)",
                "Eukaryotic translation initiation factor 3 (eIF3)",
                "Eukaryotic translation initiation factor 5 (eIF5)",
                "Eukaryotic translation initiation factor 5B (eIF5B)",
                "Eukaryotic translation initiation factor 1 (eIF1)",
                "Eukaryotic translation initiation factor 1A (eIF1A)",
                "Eukaryotic translation initiation factor 6 (eIF6)",
                "Mammalian target of rapamycin (mTOR)",
                "S6 kinase 1 (S6K1)",
                "4E-binding protein 1 (4E-BP1)",
                "Programmed cell death 4 (PDCD4)",
                "Tristetraprolin (TTP)",
                "HuR protein",
                "Fragile X mental retardation protein (FMRP)",
                "Cytoplasmic polyadenylation element binding protein (CPEB)",
                "Upstream of N-Ras (Unr)",
                "Musashi RNA-binding protein",
                "Pumilio homology domain family member 1 (PUM1)"
            ],
            "mismatches": [],
            "true_referents": [
                "4E-binding protein 1 (4E-BP1)",
                "Cytoplasmic polyadenylation element binding protein (CPEB)",
                "Eukaryotic translation initiation factor 1 (eIF1)",
                "Eukaryotic translation initiation factor 1A (eIF1A)",
                "Eukaryotic translation initiation factor 2 (eIF2)",
                "Eukaryotic translation initiation factor 3 (eIF3)",
                "Eukaryotic translation initiation factor 4A (eIF4A)",
                "Eukaryotic translation initiation factor 4B (eIF4B)",
                "Eukaryotic translation initiation factor 4E (eIF4E)",
                "Eukaryotic translation initiation factor 4G (eIF4G)",
                "Eukaryotic translation initiation factor 5 (eIF5)",
                "Eukaryotic translation initiation factor 5B (eIF5B)",
                "Eukaryotic translation initiation factor 6 (eIF6)",
                "Fragile X mental retardation protein (FMRP)",
                "HuR protein",
                "Mammalian target of rapamycin (mTOR)",
                "Musashi RNA-binding protein",
                "Poly(A)-binding protein (PABP)",
                "Programmed cell death 4 (PDCD4)",
                "Pumilio homology domain family member 1 (PUM1)",
                "S6 kinase 1 (S6K1)",
                "Tristetraprolin (TTP)",
                "Upstream of N-Ras (Unr)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic Translation Initiation Factor 4E (eIF4E)",
            "Eukaryotic Translation Initiation Factor 4B (eIF4B)",
            "Eukaryotic Translation Initiation Factor 4G (eIF4G)",
            "Poly(A) Binding Protein (PABP)",
            "Eukaryotic Translation Initiation Factor 2 (eIF2)",
            "Eukaryotic Translation Initiation Factor 2B (eIF2B)",
            "Eukaryotic Translation Initiation Factor 3 (eIF3)",
            "Eukaryotic Translation Elongation Factor 1A (eEF1A)",
            "Eukaryotic Translation Elongation Factor 2 (eEF2)",
            "Ribosomal Protein S6 Kinase (S6K)",
            "Eukaryotic Translation Initiation Factor 4E Binding Protein (4E-BP)",
            "Mammalian Target of Rapamycin (mTOR)",
            "Glycogen Synthase Kinase 3 (GSK3)",
            "Protein Kinase C (PKC)",
            "Protein Kinase B (Akt)",
            "Mitogen-Activated Protein Kinase (MAPK)",
            "Extracellular Signal-Regulated Kinase (ERK)",
            "c-Jun N-Terminal Kinase (JNK)",
            "p38 Mitogen-Activated Protein Kinase (p38 MAPK)",
            "Tuberous Sclerosis Complex 1 (TSC1)",
            "Tuberous Sclerosis Complex 2 (TSC2)",
            "Ras Homolog Enriched in Brain (Rheb)",
            "Eukaryotic Translation Initiation Factor 5B (eIF5B)",
            "Eukaryotic Translation Initiation Factor 1 (eIF1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic Translation Initiation Factor 4E (eIF4E)",
                "Eukaryotic Translation Initiation Factor 4B (eIF4B)",
                "Eukaryotic Translation Initiation Factor 4G (eIF4G)",
                "Poly(A) Binding Protein (PABP)",
                "Eukaryotic Translation Initiation Factor 2 (eIF2)",
                "Eukaryotic Translation Initiation Factor 2B (eIF2B)",
                "Eukaryotic Translation Initiation Factor 3 (eIF3)",
                "Eukaryotic Translation Elongation Factor 1A (eEF1A)",
                "Eukaryotic Translation Elongation Factor 2 (eEF2)",
                "Ribosomal Protein S6 Kinase (S6K)",
                "Eukaryotic Translation Initiation Factor 4E Binding Protein (4E-BP)",
                "Mammalian Target of Rapamycin (mTOR)",
                "Glycogen Synthase Kinase 3 (GSK3)",
                "Protein Kinase C (PKC)",
                "Protein Kinase B (Akt)",
                "Mitogen-Activated Protein Kinase (MAPK)",
                "Extracellular Signal-Regulated Kinase (ERK)",
                "c-Jun N-Terminal Kinase (JNK)",
                "p38 Mitogen-Activated Protein Kinase (p38 MAPK)",
                "Tuberous Sclerosis Complex 1 (TSC1)",
                "Tuberous Sclerosis Complex 2 (TSC2)",
                "Ras Homolog Enriched in Brain (Rheb)",
                "Eukaryotic Translation Initiation Factor 5B (eIF5B)",
                "Eukaryotic Translation Initiation Factor 1 (eIF1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Eukaryotic Translation Elongation Factor 1A (eEF1A)",
                "Eukaryotic Translation Elongation Factor 2 (eEF2)",
                "Eukaryotic Translation Initiation Factor 1 (eIF1)",
                "Eukaryotic Translation Initiation Factor 2 (eIF2)",
                "Eukaryotic Translation Initiation Factor 2B (eIF2B)",
                "Eukaryotic Translation Initiation Factor 3 (eIF3)",
                "Eukaryotic Translation Initiation Factor 4B (eIF4B)",
                "Eukaryotic Translation Initiation Factor 4E (eIF4E)",
                "Eukaryotic Translation Initiation Factor 4E Binding Protein (4E-BP)",
                "Eukaryotic Translation Initiation Factor 4G (eIF4G)",
                "Eukaryotic Translation Initiation Factor 5B (eIF5B)",
                "Extracellular Signal-Regulated Kinase (ERK)",
                "Glycogen Synthase Kinase 3 (GSK3)",
                "Mammalian Target of Rapamycin (mTOR)",
                "Mitogen-Activated Protein Kinase (MAPK)",
                "Poly(A) Binding Protein (PABP)",
                "Protein Kinase B (Akt)",
                "Protein Kinase C (PKC)",
                "Ras Homolog Enriched in Brain (Rheb)",
                "Ribosomal Protein S6 Kinase (S6K)",
                "Tuberous Sclerosis Complex 1 (TSC1)",
                "Tuberous Sclerosis Complex 2 (TSC2)",
                "c-Jun N-Terminal Kinase (JNK)",
                "p38 Mitogen-Activated Protein Kinase (p38 MAPK)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "Eukaryotic Initiation Factor 2 (eIF2)",
            "Regulatory Protein S6 Kinase",
            "eIF2 Kinase",
            "Phosphorylated eIF2",
            "eIF2B",
            "eIF4E-binding Protein 1 (4E-BP1)",
            "Phosphorylated 4E-BP1",
            "mTOR",
            "Phosphorylated mTOR",
            "Raptor",
            "DEPDC5",
            "eIF4E",
            "Phosphorylated eIF4E",
            "4E-BP2",
            "Phosphorylated 4E-BP2",
            "eIF4G",
            "Phosphorylated eIF4G",
            "eIF4A",
            "Phosphorylated eIF4A",
            "eIF3",
            "Phosphorylated eIF3",
            "eIF5",
            "Phosphorylated eIF5",
            "eIF6",
            "Phosphorylated eIF6"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Eukaryotic Initiation Factor 2 (eIF2)",
                "Regulatory Protein S6 Kinase",
                "eIF2 Kinase",
                "Phosphorylated eIF2",
                "eIF2B",
                "eIF4E-binding Protein 1 (4E-BP1)",
                "Phosphorylated 4E-BP1",
                "mTOR",
                "Phosphorylated mTOR",
                "Raptor",
                "DEPDC5",
                "eIF4E",
                "Phosphorylated eIF4E",
                "4E-BP2",
                "Phosphorylated 4E-BP2",
                "eIF4G",
                "Phosphorylated eIF4G",
                "eIF4A",
                "Phosphorylated eIF4A",
                "eIF3",
                "Phosphorylated eIF3",
                "eIF5",
                "Phosphorylated eIF5",
                "eIF6"
            ],
            "mismatches": [
                "Phosphorylated eIF6"
            ],
            "true_referents": [
                "4E-BP2",
                "DEPDC5",
                "Eukaryotic Initiation Factor 2 (eIF2)",
                "Phosphorylated 4E-BP1",
                "Phosphorylated 4E-BP2",
                "Phosphorylated eIF2",
                "Phosphorylated eIF3",
                "Phosphorylated eIF4A",
                "Phosphorylated eIF4E",
                "Phosphorylated eIF4G",
                "Phosphorylated eIF5",
                "Phosphorylated mTOR",
                "Raptor",
                "Regulatory Protein S6 Kinase",
                "eIF2 Kinase",
                "eIF2B",
                "eIF3",
                "eIF4A",
                "eIF4E",
                "eIF4E-binding Protein 1 (4E-BP1)",
                "eIF4G",
                "eIF5",
                "eIF6",
                "mTOR"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            "eIF1A (eukaryotic initiation factor 1A)",
            "eIF2A (eukaryotic initiation factor 2A)",
            "eIF2B (eukaryotic initiation factor 2B)",
            "eIF3A (eukaryotic initiation factor 3A)",
            "eIF3B (eukaryotic initiation factor 3B)",
            "eIF3C (eukaryotic initiation factor 3C)",
            "eIF3D (eukaryotic initiation factor 3D)",
            "eIF3E (eukaryotic initiation factor 3E)",
            "eIF3F (eukaryotic initiation factor 3F)",
            "eIF3G (eukaryotic initiation factor 3G)",
            "eIF3H (eukaryotic initiation factor 3H)",
            "eIF3I (eukaryotic initiation factor 3I)",
            "eIF3J (eukaryotic initiation factor 3J)",
            "eIF4A (eukaryotic initiation factor 4A)",
            "eIF4B (eukaryotic initiation factor 4B)",
            "eIF4E (eukaryotic initiation factor 4E)",
            "eIF4G (eukaryotic initiation factor 4G)",
            "eIF5 (eukaryotic initiation factor 5)",
            "eRF1 (eukaryotic release factor 1)",
            "eRF3 (eukaryotic release factor 3)",
            "PABP (poly(A) binding protein)",
            "GCN2 (general control non-repressible 2)",
            "PKR (protein kinase RNA-activated)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "eIF1A (eukaryotic initiation factor 1A)",
                "eIF2A (eukaryotic initiation factor 2A)",
                "eIF2B (eukaryotic initiation factor 2B)",
                "eIF3A (eukaryotic initiation factor 3A)",
                "eIF3B (eukaryotic initiation factor 3B)",
                "eIF3C (eukaryotic initiation factor 3C)",
                "eIF3D (eukaryotic initiation factor 3D)",
                "eIF3E (eukaryotic initiation factor 3E)",
                "eIF3F (eukaryotic initiation factor 3F)",
                "eIF3G (eukaryotic initiation factor 3G)",
                "eIF3H (eukaryotic initiation factor 3H)",
                "eIF3I (eukaryotic initiation factor 3I)",
                "eIF3J (eukaryotic initiation factor 3J)",
                "eIF4A (eukaryotic initiation factor 4A)",
                "eIF4B (eukaryotic initiation factor 4B)",
                "eIF4E (eukaryotic initiation factor 4E)",
                "eIF4G (eukaryotic initiation factor 4G)",
                "eIF5 (eukaryotic initiation factor 5)",
                "eRF1 (eukaryotic release factor 1)",
                "eRF3 (eukaryotic release factor 3)",
                "PABP (poly(A) binding protein)",
                "GCN2 (general control non-repressible 2)",
                "PKR (protein kinase RNA-activated)"
            ],
            "mismatches": [],
            "true_referents": [
                "GCN2 (general control non-repressible 2)",
                "PABP (poly(A) binding protein)",
                "PKR (protein kinase RNA-activated)",
                "eIF1A (eukaryotic initiation factor 1A)",
                "eIF2A (eukaryotic initiation factor 2A)",
                "eIF2B (eukaryotic initiation factor 2B)",
                "eIF3A (eukaryotic initiation factor 3A)",
                "eIF3B (eukaryotic initiation factor 3B)",
                "eIF3C (eukaryotic initiation factor 3C)",
                "eIF3D (eukaryotic initiation factor 3D)",
                "eIF3E (eukaryotic initiation factor 3E)",
                "eIF3F (eukaryotic initiation factor 3F)",
                "eIF3G (eukaryotic initiation factor 3G)",
                "eIF3H (eukaryotic initiation factor 3H)",
                "eIF3I (eukaryotic initiation factor 3I)",
                "eIF3J (eukaryotic initiation factor 3J)",
                "eIF4A (eukaryotic initiation factor 4A)",
                "eIF4B (eukaryotic initiation factor 4B)",
                "eIF4E (eukaryotic initiation factor 4E)",
                "eIF4G (eukaryotic initiation factor 4G)",
                "eIF5 (eukaryotic initiation factor 5)",
                "eRF1 (eukaryotic release factor 1)",
                "eRF3 (eukaryotic release factor 3)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "translation regulation protein",
        "domain": "biology",
        "response": [
            [
                "Referent",
                "Cyclin-dependent kinase"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase activator"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2B"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 1A"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 1B"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2A"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2C"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2D"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2E"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2F"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2G"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2H"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2I"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2J"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2K"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2L"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2M"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2N"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2O"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2P"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2Q"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2R"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2S"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2T"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2U"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2V"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2W"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2X"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2Y"
            ],
            [
                "Referent",
                "Cyclin-dependent kinase inhibitor 2Z"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cyclin-dependent kinase",
                "Cyclin-dependent kinase inhibitor",
                "Cyclin-dependent kinase activator",
                "Cyclin-dependent kinase inhibitor 2B",
                "Cyclin-dependent kinase inhibitor 1A",
                "Cyclin-dependent kinase inhibitor 1B",
                "Cyclin-dependent kinase inhibitor 2A",
                "Cyclin-dependent kinase inhibitor 2C",
                "Cyclin-dependent kinase inhibitor 2D",
                "Cyclin-dependent kinase inhibitor 2E",
                "Cyclin-dependent kinase inhibitor 2F",
                "Cyclin-dependent kinase inhibitor 2G",
                "Cyclin-dependent kinase inhibitor 2H",
                "Cyclin-dependent kinase inhibitor 2I",
                "Cyclin-dependent kinase inhibitor 2J",
                "Cyclin-dependent kinase inhibitor 2K",
                "Cyclin-dependent kinase inhibitor 2L",
                "Cyclin-dependent kinase inhibitor 2M",
                "Cyclin-dependent kinase inhibitor 2N",
                "Cyclin-dependent kinase inhibitor 2O",
                "Cyclin-dependent kinase inhibitor 2P",
                "Cyclin-dependent kinase inhibitor 2Q",
                "Cyclin-dependent kinase inhibitor 2R",
                "Cyclin-dependent kinase inhibitor 2S"
            ],
            "mismatches": [
                "Cyclin-dependent kinase inhibitor 2T",
                "Cyclin-dependent kinase inhibitor 2U",
                "Cyclin-dependent kinase inhibitor 2V",
                "Cyclin-dependent kinase inhibitor 2W",
                "Cyclin-dependent kinase inhibitor 2X",
                "Cyclin-dependent kinase inhibitor 2Y",
                "Cyclin-dependent kinase inhibitor 2Z"
            ],
            "true_referents": [
                "[\"Referent\", \"Cyclin-dependent kinase activator\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 1A\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 1B\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2A\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2B\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2C\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2D\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2E\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2F\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2G\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2H\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2I\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2J\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2K\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2L\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2M\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2N\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2O\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2P\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2Q\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2R\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor 2S\"]",
                "[\"Referent\", \"Cyclin-dependent kinase inhibitor\"]",
                "[\"Referent\", \"Cyclin-dependent kinase\"]"
            ],
            "TP": 24,
            "FP": 7,
            "FN": 0
        }
    }
]