[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "System A (SLC1A4)",
            "System B0 (SLC6A19)",
            "System B0AT1 (SLC6A19)",
            "System B0AT3 (SLC6A20)",
            "System B0AT6 (SLC6A14)",
            "System B (SLC6A18)",
            "System ASC (SLC36A1)",
            "System Amino acid-preferring Na+ coupled (SLC38A1)",
            "System Amino acid-preferring Na+ coupled 2 (SLC38A2)",
            "System Amino acid-preferring Na+ coupled 3 (SLC38A3)",
            "System Amino acid-preferring Na+ coupled 4 (SLC38A4)",
            "System Amino acid-preferring Na+ coupled 5 (SLC38A5)",
            "System Amino acid-preferring Na+ coupled 6 (SLC38A6)",
            "System Amino acid-preferring Na+ coupled 7 (SLC38A7)",
            "System Amino acid-preferring Na+ coupled 8 (SLC38A8)",
            "System Amino acid-preferring Na+ coupled 9 (SLC38A9)",
            "System L (SLC7A5/SLC3A2)",
            "System L (SLC7A7/SLC3A2)",
            "System L (SLC7A9/SLC3A2)",
            "System L (SLC7A13/SLC3A2)",
            "System L (SLC7A14/SLC3A2)",
            "System L (SLC7A16/SLC3A2)",
            "System T (SLC7A8/SLC3A2)",
            "System y+ (SLC16A10)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "System A (SLC1A4)",
                "System B0 (SLC6A19)",
                "System B0AT1 (SLC6A19)",
                "System B0AT3 (SLC6A20)",
                "System B0AT6 (SLC6A14)",
                "System B (SLC6A18)",
                "System ASC (SLC36A1)",
                "System Amino acid-preferring Na+ coupled (SLC38A1)",
                "System Amino acid-preferring Na+ coupled 2 (SLC38A2)",
                "System Amino acid-preferring Na+ coupled 3 (SLC38A3)",
                "System Amino acid-preferring Na+ coupled 4 (SLC38A4)",
                "System Amino acid-preferring Na+ coupled 5 (SLC38A5)",
                "System Amino acid-preferring Na+ coupled 6 (SLC38A6)",
                "System Amino acid-preferring Na+ coupled 7 (SLC38A7)",
                "System Amino acid-preferring Na+ coupled 8 (SLC38A8)",
                "System Amino acid-preferring Na+ coupled 9 (SLC38A9)",
                "System L (SLC7A5/SLC3A2)",
                "System L (SLC7A7/SLC3A2)",
                "System L (SLC7A9/SLC3A2)",
                "System L (SLC7A13/SLC3A2)",
                "System L (SLC7A14/SLC3A2)",
                "System L (SLC7A16/SLC3A2)",
                "System T (SLC7A8/SLC3A2)",
                "System y+ (SLC16A10)"
            ],
            "mismatches": [],
            "true_referents": [
                "System A (SLC1A4)",
                "System ASC (SLC36A1)",
                "System Amino acid-preferring Na+ coupled (SLC38A1)",
                "System Amino acid-preferring Na+ coupled 2 (SLC38A2)",
                "System Amino acid-preferring Na+ coupled 3 (SLC38A3)",
                "System Amino acid-preferring Na+ coupled 4 (SLC38A4)",
                "System Amino acid-preferring Na+ coupled 5 (SLC38A5)",
                "System Amino acid-preferring Na+ coupled 6 (SLC38A6)",
                "System Amino acid-preferring Na+ coupled 7 (SLC38A7)",
                "System Amino acid-preferring Na+ coupled 8 (SLC38A8)",
                "System Amino acid-preferring Na+ coupled 9 (SLC38A9)",
                "System B (SLC6A18)",
                "System B0 (SLC6A19)",
                "System B0AT1 (SLC6A19)",
                "System B0AT3 (SLC6A20)",
                "System B0AT6 (SLC6A14)",
                "System L (SLC7A13/SLC3A2)",
                "System L (SLC7A14/SLC3A2)",
                "System L (SLC7A16/SLC3A2)",
                "System L (SLC7A5/SLC3A2)",
                "System L (SLC7A7/SLC3A2)",
                "System L (SLC7A9/SLC3A2)",
                "System T (SLC7A8/SLC3A2)",
                "System y+ (SLC16A10)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "System A Amino Acid Transporter (SLC38A1)",
            "System ASC Amino Acid Transporter (SLC7A5)",
            "System B(0+) Amino Acid Transporter (SLC3A2)",
            "System B(0+) Amino Acid Transporter (SLC7A9)",
            "System B(+) Amino Acid Transporter (SLC7A7)",
            "System L Amino Acid Transporter (SLC7A5)",
            "System L Amino Acid Transporter (SLC7A8)",
            "System N Amino Acid Transporter (SLC38A1)",
            "System N Amino Acid Transporter (SLC38A2)",
            "System N Amino Acid Transporter (SLC38A5)",
            "System Xc- Amino Acid Transporter (SLC7A11)",
            "Alanine, Serine, Cysteine-Preferring Transporter 2 (ASCT2, SLC1A5)",
            "Alanine, Serine, Cysteine-Preferring Transporter 3 (ASCT3, SLC1A6)",
            "Cystine/glutamate antiporter (xCT, SLC7A11)",
            "Excitatory Amino Acid Transporter 1 (EAAT1, SLC1A3)",
            "Excitatory Amino Acid Transporter 2 (EAAT2, SLC1A2)",
            "Excitatory Amino Acid Transporter 3 (EAAT3, SLC1A1)",
            "Excitatory Amino Acid Transporter 4 (EAAT4, SLC1A6)",
            "Excitatory Amino Acid Transporter 5 (EAAT5, SLC1A7)",
            "Glutamate Aspartate Transporter (GLAST, SLC1A3)",
            "Glutamate Transporter 1 (GLT-1, SLC1A2)",
            "Neutral Amino Acid Transporter B(0) (B(0)AT, SLC7A9)",
            "Proton-Coupled Amino Acid Transporter 1 (PAT1, SLC36A1)",
            "Proton-Coupled Aromatic Amino Acid Transporter 1 (PAT2, SLC36A2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "System A Amino Acid Transporter (SLC38A1)",
                "System ASC Amino Acid Transporter (SLC7A5)",
                "System B(0+) Amino Acid Transporter (SLC3A2)",
                "System B(0+) Amino Acid Transporter (SLC7A9)",
                "System B(+) Amino Acid Transporter (SLC7A7)",
                "System L Amino Acid Transporter (SLC7A5)",
                "System L Amino Acid Transporter (SLC7A8)",
                "System N Amino Acid Transporter (SLC38A1)",
                "System N Amino Acid Transporter (SLC38A2)",
                "System N Amino Acid Transporter (SLC38A5)",
                "System Xc- Amino Acid Transporter (SLC7A11)",
                "Alanine, Serine, Cysteine-Preferring Transporter 2 (ASCT2, SLC1A5)",
                "Alanine, Serine, Cysteine-Preferring Transporter 3 (ASCT3, SLC1A6)",
                "Cystine/glutamate antiporter (xCT, SLC7A11)",
                "Excitatory Amino Acid Transporter 1 (EAAT1, SLC1A3)",
                "Excitatory Amino Acid Transporter 2 (EAAT2, SLC1A2)",
                "Excitatory Amino Acid Transporter 3 (EAAT3, SLC1A1)",
                "Excitatory Amino Acid Transporter 4 (EAAT4, SLC1A6)",
                "Excitatory Amino Acid Transporter 5 (EAAT5, SLC1A7)",
                "Glutamate Aspartate Transporter (GLAST, SLC1A3)",
                "Glutamate Transporter 1 (GLT-1, SLC1A2)",
                "Neutral Amino Acid Transporter B(0) (B(0)AT, SLC7A9)",
                "Proton-Coupled Amino Acid Transporter 1 (PAT1, SLC36A1)",
                "Proton-Coupled Aromatic Amino Acid Transporter 1 (PAT2, SLC36A2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine, Serine, Cysteine-Preferring Transporter 2 (ASCT2, SLC1A5)",
                "Alanine, Serine, Cysteine-Preferring Transporter 3 (ASCT3, SLC1A6)",
                "Cystine/glutamate antiporter (xCT, SLC7A11)",
                "Excitatory Amino Acid Transporter 1 (EAAT1, SLC1A3)",
                "Excitatory Amino Acid Transporter 2 (EAAT2, SLC1A2)",
                "Excitatory Amino Acid Transporter 3 (EAAT3, SLC1A1)",
                "Excitatory Amino Acid Transporter 4 (EAAT4, SLC1A6)",
                "Excitatory Amino Acid Transporter 5 (EAAT5, SLC1A7)",
                "Glutamate Aspartate Transporter (GLAST, SLC1A3)",
                "Glutamate Transporter 1 (GLT-1, SLC1A2)",
                "Neutral Amino Acid Transporter B(0) (B(0)AT, SLC7A9)",
                "Proton-Coupled Amino Acid Transporter 1 (PAT1, SLC36A1)",
                "Proton-Coupled Aromatic Amino Acid Transporter 1 (PAT2, SLC36A2)",
                "System A Amino Acid Transporter (SLC38A1)",
                "System ASC Amino Acid Transporter (SLC7A5)",
                "System B(+) Amino Acid Transporter (SLC7A7)",
                "System B(0+) Amino Acid Transporter (SLC3A2)",
                "System B(0+) Amino Acid Transporter (SLC7A9)",
                "System L Amino Acid Transporter (SLC7A5)",
                "System L Amino Acid Transporter (SLC7A8)",
                "System N Amino Acid Transporter (SLC38A1)",
                "System N Amino Acid Transporter (SLC38A2)",
                "System N Amino Acid Transporter (SLC38A5)",
                "System Xc- Amino Acid Transporter (SLC7A11)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "SLC1A1 (EAAC1)",
            "SLC1A2 (GLT-1)",
            "SLC1A3 (GLAST)",
            "SLC1A4 (ASCT1)",
            "SLC1A5 (ASCT2)",
            "SLC3A2 (4F2hc)",
            "SLC3A1 (rBAT)",
            "SLC6A6 (TauT)",
            "SLC6A8 (Creatine Transporter)",
            "SLC6A9 (GlyT1)",
            "SLC6A12 (BETA)",
            "SLC6A13 (GAT2)",
            "SLC6A14 (GAT4)",
            "SLC6A15 (B^0AT3)",
            "SLC6A17 (B^0AT2)",
            "SLC6A19 (B^0AT1)",
            "SLC7A1 (CAT1)",
            "SLC7A2 (CAT2)",
            "SLC7A5 (LAT1)",
            "SLC7A6 (LAT2)",
            "SLC7A7 (y+LAT1)",
            "SLC7A8 (LAT3)",
            "SLC7A11 (xCT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "SLC1A1 (EAAC1)",
                "SLC1A2 (GLT-1)",
                "SLC1A3 (GLAST)",
                "SLC1A4 (ASCT1)",
                "SLC1A5 (ASCT2)",
                "SLC3A2 (4F2hc)",
                "SLC3A1 (rBAT)",
                "SLC6A6 (TauT)",
                "SLC6A8 (Creatine Transporter)",
                "SLC6A9 (GlyT1)",
                "SLC6A12 (BETA)",
                "SLC6A13 (GAT2)",
                "SLC6A14 (GAT4)",
                "SLC6A15 (B^0AT3)",
                "SLC6A17 (B^0AT2)",
                "SLC6A19 (B^0AT1)",
                "SLC7A1 (CAT1)",
                "SLC7A2 (CAT2)",
                "SLC7A5 (LAT1)",
                "SLC7A6 (LAT2)",
                "SLC7A7 (y+LAT1)",
                "SLC7A8 (LAT3)",
                "SLC7A11 (xCT)"
            ],
            "mismatches": [],
            "true_referents": [
                "SLC1A1 (EAAC1)",
                "SLC1A2 (GLT-1)",
                "SLC1A3 (GLAST)",
                "SLC1A4 (ASCT1)",
                "SLC1A5 (ASCT2)",
                "SLC3A1 (rBAT)",
                "SLC3A2 (4F2hc)",
                "SLC6A12 (BETA)",
                "SLC6A13 (GAT2)",
                "SLC6A14 (GAT4)",
                "SLC6A15 (B^0AT3)",
                "SLC6A17 (B^0AT2)",
                "SLC6A19 (B^0AT1)",
                "SLC6A6 (TauT)",
                "SLC6A8 (Creatine Transporter)",
                "SLC6A9 (GlyT1)",
                "SLC7A1 (CAT1)",
                "SLC7A11 (xCT)",
                "SLC7A2 (CAT2)",
                "SLC7A5 (LAT1)",
                "SLC7A6 (LAT2)",
                "SLC7A7 (y+LAT1)",
                "SLC7A8 (LAT3)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "SLC1A1/EAAT2 (GLAST)",
            "SLC1A2/EAAT1 (GLAST)",
            "SLC1A3/EAAT3 (GLAST)",
            "SLC6A6/PAIP1 (GlyT1)",
            "SLC6A9/GlyT2",
            "SLC7A1/y+LAT1",
            "SLC7A2/y+LAT2",
            "SLC7A5/LAT1",
            "SLC7A8/LAT3",
            "SLC3A2/b0,+AT",
            "SLC3A1/b0,+AT",
            "SLC6A14/ASCT2",
            "SLC6A15/ASCT1",
            "SLC6A19/SNAT2",
            "SLC6A20/SNAT1",
            "SLC16A8/OATV1",
            "SLC16A9/OATV2",
            "SLC36A1/EAAC1",
            "SLC36A2/EAAC2",
            "SLC36A3/EAAC3",
            "SLC43A1/EAAT5",
            "SLC43A2/EAAT6",
            "SLC45A1/DIDS1",
            "SLC45A2/DIDS2"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "SLC1A1/EAAT2 (GLAST)",
                "SLC1A2/EAAT1 (GLAST)",
                "SLC1A3/EAAT3 (GLAST)",
                "SLC6A6/PAIP1 (GlyT1)",
                "SLC6A9/GlyT2",
                "SLC7A1/y+LAT1",
                "SLC7A2/y+LAT2",
                "SLC7A5/LAT1",
                "SLC7A8/LAT3",
                "SLC3A2/b0,+AT",
                "SLC3A1/b0,+AT",
                "SLC6A14/ASCT2",
                "SLC6A15/ASCT1",
                "SLC6A19/SNAT2",
                "SLC6A20/SNAT1",
                "SLC16A8/OATV1",
                "SLC16A9/OATV2",
                "SLC36A1/EAAC1",
                "SLC36A2/EAAC2",
                "SLC36A3/EAAC3",
                "SLC43A1/EAAT5",
                "SLC43A2/EAAT6",
                "SLC45A1/DIDS1",
                "SLC45A2/DIDS2"
            ],
            "mismatches": [],
            "true_referents": [
                "SLC16A8/OATV1",
                "SLC16A9/OATV2",
                "SLC1A1/EAAT2 (GLAST)",
                "SLC1A2/EAAT1 (GLAST)",
                "SLC1A3/EAAT3 (GLAST)",
                "SLC36A1/EAAC1",
                "SLC36A2/EAAC2",
                "SLC36A3/EAAC3",
                "SLC3A1/b0,+AT",
                "SLC3A2/b0,+AT",
                "SLC43A1/EAAT5",
                "SLC43A2/EAAT6",
                "SLC45A1/DIDS1",
                "SLC45A2/DIDS2",
                "SLC6A14/ASCT2",
                "SLC6A15/ASCT1",
                "SLC6A19/SNAT2",
                "SLC6A20/SNAT1",
                "SLC6A6/PAIP1 (GlyT1)",
                "SLC6A9/GlyT2",
                "SLC7A1/y+LAT1",
                "SLC7A2/y+LAT2",
                "SLC7A5/LAT1",
                "SLC7A8/LAT3"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "System L1 (SLC7A5)",
            "System L2 (SLC7A8)",
            "System ASC1 (SLC1A5)",
            "System A (SLC38A2)",
            "System N (SLC38A3)",
            "System Xc- (SLC7A11)",
            "System X- (SLC7A6)",
            "System Y+ (SLC7A1)",
            "System B0+ (SLC6A14)",
            "System B0 (SLC6A19)",
            "System IMINO (SLC6A20)",
            "System T (SLC16A10)",
            "System X- (SLC7A9)",
            "System L3 (SLC7A10)",
            "System ASC2 (SLC7A12)",
            "System Y+L (SLC7A7)",
            "System X- (SLC7A2)",
            "System X- (SLC7A3)",
            "System X- (SLC7A4)",
            "System A (SLC38A1)",
            "System N (SLC38A5)",
            "System X- (SLC7A13)",
            "System X- (SLC7A14)",
            "System X- (SLC7A15)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "System L1 (SLC7A5)",
                "System L2 (SLC7A8)",
                "System ASC1 (SLC1A5)",
                "System A (SLC38A2)",
                "System N (SLC38A3)",
                "System Xc- (SLC7A11)",
                "System X- (SLC7A6)",
                "System Y+ (SLC7A1)",
                "System B0+ (SLC6A14)",
                "System B0 (SLC6A19)",
                "System IMINO (SLC6A20)",
                "System T (SLC16A10)",
                "System X- (SLC7A9)",
                "System L3 (SLC7A10)",
                "System ASC2 (SLC7A12)",
                "System Y+L (SLC7A7)",
                "System X- (SLC7A2)",
                "System X- (SLC7A3)",
                "System X- (SLC7A4)",
                "System A (SLC38A1)",
                "System N (SLC38A5)",
                "System X- (SLC7A13)",
                "System X- (SLC7A14)",
                "System X- (SLC7A15)"
            ],
            "mismatches": [],
            "true_referents": [
                "System A (SLC38A1)",
                "System A (SLC38A2)",
                "System ASC1 (SLC1A5)",
                "System ASC2 (SLC7A12)",
                "System B0 (SLC6A19)",
                "System B0+ (SLC6A14)",
                "System IMINO (SLC6A20)",
                "System L1 (SLC7A5)",
                "System L2 (SLC7A8)",
                "System L3 (SLC7A10)",
                "System N (SLC38A3)",
                "System N (SLC38A5)",
                "System T (SLC16A10)",
                "System X- (SLC7A13)",
                "System X- (SLC7A14)",
                "System X- (SLC7A15)",
                "System X- (SLC7A2)",
                "System X- (SLC7A3)",
                "System X- (SLC7A4)",
                "System X- (SLC7A6)",
                "System X- (SLC7A9)",
                "System Xc- (SLC7A11)",
                "System Y+ (SLC7A1)",
                "System Y+L (SLC7A7)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "SLC1A1 (Sodium-dependent neutral amino acid transporter 1)",
            "SLC1A2 (Sodium-dependent glutamate/aspartate transporter)",
            "SLC1A3 (Glial high-affinity glutamate transporter)",
            "SLC6A19 (B0AT1, Neutral amino acid transporter)",
            "SLC7A1 (Cationic amino acid transporter 1)",
            "SLC7A2 (Cationic amino acid transporter 2)",
            "SLC7A5 (LAT1, Large neutral amino acid transporter 1)",
            "SLC7A6 (System L amino acid transporter)",
            "SLC7A7 (CAT2, Cationic amino acid transporter)",
            "SLC7A9 (System ASC amino acid transporter)",
            "SLC16A1 (Monocarboxylate transporter 1)",
            "SLC16A2 (Monocarboxylate transporter 2)",
            "SLC25A22 (Mitochondrial glutamate carrier)",
            "SLC36A1 (Proton-coupled amino acid transporter 1)",
            "SLC38A1 (System A amino acid transporter)",
            "SLC38A2 (System A amino acid transporter)",
            "SLC39A1 (Zinc transporter 1)",
            "SLC43A1 (L-type amino acid transporter 3)",
            "SLC44A1 (Choline transporter)",
            "SLC6A20 (Proline transporter)",
            "SLC7A4 (System X- amino acid transporter)",
            "SLC7A5 (System L amino acid transporter)",
            "SLC7A8 (System X- amino acid transporter)",
            "SLC1A5 (ASCT2, Alanine-serine-cysteine transporter 2)",
            "SLC6A12 (Sodium-dependent neutral amino acid transporter)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "SLC1A1 (Sodium-dependent neutral amino acid transporter 1)",
                "SLC1A2 (Sodium-dependent glutamate/aspartate transporter)",
                "SLC1A3 (Glial high-affinity glutamate transporter)",
                "SLC6A19 (B0AT1, Neutral amino acid transporter)",
                "SLC7A1 (Cationic amino acid transporter 1)",
                "SLC7A2 (Cationic amino acid transporter 2)",
                "SLC7A5 (LAT1, Large neutral amino acid transporter 1)",
                "SLC7A6 (System L amino acid transporter)",
                "SLC7A7 (CAT2, Cationic amino acid transporter)",
                "SLC7A9 (System ASC amino acid transporter)",
                "SLC16A1 (Monocarboxylate transporter 1)",
                "SLC16A2 (Monocarboxylate transporter 2)",
                "SLC25A22 (Mitochondrial glutamate carrier)",
                "SLC36A1 (Proton-coupled amino acid transporter 1)",
                "SLC38A1 (System A amino acid transporter)",
                "SLC38A2 (System A amino acid transporter)",
                "SLC39A1 (Zinc transporter 1)",
                "SLC43A1 (L-type amino acid transporter 3)",
                "SLC44A1 (Choline transporter)",
                "SLC6A20 (Proline transporter)",
                "SLC7A4 (System X- amino acid transporter)",
                "SLC7A8 (System X- amino acid transporter)",
                "SLC1A5 (ASCT2, Alanine-serine-cysteine transporter 2)"
            ],
            "mismatches": [
                "SLC6A12 (Sodium-dependent neutral amino acid transporter)"
            ],
            "true_referents": [
                "SLC16A1 (Monocarboxylate transporter 1)",
                "SLC16A2 (Monocarboxylate transporter 2)",
                "SLC1A1 (Sodium-dependent neutral amino acid transporter 1)",
                "SLC1A2 (Sodium-dependent glutamate/aspartate transporter)",
                "SLC1A3 (Glial high-affinity glutamate transporter)",
                "SLC1A5 (ASCT2, Alanine-serine-cysteine transporter 2)",
                "SLC25A22 (Mitochondrial glutamate carrier)",
                "SLC36A1 (Proton-coupled amino acid transporter 1)",
                "SLC38A1 (System A amino acid transporter)",
                "SLC38A2 (System A amino acid transporter)",
                "SLC39A1 (Zinc transporter 1)",
                "SLC43A1 (L-type amino acid transporter 3)",
                "SLC44A1 (Choline transporter)",
                "SLC6A19 (B0AT1, Neutral amino acid transporter)",
                "SLC6A20 (Proline transporter)",
                "SLC7A1 (Cationic amino acid transporter 1)",
                "SLC7A2 (Cationic amino acid transporter 2)",
                "SLC7A4 (System X- amino acid transporter)",
                "SLC7A5 (LAT1, Large neutral amino acid transporter 1)",
                "SLC7A5 (System L amino acid transporter)",
                "SLC7A6 (System L amino acid transporter)",
                "SLC7A7 (CAT2, Cationic amino acid transporter)",
                "SLC7A8 (System X- amino acid transporter)",
                "SLC7A9 (System ASC amino acid transporter)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
            "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
            "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
            "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
            "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
            "Sodium-coupled neutral amino acid transporter 6 (SNAT6)",
            "Sodium-coupled neutral amino acid transporter 7 (SNAT7)",
            "Sodium-coupled neutral amino acid transporter 8 (SNAT8)",
            "Sodium-coupled neutral amino acid transporter 9 (SNAT9)",
            "Sodium-coupled neutral amino acid transporter 10 (SNAT10)",
            "Sodium-coupled neutral amino acid transporter 11 (SNAT11)",
            "Sodium-coupled neutral amino acid transporter 12 (SNAT12)",
            "Sodium-coupled neutral amino acid transporter 13 (SNAT13)",
            "Sodium-coupled neutral amino acid transporter 14 (SNAT14)",
            "Sodium-coupled neutral amino acid transporter 15 (SNAT15)",
            "Sodium-coupled neutral amino acid transporter 16 (SNAT16)",
            "Sodium-coupled neutral amino acid transporter 17 (SNAT17)",
            "Sodium-coupled neutral amino acid transporter 18 (SNAT18)",
            "Sodium-coupled neutral amino acid transporter 19 (SNAT19)",
            "Sodium-coupled neutral amino acid transporter 20 (SNAT20)",
            "Sodium-coupled neutral amino acid transporter 21 (SNAT21)",
            "Sodium-coupled neutral amino acid transporter 22 (SNAT22)",
            "Sodium-coupled neutral amino acid transporter 23 (SNAT23)",
            "Sodium-coupled neutral amino acid transporter 24 (SNAT24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
                "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
                "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
                "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
                "Sodium-coupled neutral amino acid transporter 6 (SNAT6)",
                "Sodium-coupled neutral amino acid transporter 7 (SNAT7)",
                "Sodium-coupled neutral amino acid transporter 8 (SNAT8)",
                "Sodium-coupled neutral amino acid transporter 9 (SNAT9)",
                "Sodium-coupled neutral amino acid transporter 10 (SNAT10)",
                "Sodium-coupled neutral amino acid transporter 11 (SNAT11)",
                "Sodium-coupled neutral amino acid transporter 12 (SNAT12)",
                "Sodium-coupled neutral amino acid transporter 13 (SNAT13)",
                "Sodium-coupled neutral amino acid transporter 14 (SNAT14)",
                "Sodium-coupled neutral amino acid transporter 15 (SNAT15)",
                "Sodium-coupled neutral amino acid transporter 16 (SNAT16)",
                "Sodium-coupled neutral amino acid transporter 17 (SNAT17)",
                "Sodium-coupled neutral amino acid transporter 18 (SNAT18)",
                "Sodium-coupled neutral amino acid transporter 19 (SNAT19)",
                "Sodium-coupled neutral amino acid transporter 20 (SNAT20)",
                "Sodium-coupled neutral amino acid transporter 21 (SNAT21)",
                "Sodium-coupled neutral amino acid transporter 22 (SNAT22)",
                "Sodium-coupled neutral amino acid transporter 23 (SNAT23)",
                "Sodium-coupled neutral amino acid transporter 24 (SNAT24)"
            ],
            "mismatches": [],
            "true_referents": [
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 10 (SNAT10)",
                "Sodium-coupled neutral amino acid transporter 11 (SNAT11)",
                "Sodium-coupled neutral amino acid transporter 12 (SNAT12)",
                "Sodium-coupled neutral amino acid transporter 13 (SNAT13)",
                "Sodium-coupled neutral amino acid transporter 14 (SNAT14)",
                "Sodium-coupled neutral amino acid transporter 15 (SNAT15)",
                "Sodium-coupled neutral amino acid transporter 16 (SNAT16)",
                "Sodium-coupled neutral amino acid transporter 17 (SNAT17)",
                "Sodium-coupled neutral amino acid transporter 18 (SNAT18)",
                "Sodium-coupled neutral amino acid transporter 19 (SNAT19)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
                "Sodium-coupled neutral amino acid transporter 20 (SNAT20)",
                "Sodium-coupled neutral amino acid transporter 21 (SNAT21)",
                "Sodium-coupled neutral amino acid transporter 22 (SNAT22)",
                "Sodium-coupled neutral amino acid transporter 23 (SNAT23)",
                "Sodium-coupled neutral amino acid transporter 24 (SNAT24)",
                "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
                "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
                "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
                "Sodium-coupled neutral amino acid transporter 6 (SNAT6)",
                "Sodium-coupled neutral amino acid transporter 7 (SNAT7)",
                "Sodium-coupled neutral amino acid transporter 8 (SNAT8)",
                "Sodium-coupled neutral amino acid transporter 9 (SNAT9)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "Solute carrier family 7 member 5 (SLC7A5)",
            "Solute carrier family 7 member 8 (SLC7A8)",
            "Solute carrier family 1 member 5 (SLC1A5)",
            "Solute carrier family 6 member 19 (SLC6A19)",
            "Solute carrier family 6 member 20 (SLC6A20)",
            "Solute carrier family 7 member 7 (SLC7A7)",
            "Solute carrier family 1 member 3 (SLC1A3)",
            "Solute carrier family 1 member 2 (SLC1A2)",
            "Solute carrier family 1 member 1 (SLC1A1)",
            "Solute carrier family 7 member 1 (SLC7A1)",
            "Solute carrier family 7 member 11 (SLC7A11)",
            "Solute carrier family 7 member 2 (SLC7A2)",
            "Solute carrier family 7 member 3 (SLC7A3)",
            "Solute carrier family 7 member 4 (SLC7A4)",
            "Solute carrier family 7 member 6 (SLC7A6)",
            "Solute carrier family 7 member 9 (SLC7A9)",
            "Solute carrier family 7 member 10 (SLC7A10)",
            "Solute carrier family 7 member 12 (SLC7A12)",
            "Solute carrier family 7 member 13 (SLC7A13)",
            "Solute carrier family 7 member 14 (SLC7A14)",
            "Solute carrier family 7 member 15 (SLC7A15)",
            "Solute carrier family 7 member 16 (SLC7A16)",
            "Solute carrier family 7 member 17 (SLC7A17)",
            "Solute carrier family 7 member 18 (SLC7A18)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Solute carrier family 7 member 5 (SLC7A5)",
                "Solute carrier family 7 member 8 (SLC7A8)",
                "Solute carrier family 1 member 5 (SLC1A5)",
                "Solute carrier family 6 member 19 (SLC6A19)",
                "Solute carrier family 6 member 20 (SLC6A20)",
                "Solute carrier family 7 member 7 (SLC7A7)",
                "Solute carrier family 1 member 3 (SLC1A3)",
                "Solute carrier family 1 member 2 (SLC1A2)",
                "Solute carrier family 1 member 1 (SLC1A1)",
                "Solute carrier family 7 member 1 (SLC7A1)",
                "Solute carrier family 7 member 11 (SLC7A11)",
                "Solute carrier family 7 member 2 (SLC7A2)",
                "Solute carrier family 7 member 3 (SLC7A3)",
                "Solute carrier family 7 member 4 (SLC7A4)",
                "Solute carrier family 7 member 6 (SLC7A6)",
                "Solute carrier family 7 member 9 (SLC7A9)",
                "Solute carrier family 7 member 10 (SLC7A10)",
                "Solute carrier family 7 member 12 (SLC7A12)",
                "Solute carrier family 7 member 13 (SLC7A13)",
                "Solute carrier family 7 member 14 (SLC7A14)",
                "Solute carrier family 7 member 15 (SLC7A15)",
                "Solute carrier family 7 member 16 (SLC7A16)",
                "Solute carrier family 7 member 17 (SLC7A17)",
                "Solute carrier family 7 member 18 (SLC7A18)"
            ],
            "mismatches": [],
            "true_referents": [
                "Solute carrier family 1 member 1 (SLC1A1)",
                "Solute carrier family 1 member 2 (SLC1A2)",
                "Solute carrier family 1 member 3 (SLC1A3)",
                "Solute carrier family 1 member 5 (SLC1A5)",
                "Solute carrier family 6 member 19 (SLC6A19)",
                "Solute carrier family 6 member 20 (SLC6A20)",
                "Solute carrier family 7 member 1 (SLC7A1)",
                "Solute carrier family 7 member 10 (SLC7A10)",
                "Solute carrier family 7 member 11 (SLC7A11)",
                "Solute carrier family 7 member 12 (SLC7A12)",
                "Solute carrier family 7 member 13 (SLC7A13)",
                "Solute carrier family 7 member 14 (SLC7A14)",
                "Solute carrier family 7 member 15 (SLC7A15)",
                "Solute carrier family 7 member 16 (SLC7A16)",
                "Solute carrier family 7 member 17 (SLC7A17)",
                "Solute carrier family 7 member 18 (SLC7A18)",
                "Solute carrier family 7 member 2 (SLC7A2)",
                "Solute carrier family 7 member 3 (SLC7A3)",
                "Solute carrier family 7 member 4 (SLC7A4)",
                "Solute carrier family 7 member 5 (SLC7A5)",
                "Solute carrier family 7 member 6 (SLC7A6)",
                "Solute carrier family 7 member 7 (SLC7A7)",
                "Solute carrier family 7 member 8 (SLC7A8)",
                "Solute carrier family 7 member 9 (SLC7A9)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "SLC1A4 (ASCT1)",
            "SLC1A5 (ASCT2)",
            "SLC3A2 (CD98)",
            "SLC6A14 (ATB0,+)",
            "SLC6A19 (B0AT1)",
            "SLC7A1 (CAT1)",
            "SLC7A2 (CAT2)",
            "SLC7A3 (CAT3)",
            "SLC7A5 (LAT1)",
            "SLC7A6 (y+LAT2)",
            "SLC7A7 (y+LAT1)",
            "SLC7A8 (LAT2)",
            "SLC7A11 (xCT)",
            "SLC16A10 (TAT1)",
            "SLC16A6 (TAT2)",
            "SLC36A1 (PAT1)",
            "SLC36A2 (PAT2)",
            "SLC38A1 (SNAT1)",
            "SLC38A2 (SNAT2)",
            "SLC38A3 (SNAT3)",
            "SLC38A4 (SNAT4)",
            "SLC43A1 (LAT3)",
            "SLC43A2 (LAT4)",
            "SLC6A20 (PROT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "SLC1A4 (ASCT1)",
                "SLC1A5 (ASCT2)",
                "SLC3A2 (CD98)",
                "SLC6A14 (ATB0,+)",
                "SLC6A19 (B0AT1)",
                "SLC7A1 (CAT1)",
                "SLC7A2 (CAT2)",
                "SLC7A3 (CAT3)",
                "SLC7A5 (LAT1)",
                "SLC7A6 (y+LAT2)",
                "SLC7A7 (y+LAT1)",
                "SLC7A8 (LAT2)",
                "SLC7A11 (xCT)",
                "SLC16A10 (TAT1)",
                "SLC16A6 (TAT2)",
                "SLC36A1 (PAT1)",
                "SLC36A2 (PAT2)",
                "SLC38A1 (SNAT1)",
                "SLC38A2 (SNAT2)",
                "SLC38A3 (SNAT3)",
                "SLC38A4 (SNAT4)",
                "SLC43A1 (LAT3)",
                "SLC43A2 (LAT4)",
                "SLC6A20 (PROT)"
            ],
            "mismatches": [],
            "true_referents": [
                "SLC16A10 (TAT1)",
                "SLC16A6 (TAT2)",
                "SLC1A4 (ASCT1)",
                "SLC1A5 (ASCT2)",
                "SLC36A1 (PAT1)",
                "SLC36A2 (PAT2)",
                "SLC38A1 (SNAT1)",
                "SLC38A2 (SNAT2)",
                "SLC38A3 (SNAT3)",
                "SLC38A4 (SNAT4)",
                "SLC3A2 (CD98)",
                "SLC43A1 (LAT3)",
                "SLC43A2 (LAT4)",
                "SLC6A14 (ATB0,+)",
                "SLC6A19 (B0AT1)",
                "SLC6A20 (PROT)",
                "SLC7A1 (CAT1)",
                "SLC7A11 (xCT)",
                "SLC7A2 (CAT2)",
                "SLC7A3 (CAT3)",
                "SLC7A5 (LAT1)",
                "SLC7A6 (y+LAT2)",
                "SLC7A7 (y+LAT1)",
                "SLC7A8 (LAT2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "Alanine serine cysteine transporter 2 (ASCT2)",
            "Large neutral amino acids transporter small subunit 1 (LAT1)",
            "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
            "Cationic amino acid transporter 1 (CAT1)",
            "Excitatory amino acid transporter 1 (EAAT1)",
            "Glycine transporter 1 (GlyT1)",
            "Proton-coupled amino acid transporter 1 (PAT1)",
            "Sodium-dependent neutral amino acid transporter 1 (SNAT2)",
            "System N amino acid transporter 1 (SNAT3)",
            "Vesicular inhibitory amino acid transporter (VIAAT)",
            "Broad neutral amino acid transporter (BOAT)",
            "Sodium-coupled neutral amino acid transporter 2 (SNAT5)",
            "L-type amino acid transporter 2 (LAT2)",
            "Sodium-dependent neutral amino acid transporter B(0)AT1",
            "Proton-assisted amino acid transporter 4 (PAT4)",
            "Sodium-dependent neutral amino acid transporter SLC6A19",
            "Cationic amino acid transporter 2 (CAT2)",
            "Sodium-dependent neutral amino acid transporter SLC6A15",
            "Excitatory amino acid transporter 2 (EAAT2)",
            "Sodium-dependent neutral amino acid transporter SLC6A18",
            "Glycine transporter 2 (GlyT2)",
            "Proton-coupled amino acid transporter 2 (PAT2)",
            "System A amino acid transporter 3 (SNAT4)",
            "Vesicular glutamate transporter 1 (VGLUT1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine serine cysteine transporter 2 (ASCT2)",
                "Large neutral amino acids transporter small subunit 1 (LAT1)",
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Cationic amino acid transporter 1 (CAT1)",
                "Excitatory amino acid transporter 1 (EAAT1)",
                "Glycine transporter 1 (GlyT1)",
                "Proton-coupled amino acid transporter 1 (PAT1)",
                "Sodium-dependent neutral amino acid transporter 1 (SNAT2)",
                "System N amino acid transporter 1 (SNAT3)",
                "Vesicular inhibitory amino acid transporter (VIAAT)",
                "Broad neutral amino acid transporter (BOAT)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT5)",
                "L-type amino acid transporter 2 (LAT2)",
                "Sodium-dependent neutral amino acid transporter B(0)AT1",
                "Proton-assisted amino acid transporter 4 (PAT4)",
                "Sodium-dependent neutral amino acid transporter SLC6A19",
                "Cationic amino acid transporter 2 (CAT2)",
                "Sodium-dependent neutral amino acid transporter SLC6A15",
                "Excitatory amino acid transporter 2 (EAAT2)",
                "Sodium-dependent neutral amino acid transporter SLC6A18",
                "Glycine transporter 2 (GlyT2)",
                "Proton-coupled amino acid transporter 2 (PAT2)",
                "System A amino acid transporter 3 (SNAT4)",
                "Vesicular glutamate transporter 1 (VGLUT1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine serine cysteine transporter 2 (ASCT2)",
                "Broad neutral amino acid transporter (BOAT)",
                "Cationic amino acid transporter 1 (CAT1)",
                "Cationic amino acid transporter 2 (CAT2)",
                "Excitatory amino acid transporter 1 (EAAT1)",
                "Excitatory amino acid transporter 2 (EAAT2)",
                "Glycine transporter 1 (GlyT1)",
                "Glycine transporter 2 (GlyT2)",
                "L-type amino acid transporter 2 (LAT2)",
                "Large neutral amino acids transporter small subunit 1 (LAT1)",
                "Proton-assisted amino acid transporter 4 (PAT4)",
                "Proton-coupled amino acid transporter 1 (PAT1)",
                "Proton-coupled amino acid transporter 2 (PAT2)",
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT5)",
                "Sodium-dependent neutral amino acid transporter 1 (SNAT2)",
                "Sodium-dependent neutral amino acid transporter B(0)AT1",
                "Sodium-dependent neutral amino acid transporter SLC6A15",
                "Sodium-dependent neutral amino acid transporter SLC6A18",
                "Sodium-dependent neutral amino acid transporter SLC6A19",
                "System A amino acid transporter 3 (SNAT4)",
                "System N amino acid transporter 1 (SNAT3)",
                "Vesicular glutamate transporter 1 (VGLUT1)",
                "Vesicular inhibitory amino acid transporter (VIAAT)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "Large neutral amino acid transporter 1 (LAT1)",
            "Large neutral amino acid transporter 2 (LAT2)",
            "Cationic amino acid transporter 1 (CAT1)",
            "Cationic amino acid transporter 2 (CAT2)",
            "Cationic amino acid transporter 3 (CAT3)",
            "Cationic amino acid transporter 4 (CAT4)",
            "Excitatory amino acid transporter 1 (EAAT1)",
            "Excitatory amino acid transporter 2 (EAAT2)",
            "Excitatory amino acid transporter 3 (EAAT3)",
            "Excitatory amino acid transporter 4 (EAAT4)",
            "Excitatory amino acid transporter 5 (EAAT5)",
            "Alanine-serine-cysteine transporter 1 (ASCT1)",
            "Alanine-serine-cysteine transporter 2 (ASCT2)",
            "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
            "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
            "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
            "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
            "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
            "Proton-coupled amino acid transporter 1 (PAT1)",
            "Proton-coupled amino acid transporter 2 (PAT2)",
            "Proton-coupled amino acid transporter 4 (PAT4)",
            "B0 amino acid transporter 1 (B0AT1)",
            "B0 amino acid transporter 2 (B0AT2)",
            "y+L amino acid transporter 1 (y+LAT1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Large neutral amino acid transporter 1 (LAT1)",
                "Large neutral amino acid transporter 2 (LAT2)",
                "Cationic amino acid transporter 1 (CAT1)",
                "Cationic amino acid transporter 2 (CAT2)",
                "Cationic amino acid transporter 3 (CAT3)",
                "Cationic amino acid transporter 4 (CAT4)",
                "Excitatory amino acid transporter 1 (EAAT1)",
                "Excitatory amino acid transporter 2 (EAAT2)",
                "Excitatory amino acid transporter 3 (EAAT3)",
                "Excitatory amino acid transporter 4 (EAAT4)",
                "Excitatory amino acid transporter 5 (EAAT5)",
                "Alanine-serine-cysteine transporter 1 (ASCT1)",
                "Alanine-serine-cysteine transporter 2 (ASCT2)",
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
                "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
                "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
                "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
                "Proton-coupled amino acid transporter 1 (PAT1)",
                "Proton-coupled amino acid transporter 2 (PAT2)",
                "Proton-coupled amino acid transporter 4 (PAT4)",
                "B0 amino acid transporter 1 (B0AT1)",
                "B0 amino acid transporter 2 (B0AT2)",
                "y+L amino acid transporter 1 (y+LAT1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine-serine-cysteine transporter 1 (ASCT1)",
                "Alanine-serine-cysteine transporter 2 (ASCT2)",
                "B0 amino acid transporter 1 (B0AT1)",
                "B0 amino acid transporter 2 (B0AT2)",
                "Cationic amino acid transporter 1 (CAT1)",
                "Cationic amino acid transporter 2 (CAT2)",
                "Cationic amino acid transporter 3 (CAT3)",
                "Cationic amino acid transporter 4 (CAT4)",
                "Excitatory amino acid transporter 1 (EAAT1)",
                "Excitatory amino acid transporter 2 (EAAT2)",
                "Excitatory amino acid transporter 3 (EAAT3)",
                "Excitatory amino acid transporter 4 (EAAT4)",
                "Excitatory amino acid transporter 5 (EAAT5)",
                "Large neutral amino acid transporter 1 (LAT1)",
                "Large neutral amino acid transporter 2 (LAT2)",
                "Proton-coupled amino acid transporter 1 (PAT1)",
                "Proton-coupled amino acid transporter 2 (PAT2)",
                "Proton-coupled amino acid transporter 4 (PAT4)",
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
                "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
                "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
                "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
                "y+L amino acid transporter 1 (y+LAT1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "System ASC amino acid transporter (ASC)",
            "Cationic amino acid transporter 1 (CAT1)",
            "L-type amino acid transporter 1 (LAT1)",
            "y+L amino acid transporter 1 (y+LAT1)",
            "Alanine-serine-cysteine transporter 1 (ASCT1)",
            "Glycoprotein-associated amino acid transporter (gpaAT)",
            "Proton-assisted amino acid transporter 1 (PAT1)",
            "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
            "Cystine/glutamate antiporter (xCT)",
            "Heteromeric amino acid transporter (HAT)",
            "Amino acid transporter B0AT1 (B0AT1)",
            "Amino acid transporter B0AT3 (B0AT3)",
            "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
            "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
            "Sodium-coupled neutral amino acid transporter 7 (SNAT7)",
            "Proton-assisted amino acid transporter 2 (PAT2)",
            "Proton-assisted amino acid transporter 3 (PAT3)",
            "Proton-assisted amino acid transporter 4 (PAT4)",
            "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
            "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
            "Sodium-coupled neutral amino acid transporter 6 (SNAT6)",
            "Amino acid transporter ATB0,+",
            "Amino acid transporter AGT1",
            "Amino acid transporter TA1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "System ASC amino acid transporter (ASC)",
                "Cationic amino acid transporter 1 (CAT1)",
                "L-type amino acid transporter 1 (LAT1)",
                "y+L amino acid transporter 1 (y+LAT1)",
                "Alanine-serine-cysteine transporter 1 (ASCT1)",
                "Glycoprotein-associated amino acid transporter (gpaAT)",
                "Proton-assisted amino acid transporter 1 (PAT1)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
                "Cystine/glutamate antiporter (xCT)",
                "Heteromeric amino acid transporter (HAT)",
                "Amino acid transporter B0AT1 (B0AT1)",
                "Amino acid transporter B0AT3 (B0AT3)",
                "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
                "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
                "Sodium-coupled neutral amino acid transporter 7 (SNAT7)",
                "Proton-assisted amino acid transporter 2 (PAT2)",
                "Proton-assisted amino acid transporter 3 (PAT3)",
                "Proton-assisted amino acid transporter 4 (PAT4)",
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
                "Sodium-coupled neutral amino acid transporter 6 (SNAT6)",
                "Amino acid transporter ATB0,+",
                "Amino acid transporter AGT1",
                "Amino acid transporter TA1"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine-serine-cysteine transporter 1 (ASCT1)",
                "Amino acid transporter AGT1",
                "Amino acid transporter ATB0,+",
                "Amino acid transporter B0AT1 (B0AT1)",
                "Amino acid transporter B0AT3 (B0AT3)",
                "Amino acid transporter TA1",
                "Cationic amino acid transporter 1 (CAT1)",
                "Cystine/glutamate antiporter (xCT)",
                "Glycoprotein-associated amino acid transporter (gpaAT)",
                "Heteromeric amino acid transporter (HAT)",
                "L-type amino acid transporter 1 (LAT1)",
                "Proton-assisted amino acid transporter 1 (PAT1)",
                "Proton-assisted amino acid transporter 2 (PAT2)",
                "Proton-assisted amino acid transporter 3 (PAT3)",
                "Proton-assisted amino acid transporter 4 (PAT4)",
                "Sodium-coupled neutral amino acid transporter 1 (SNAT1)",
                "Sodium-coupled neutral amino acid transporter 2 (SNAT2)",
                "Sodium-coupled neutral amino acid transporter 3 (SNAT3)",
                "Sodium-coupled neutral amino acid transporter 4 (SNAT4)",
                "Sodium-coupled neutral amino acid transporter 5 (SNAT5)",
                "Sodium-coupled neutral amino acid transporter 6 (SNAT6)",
                "Sodium-coupled neutral amino acid transporter 7 (SNAT7)",
                "System ASC amino acid transporter (ASC)",
                "y+L amino acid transporter 1 (y+LAT1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "Alanine Transporter (SNAT2)",
            "Arginine Transporter (CAT1)",
            "Asparagine Transporter (ASCT2)",
            "Aspartate Transporter (EAAT1)",
            "Cysteine Transporter (xCT)",
            "Glutamate Transporter (EAAT2)",
            "Glutamine Transporter (SNAT3)",
            "Glycine Transporter (GLYT1)",
            "Histidine Transporter (CAT2)",
            "Isoleucine Transporter (LAT1)",
            "Leucine Transporter (LAT1)",
            "Lysine Transporter (CAT1)",
            "Methionine Transporter (LAT1)",
            "Ornithine Transporter (CAT1)",
            "Phenylalanine Transporter (LAT1)",
            "Proline Transporter (SNAT2)",
            "Serine Transporter (ASCT2)",
            "Taurine Transporter (TauT)",
            "Threonine Transporter (SNAT2)",
            "Tryptophan Transporter (LAT1)",
            "Tyrosine Transporter (LAT1)",
            "Valine Transporter (LAT1)",
            "Cationic Amino Acid Transporter (CAT1)",
            "Neutral Amino Acid Transporter (ASCT2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine Transporter (SNAT2)",
                "Arginine Transporter (CAT1)",
                "Asparagine Transporter (ASCT2)",
                "Aspartate Transporter (EAAT1)",
                "Cysteine Transporter (xCT)",
                "Glutamate Transporter (EAAT2)",
                "Glutamine Transporter (SNAT3)",
                "Glycine Transporter (GLYT1)",
                "Histidine Transporter (CAT2)",
                "Isoleucine Transporter (LAT1)",
                "Leucine Transporter (LAT1)",
                "Lysine Transporter (CAT1)",
                "Methionine Transporter (LAT1)",
                "Ornithine Transporter (CAT1)",
                "Phenylalanine Transporter (LAT1)",
                "Proline Transporter (SNAT2)",
                "Serine Transporter (ASCT2)",
                "Taurine Transporter (TauT)",
                "Threonine Transporter (SNAT2)",
                "Tryptophan Transporter (LAT1)",
                "Tyrosine Transporter (LAT1)",
                "Valine Transporter (LAT1)",
                "Cationic Amino Acid Transporter (CAT1)",
                "Neutral Amino Acid Transporter (ASCT2)"
            ],
            "mismatches": [
                "Histidine Transporter (CAT2)"
            ],
            "true_referents": [
                "Alanine Transporter (SNAT2)",
                "Arginine Transporter (CAT1)",
                "Asparagine Transporter (ASCT2)",
                "Aspartate Transporter (EAAT1)",
                "Cationic Amino Acid Transporter (CAT1)",
                "Cysteine Transporter (xCT)",
                "Glutamate Transporter (EAAT2)",
                "Glutamine Transporter (SNAT3)",
                "Glycine Transporter (GLYT1)",
                "Histidine Transporter (CAT2)",
                "Isoleucine Transporter (LAT1)",
                "Leucine Transporter (LAT1)",
                "Lysine Transporter (CAT1)",
                "Methionine Transporter (LAT1)",
                "Neutral Amino Acid Transporter (ASCT2)",
                "Ornithine Transporter (CAT1)",
                "Phenylalanine Transporter (LAT1)",
                "Proline Transporter (SNAT2)",
                "Serine Transporter (ASCT2)",
                "Taurine Transporter (TauT)",
                "Threonine Transporter (SNAT2)",
                "Tryptophan Transporter (LAT1)",
                "Tyrosine Transporter (LAT1)",
                "Valine Transporter (LAT1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "SLC1A5 (ATM1) in human placenta (1)",
            "SLC6A19 in human liver (2)",
            "SLC7A5 in human kidney (3)",
            "SLC7A8 in human brain (4)",
            "SLC22A2 in human liver (5)",
            "SLC22A6 in human kidney (6)",
            "SLC25A12 in human liver (7)",
            "SLC25A15 in human placenta (8)",
            "SLC25A22 in human brain (9)",
            "SLC25A23 in human kidney (10)",
            "SLC25A24 in human liver (11)",
            "SLC25A25 in human placenta (12)",
            "SLC25A26 in human brain (13)",
            "SLC25A27 in human kidney (14)",
            "SLC25A28 in human liver (15)",
            "SLC25A29 in human placenta (16)",
            "SLC25A30 in human brain (17)",
            "SLC25A31 in human kidney (18)",
            "SLC25A32 in human liver (19)",
            "SLC25A33 in human placenta (20)",
            "SLC25A34 in human brain (21)",
            "SLC25A35 in human kidney (22)",
            "SLC25A36 in human liver (23)",
            "SLC25A37 in human placenta (24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "SLC1A5 (ATM1) in human placenta (1)",
                "SLC6A19 in human liver (2)",
                "SLC7A5 in human kidney (3)",
                "SLC7A8 in human brain (4)",
                "SLC22A2 in human liver (5)",
                "SLC22A6 in human kidney (6)",
                "SLC25A12 in human liver (7)",
                "SLC25A15 in human placenta (8)",
                "SLC25A22 in human brain (9)",
                "SLC25A23 in human kidney (10)",
                "SLC25A24 in human liver (11)",
                "SLC25A25 in human placenta (12)",
                "SLC25A26 in human brain (13)",
                "SLC25A27 in human kidney (14)",
                "SLC25A28 in human liver (15)",
                "SLC25A29 in human placenta (16)",
                "SLC25A30 in human brain (17)",
                "SLC25A31 in human kidney (18)",
                "SLC25A32 in human liver (19)",
                "SLC25A33 in human placenta (20)",
                "SLC25A34 in human brain (21)",
                "SLC25A35 in human kidney (22)",
                "SLC25A36 in human liver (23)",
                "SLC25A37 in human placenta (24)"
            ],
            "mismatches": [],
            "true_referents": [
                "SLC1A5 (ATM1) in human placenta (1)",
                "SLC22A2 in human liver (5)",
                "SLC22A6 in human kidney (6)",
                "SLC25A12 in human liver (7)",
                "SLC25A15 in human placenta (8)",
                "SLC25A22 in human brain (9)",
                "SLC25A23 in human kidney (10)",
                "SLC25A24 in human liver (11)",
                "SLC25A25 in human placenta (12)",
                "SLC25A26 in human brain (13)",
                "SLC25A27 in human kidney (14)",
                "SLC25A28 in human liver (15)",
                "SLC25A29 in human placenta (16)",
                "SLC25A30 in human brain (17)",
                "SLC25A31 in human kidney (18)",
                "SLC25A32 in human liver (19)",
                "SLC25A33 in human placenta (20)",
                "SLC25A34 in human brain (21)",
                "SLC25A35 in human kidney (22)",
                "SLC25A36 in human liver (23)",
                "SLC25A37 in human placenta (24)",
                "SLC6A19 in human liver (2)",
                "SLC7A5 in human kidney (3)",
                "SLC7A8 in human brain (4)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            "4F2hc (SLC3A2)",
            "AGT1 (SLC7A7)",
            "ASCT1 (SLC1A4)",
            "ASCT2 (SLC1A5)",
            "ATA1 (SLC16A1)",
            "ATA2 (SLC16A2)",
            "B(0,+)-type amino acid transporter (SLC6A20)",
            "B(0)-type amino acid transporter (SLC6A18)",
            "Beta/GABA transporter (SLC6A12)",
            "CAT-1 (SLC7A1)",
            "CAT-2 (SLC7A2)",
            "CAT-3 (SLC7A3)",
            "CAT-4 (SLC7A4)",
            "CD98hc (SLC3A2)",
            "EAAT1 (SLC1A3)",
            "EAAT2 (SLC1A2)",
            "EAAT3 (SLC1A1)",
            "EAAT4 (SLC1A6)",
            "EAAT5 (SLC1A7)",
            "GAT-1 (SLC6A1)",
            "GAT-2 (SLC6A2)",
            "GAT-3 (SLC6A3)",
            "GAT-4 (SLC6A4)",
            "LAT1 (SLC7A5)",
            "LAT2 (SLC7A8)",
            "Proline transporter (SLC6A19)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "4F2hc (SLC3A2)",
                "AGT1 (SLC7A7)",
                "ASCT1 (SLC1A4)",
                "ASCT2 (SLC1A5)",
                "ATA1 (SLC16A1)",
                "ATA2 (SLC16A2)",
                "B(0,+)-type amino acid transporter (SLC6A20)",
                "B(0)-type amino acid transporter (SLC6A18)",
                "Beta/GABA transporter (SLC6A12)",
                "CAT-1 (SLC7A1)",
                "CAT-2 (SLC7A2)",
                "CAT-3 (SLC7A3)",
                "CAT-4 (SLC7A4)",
                "CD98hc (SLC3A2)",
                "EAAT1 (SLC1A3)",
                "EAAT2 (SLC1A2)",
                "EAAT3 (SLC1A1)",
                "EAAT4 (SLC1A6)",
                "EAAT5 (SLC1A7)",
                "GAT-1 (SLC6A1)",
                "GAT-2 (SLC6A2)",
                "GAT-3 (SLC6A3)",
                "GAT-4 (SLC6A4)",
                "LAT1 (SLC7A5)"
            ],
            "mismatches": [
                "LAT2 (SLC7A8)",
                "Proline transporter (SLC6A19)"
            ],
            "true_referents": [
                "4F2hc (SLC3A2)",
                "AGT1 (SLC7A7)",
                "ASCT1 (SLC1A4)",
                "ASCT2 (SLC1A5)",
                "ATA1 (SLC16A1)",
                "ATA2 (SLC16A2)",
                "B(0)-type amino acid transporter (SLC6A18)",
                "B(0,+)-type amino acid transporter (SLC6A20)",
                "Beta/GABA transporter (SLC6A12)",
                "CAT-1 (SLC7A1)",
                "CAT-2 (SLC7A2)",
                "CAT-3 (SLC7A3)",
                "CAT-4 (SLC7A4)",
                "CD98hc (SLC3A2)",
                "EAAT1 (SLC1A3)",
                "EAAT2 (SLC1A2)",
                "EAAT3 (SLC1A1)",
                "EAAT4 (SLC1A6)",
                "EAAT5 (SLC1A7)",
                "GAT-1 (SLC6A1)",
                "GAT-2 (SLC6A2)",
                "GAT-3 (SLC6A3)",
                "GAT-4 (SLC6A4)",
                "LAT1 (SLC7A5)"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "plasma membrane amino acid transporter",
        "domain": "biology",
        "response": [
            {
                "Referent": "Apolipoprotein E receptor 2 (ApoER2)",
                "Identifier": "ApoER2"
            },
            {
                "Referent": "Breast cancer resistance protein (BCRP)",
                "Identifier": "BCRP"
            },
            {
                "Referent": "Cationic amino acid transporter 1 (CAT1)",
                "Identifier": "CAT1"
            },
            {
                "Referent": "Cationic amino acid transporter 2 (CAT2)",
                "Identifier": "CAT2"
            },
            {
                "Referent": "Cationic amino acid transporter 3 (CAT3)",
                "Identifier": "CAT3"
            },
            {
                "Referent": "Cationic amino acid transporter 4 (CAT4)",
                "Identifier": "CAT4"
            },
            {
                "Referent": "Cationic amino acid transporter 5 (CAT5)",
                "Identifier": "CAT5"
            },
            {
                "Referent": "Cationic amino acid transporter 6 (CAT6)",
                "Identifier": "CAT6"
            },
            {
                "Referent": "Cationic amino acid transporter 7 (CAT7)",
                "Identifier": "CAT7"
            },
            {
                "Referent": "Cationic amino acid transporter 8 (CAT8)",
                "Identifier": "CAT8"
            },
            {
                "Referent": "Cationic amino acid transporter 9 (CAT9)",
                "Identifier": "CAT9"
            },
            {
                "Referent": "Cationic amino acid transporter 10 (CAT10)",
                "Identifier": "CAT10"
            },
            {
                "Referent": "Cationic amino acid transporter 11 (CAT11)",
                "Identifier": "CAT11"
            },
            {
                "Referent": "Cationic amino acid transporter 12 (CAT12)",
                "Identifier": "CAT12"
            },
            {
                "Referent": "Cationic amino acid transporter 13 (CAT13)",
                "Identifier": "CAT13"
            },
            {
                "Referent": "Cationic amino acid transporter 14 (CAT14)",
                "Identifier": "CAT14"
            },
            {
                "Referent": "Cationic amino acid transporter 15 (CAT15)",
                "Identifier": "CAT15"
            },
            {
                "Referent": "Cationic amino acid transporter 16 (CAT16)",
                "Identifier": "CAT16"
            },
            {
                "Referent": "Cationic amino acid transporter 17 (CAT17)",
                "Identifier": "CAT17"
            },
            {
                "Referent": "Cationic amino acid transporter 18 (CAT18)",
                "Identifier": "CAT18"
            },
            {
                "Referent": "Cationic amino acid transporter 19 (CAT19)",
                "Identifier": "CAT19"
            },
            {
                "Referent": "Cationic amino acid transporter 20 (CAT20)",
                "Identifier": "CAT20"
            },
            {
                "Referent": "Cationic amino acid transporter 21 (CAT21)",
                "Identifier": "CAT21"
            },
            {
                "Referent": "Cationic amino acid transporter 22 (CAT22)",
                "Identifier": "CAT22"
            },
            {
                "Referent": "Cationic amino acid transporter 23 (CAT23)",
                "Identifier": "CAT23"
            },
            {
                "Referent": "Cationic amino acid transporter 24 (CAT24)",
                "Identifier": "CAT24"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Apolipoprotein E receptor 2 (ApoER2)",
                "Breast cancer resistance protein (BCRP)",
                "Cationic amino acid transporter 1 (CAT1)",
                "Cationic amino acid transporter 2 (CAT2)",
                "Cationic amino acid transporter 3 (CAT3)",
                "Cationic amino acid transporter 4 (CAT4)",
                "Cationic amino acid transporter 5 (CAT5)",
                "Cationic amino acid transporter 6 (CAT6)",
                "Cationic amino acid transporter 7 (CAT7)",
                "Cationic amino acid transporter 8 (CAT8)",
                "Cationic amino acid transporter 9 (CAT9)",
                "Cationic amino acid transporter 10 (CAT10)",
                "Cationic amino acid transporter 11 (CAT11)",
                "Cationic amino acid transporter 12 (CAT12)",
                "Cationic amino acid transporter 13 (CAT13)",
                "Cationic amino acid transporter 14 (CAT14)",
                "Cationic amino acid transporter 15 (CAT15)",
                "Cationic amino acid transporter 16 (CAT16)",
                "Cationic amino acid transporter 17 (CAT17)",
                "Cationic amino acid transporter 18 (CAT18)",
                "Cationic amino acid transporter 19 (CAT19)",
                "Cationic amino acid transporter 20 (CAT20)",
                "Cationic amino acid transporter 21 (CAT21)",
                "Cationic amino acid transporter 22 (CAT22)"
            ],
            "mismatches": [
                "Cationic amino acid transporter 23 (CAT23)",
                "Cationic amino acid transporter 24 (CAT24)"
            ],
            "true_referents": [
                "{\"Referent\": \"Apolipoprotein E receptor 2 (ApoER2)\", \"Identifier\": \"ApoER2\"}",
                "{\"Referent\": \"Breast cancer resistance protein (BCRP)\", \"Identifier\": \"BCRP\"}",
                "{\"Referent\": \"Cationic amino acid transporter 1 (CAT1)\", \"Identifier\": \"CAT1\"}",
                "{\"Referent\": \"Cationic amino acid transporter 10 (CAT10)\", \"Identifier\": \"CAT10\"}",
                "{\"Referent\": \"Cationic amino acid transporter 11 (CAT11)\", \"Identifier\": \"CAT11\"}",
                "{\"Referent\": \"Cationic amino acid transporter 12 (CAT12)\", \"Identifier\": \"CAT12\"}",
                "{\"Referent\": \"Cationic amino acid transporter 13 (CAT13)\", \"Identifier\": \"CAT13\"}",
                "{\"Referent\": \"Cationic amino acid transporter 14 (CAT14)\", \"Identifier\": \"CAT14\"}",
                "{\"Referent\": \"Cationic amino acid transporter 15 (CAT15)\", \"Identifier\": \"CAT15\"}",
                "{\"Referent\": \"Cationic amino acid transporter 16 (CAT16)\", \"Identifier\": \"CAT16\"}",
                "{\"Referent\": \"Cationic amino acid transporter 17 (CAT17)\", \"Identifier\": \"CAT17\"}",
                "{\"Referent\": \"Cationic amino acid transporter 18 (CAT18)\", \"Identifier\": \"CAT18\"}",
                "{\"Referent\": \"Cationic amino acid transporter 19 (CAT19)\", \"Identifier\": \"CAT19\"}",
                "{\"Referent\": \"Cationic amino acid transporter 2 (CAT2)\", \"Identifier\": \"CAT2\"}",
                "{\"Referent\": \"Cationic amino acid transporter 20 (CAT20)\", \"Identifier\": \"CAT20\"}",
                "{\"Referent\": \"Cationic amino acid transporter 21 (CAT21)\", \"Identifier\": \"CAT21\"}",
                "{\"Referent\": \"Cationic amino acid transporter 22 (CAT22)\", \"Identifier\": \"CAT22\"}",
                "{\"Referent\": \"Cationic amino acid transporter 3 (CAT3)\", \"Identifier\": \"CAT3\"}",
                "{\"Referent\": \"Cationic amino acid transporter 4 (CAT4)\", \"Identifier\": \"CAT4\"}",
                "{\"Referent\": \"Cationic amino acid transporter 5 (CAT5)\", \"Identifier\": \"CAT5\"}",
                "{\"Referent\": \"Cationic amino acid transporter 6 (CAT6)\", \"Identifier\": \"CAT6\"}",
                "{\"Referent\": \"Cationic amino acid transporter 7 (CAT7)\", \"Identifier\": \"CAT7\"}",
                "{\"Referent\": \"Cationic amino acid transporter 8 (CAT8)\", \"Identifier\": \"CAT8\"}",
                "{\"Referent\": \"Cationic amino acid transporter 9 (CAT9)\", \"Identifier\": \"CAT9\"}"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    }
]