[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-ATP6 (MT-ATP6)",
            "MT-ATP8 (MT-ATP8)",
            "MT-CO1 (MT-CO1)",
            "MT-CO2 (MT-CO2)",
            "MT-CO3 (MT-CO3)",
            "MT-ND1 (MT-ND1)",
            "MT-ND2 (MT-ND2)",
            "MT-ND3 (MT-ND3)",
            "MT-ND4 (MT-ND4)",
            "MT-ND4L (MT-ND4L)",
            "MT-ND5 (MT-ND5)",
            "MT-ND6 (MT-ND6)",
            "MT-CYB (MT-CYB)",
            "MT-ATP8 (MT-ATP8)",
            "MT-RNR1 (MT-RNR1)",
            "MT-RNR2 (MT-RNR2)",
            "MT-TP (MT-TP)",
            "MT-TQ (MT-TQ)",
            "MT-TK (MT-TK)",
            "MT-TV (MT-TV)",
            "MT-TF (MT-TF)",
            "MT-TS1 (MT-TS1)",
            "MT-TS2 (MT-TS2)",
            "MT-TL1 (MT-TL1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-ATP6 (MT-ATP6)",
                "MT-ATP8 (MT-ATP8)",
                "MT-CO1 (MT-CO1)",
                "MT-CO2 (MT-CO2)",
                "MT-CO3 (MT-CO3)",
                "MT-ND1 (MT-ND1)",
                "MT-ND2 (MT-ND2)",
                "MT-ND3 (MT-ND3)",
                "MT-ND4 (MT-ND4)",
                "MT-ND4L (MT-ND4L)",
                "MT-ND5 (MT-ND5)",
                "MT-ND6 (MT-ND6)",
                "MT-CYB (MT-CYB)",
                "MT-RNR1 (MT-RNR1)",
                "MT-RNR2 (MT-RNR2)",
                "MT-TP (MT-TP)",
                "MT-TQ (MT-TQ)",
                "MT-TK (MT-TK)",
                "MT-TV (MT-TV)",
                "MT-TF (MT-TF)",
                "MT-TS1 (MT-TS1)",
                "MT-TS2 (MT-TS2)",
                "MT-TL1 (MT-TL1)"
            ],
            "mismatches": [],
            "true_referents": [
                "MT-ATP6 (MT-ATP6)",
                "MT-ATP8 (MT-ATP8)",
                "MT-CO1 (MT-CO1)",
                "MT-CO2 (MT-CO2)",
                "MT-CO3 (MT-CO3)",
                "MT-CYB (MT-CYB)",
                "MT-ND1 (MT-ND1)",
                "MT-ND2 (MT-ND2)",
                "MT-ND3 (MT-ND3)",
                "MT-ND4 (MT-ND4)",
                "MT-ND4L (MT-ND4L)",
                "MT-ND5 (MT-ND5)",
                "MT-ND6 (MT-ND6)",
                "MT-RNR1 (MT-RNR1)",
                "MT-RNR2 (MT-RNR2)",
                "MT-TF (MT-TF)",
                "MT-TK (MT-TK)",
                "MT-TL1 (MT-TL1)",
                "MT-TP (MT-TP)",
                "MT-TQ (MT-TQ)",
                "MT-TS1 (MT-TS1)",
                "MT-TS2 (MT-TS2)",
                "MT-TV (MT-TV)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "ATP6 (MT-ATP6)",
            "ATP8 (MT-ATP8)",
            "ND1 (MT-ND1)",
            "ND2 (MT-ND2)",
            "ND3 (MT-ND3)",
            "ND4 (MT-ND4)",
            "ND4L (MT-ND4L)",
            "ND5 (MT-ND5)",
            "ND6 (MT-ND6)",
            "CYTB (MT-CYB)",
            "COX1 (MT-CO1)",
            "COX2 (MT-CO2)",
            "COX3 (MT-CO3)",
            "TFAM (MT-TFAM)",
            "ND1 (MT-ND1)",
            "ND2 (MT-ND2)",
            "ND3 (MT-ND3)",
            "ND4 (MT-ND4)",
            "ND4L (MT-ND4L)",
            "ND5 (MT-ND5)",
            "ND6 (MT-ND6)",
            "CYTB (MT-CYB)",
            "COX1 (MT-CO1)",
            "COX2 (MT-CO2)",
            "COX3 (MT-CO3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP6 (MT-ATP6)",
                "ATP8 (MT-ATP8)",
                "ND1 (MT-ND1)",
                "ND2 (MT-ND2)",
                "ND3 (MT-ND3)",
                "ND4 (MT-ND4)",
                "ND4L (MT-ND4L)",
                "ND5 (MT-ND5)",
                "ND6 (MT-ND6)",
                "CYTB (MT-CYB)",
                "COX1 (MT-CO1)",
                "COX2 (MT-CO2)",
                "COX3 (MT-CO3)",
                "TFAM (MT-TFAM)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP6 (MT-ATP6)",
                "ATP8 (MT-ATP8)",
                "COX1 (MT-CO1)",
                "COX2 (MT-CO2)",
                "COX3 (MT-CO3)",
                "CYTB (MT-CYB)",
                "ND1 (MT-ND1)",
                "ND2 (MT-ND2)",
                "ND3 (MT-ND3)",
                "ND4 (MT-ND4)",
                "ND4L (MT-ND4L)",
                "ND5 (MT-ND5)",
                "ND6 (MT-ND6)",
                "TFAM (MT-TFAM)"
            ],
            "TP": 14,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-CO1 (COI)",
            "MT-CO2",
            "MT-CO3",
            "MT-CYB",
            "MT-ATP6",
            "MT-ATP8",
            "MT-ND1",
            "MT-ND2",
            "MT-ND3",
            "MT-ND4",
            "MT-ND4L",
            "MT-ND5",
            "MT-ND6",
            "MT-RNR1",
            "MT-RNR2",
            "MT-TP",
            "MT-TA",
            "MT-TC",
            "MT-TD",
            "MT-TE",
            "MT-TF",
            "MT-TG",
            "MT-TH",
            "MT-TI"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-CO1 (COI)",
                "MT-CO2",
                "MT-CO3",
                "MT-CYB",
                "MT-ATP6",
                "MT-ATP8",
                "MT-ND1",
                "MT-ND2",
                "MT-ND3",
                "MT-ND4",
                "MT-ND4L",
                "MT-ND5",
                "MT-ND6",
                "MT-RNR1",
                "MT-RNR2",
                "MT-TP",
                "MT-TA",
                "MT-TC",
                "MT-TD",
                "MT-TE",
                "MT-TF",
                "MT-TG",
                "MT-TH",
                "MT-TI"
            ],
            "mismatches": [],
            "true_referents": [
                "MT-ATP6",
                "MT-ATP8",
                "MT-CO1 (COI)",
                "MT-CO2",
                "MT-CO3",
                "MT-CYB",
                "MT-ND1",
                "MT-ND2",
                "MT-ND3",
                "MT-ND4",
                "MT-ND4L",
                "MT-ND5",
                "MT-ND6",
                "MT-RNR1",
                "MT-RNR2",
                "MT-TA",
                "MT-TC",
                "MT-TD",
                "MT-TE",
                "MT-TF",
                "MT-TG",
                "MT-TH",
                "MT-TI",
                "MT-TP"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-ATP6 (MT-ATP6)",
            "MT-ATP8 (MT-ATP8)",
            "MT-ATP9 (MT-ATP9)",
            "MT-CO1 (MT-CO1)",
            "MT-CO2 (MT-CO2)",
            "MT-CO3 (MT-CO3)",
            "MT-Cytb (MT-Cytb)",
            "MT-ND1 (MT-ND1)",
            "MT-ND2 (MT-ND2)",
            "MT-ND3 (MT-ND3)",
            "MT-ND4 (MT-ND4)",
            "MT-ND4L (MT-ND4L)",
            "MT-ND5 (MT-ND5)",
            "MT-ND6 (MT-ND6)",
            "MT-RNR1 (MT-RNR1)",
            "MT-RNR2 (MT-RNR2)",
            "MT-TF (MT-TF)",
            "MT-TH (MT-TH)",
            "MT-TL1 (MT-TL1)",
            "MT-TL2 (MT-TL2)",
            "MT-TV (MT-TV)",
            "MT-TW (MT-TW)",
            "MT-TY (MT-TY)",
            "MT-TZ (MT-TZ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-ATP6 (MT-ATP6)",
                "MT-ATP8 (MT-ATP8)",
                "MT-ATP9 (MT-ATP9)",
                "MT-CO1 (MT-CO1)",
                "MT-CO2 (MT-CO2)",
                "MT-CO3 (MT-CO3)",
                "MT-Cytb (MT-Cytb)",
                "MT-ND1 (MT-ND1)",
                "MT-ND2 (MT-ND2)",
                "MT-ND3 (MT-ND3)",
                "MT-ND4 (MT-ND4)",
                "MT-ND4L (MT-ND4L)",
                "MT-ND5 (MT-ND5)",
                "MT-ND6 (MT-ND6)",
                "MT-RNR1 (MT-RNR1)",
                "MT-RNR2 (MT-RNR2)",
                "MT-TF (MT-TF)",
                "MT-TH (MT-TH)",
                "MT-TL1 (MT-TL1)",
                "MT-TL2 (MT-TL2)",
                "MT-TV (MT-TV)",
                "MT-TW (MT-TW)",
                "MT-TY (MT-TY)",
                "MT-TZ (MT-TZ)"
            ],
            "mismatches": [],
            "true_referents": [
                "MT-ATP6 (MT-ATP6)",
                "MT-ATP8 (MT-ATP8)",
                "MT-ATP9 (MT-ATP9)",
                "MT-CO1 (MT-CO1)",
                "MT-CO2 (MT-CO2)",
                "MT-CO3 (MT-CO3)",
                "MT-Cytb (MT-Cytb)",
                "MT-ND1 (MT-ND1)",
                "MT-ND2 (MT-ND2)",
                "MT-ND3 (MT-ND3)",
                "MT-ND4 (MT-ND4)",
                "MT-ND4L (MT-ND4L)",
                "MT-ND5 (MT-ND5)",
                "MT-ND6 (MT-ND6)",
                "MT-RNR1 (MT-RNR1)",
                "MT-RNR2 (MT-RNR2)",
                "MT-TF (MT-TF)",
                "MT-TH (MT-TH)",
                "MT-TL1 (MT-TL1)",
                "MT-TL2 (MT-TL2)",
                "MT-TV (MT-TV)",
                "MT-TW (MT-TW)",
                "MT-TY (MT-TY)",
                "MT-TZ (MT-TZ)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "Cytochrome c oxidase subunit I (MT-CO1)",
            "Cytochrome c oxidase subunit II (MT-CO2)",
            "Cytochrome c oxidase subunit III (MT-CO3)",
            "ATP synthase subunit 6 (MT-ATP6)",
            "ATP synthase subunit 8 (MT-ATP8)",
            "Cytochrome b (MT-CYB)",
            "NADH dehydrogenase subunit 1 (MT-ND1)",
            "NADH dehydrogenase subunit 2 (MT-ND2)",
            "NADH dehydrogenase subunit 3 (MT-ND3)",
            "NADH dehydrogenase subunit 4 (MT-ND4)",
            "NADH dehydrogenase subunit 4L (MT-ND4L)",
            "NADH dehydrogenase subunit 5 (MT-ND5)",
            "NADH dehydrogenase subunit 6 (MT-ND6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytochrome c oxidase subunit I (MT-CO1)",
                "Cytochrome c oxidase subunit II (MT-CO2)",
                "Cytochrome c oxidase subunit III (MT-CO3)",
                "ATP synthase subunit 6 (MT-ATP6)",
                "ATP synthase subunit 8 (MT-ATP8)",
                "Cytochrome b (MT-CYB)",
                "NADH dehydrogenase subunit 1 (MT-ND1)",
                "NADH dehydrogenase subunit 2 (MT-ND2)",
                "NADH dehydrogenase subunit 3 (MT-ND3)",
                "NADH dehydrogenase subunit 4 (MT-ND4)",
                "NADH dehydrogenase subunit 4L (MT-ND4L)",
                "NADH dehydrogenase subunit 5 (MT-ND5)",
                "NADH dehydrogenase subunit 6 (MT-ND6)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase subunit 6 (MT-ATP6)",
                "ATP synthase subunit 8 (MT-ATP8)",
                "Cytochrome b (MT-CYB)",
                "Cytochrome c oxidase subunit I (MT-CO1)",
                "Cytochrome c oxidase subunit II (MT-CO2)",
                "Cytochrome c oxidase subunit III (MT-CO3)",
                "NADH dehydrogenase subunit 1 (MT-ND1)",
                "NADH dehydrogenase subunit 2 (MT-ND2)",
                "NADH dehydrogenase subunit 3 (MT-ND3)",
                "NADH dehydrogenase subunit 4 (MT-ND4)",
                "NADH dehydrogenase subunit 4L (MT-ND4L)",
                "NADH dehydrogenase subunit 5 (MT-ND5)",
                "NADH dehydrogenase subunit 6 (MT-ND6)"
            ],
            "TP": 13,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-ATP6 (MT-ATP6)",
            "MT-CO1 (MT-CO1)",
            "MT-CO2 (MT-CO2)",
            "MT-CYB (MT-CYB)",
            "MT-ND1 (MT-ND1)",
            "MT-ND2 (MT-ND2)",
            "MT-ND3 (MT-ND3)",
            "MT-ND4 (MT-ND4)",
            "MT-ND4L (MT-ND4L)",
            "MT-ND5 (MT-ND5)",
            "MT-ND6 (MT-ND6)",
            "MT-RNR1 (MT-RNR1)",
            "MT-RNR2 (MT-RNR2)",
            "MT-TF (MT-TF)",
            "MT-TH (MT-TH)",
            "MT-TY (MT-TY)",
            "MT-TS (MT-TS)",
            "MT-TL1 (MT-TL1)",
            "MT-TL2 (MT-TL2)",
            "MT-TG (MT-TG)",
            "MT-TP (MT-TP)",
            "MT-TQ (MT-TQ)",
            "MT-TW (MT-TW)",
            "MT-TX (MT-TX)",
            "MT-TZ (MT-TZ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-ATP6 (MT-ATP6)",
                "MT-CO1 (MT-CO1)",
                "MT-CO2 (MT-CO2)",
                "MT-CYB (MT-CYB)",
                "MT-ND1 (MT-ND1)",
                "MT-ND2 (MT-ND2)",
                "MT-ND3 (MT-ND3)",
                "MT-ND4 (MT-ND4)",
                "MT-ND4L (MT-ND4L)",
                "MT-ND5 (MT-ND5)",
                "MT-ND6 (MT-ND6)",
                "MT-RNR1 (MT-RNR1)",
                "MT-RNR2 (MT-RNR2)",
                "MT-TF (MT-TF)",
                "MT-TG (MT-TG)",
                "MT-TH (MT-TH)",
                "MT-TL1 (MT-TL1)",
                "MT-TL2 (MT-TL2)",
                "MT-TP (MT-TP)",
                "MT-TQ (MT-TQ)",
                "MT-TS (MT-TS)",
                "MT-TW (MT-TW)",
                "MT-TX (MT-TX)",
                "MT-TY (MT-TY)"
            ],
            "mismatches": [
                "MT-TZ (MT-TZ)"
            ],
            "true_referents": [
                "MT-ATP6 (MT-ATP6)",
                "MT-CO1 (MT-CO1)",
                "MT-CO2 (MT-CO2)",
                "MT-CYB (MT-CYB)",
                "MT-ND1 (MT-ND1)",
                "MT-ND2 (MT-ND2)",
                "MT-ND3 (MT-ND3)",
                "MT-ND4 (MT-ND4)",
                "MT-ND4L (MT-ND4L)",
                "MT-ND5 (MT-ND5)",
                "MT-ND6 (MT-ND6)",
                "MT-RNR1 (MT-RNR1)",
                "MT-RNR2 (MT-RNR2)",
                "MT-TF (MT-TF)",
                "MT-TG (MT-TG)",
                "MT-TH (MT-TH)",
                "MT-TL1 (MT-TL1)",
                "MT-TL2 (MT-TL2)",
                "MT-TP (MT-TP)",
                "MT-TQ (MT-TQ)",
                "MT-TS (MT-TS)",
                "MT-TW (MT-TW)",
                "MT-TX (MT-TX)",
                "MT-TY (MT-TY)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "ATP synthase F0 subunit 6 (ATP6)",
            "ATP synthase F0 subunit 8 (ATP8)",
            "Cytochrome c oxidase I (COX1)",
            "Cytochrome c oxidase II (COX2)",
            "Cytochrome c oxidase III (COX3)",
            "Cytochrome b (CYTB)",
            "NADH dehydrogenase 1 (ND1)",
            "NADH dehydrogenase 2 (ND2)",
            "NADH dehydrogenase 3 (ND3)",
            "NADH dehydrogenase 4 (ND4)",
            "NADH dehydrogenase 4L (ND4L)",
            "NADH dehydrogenase 5 (ND5)",
            "NADH dehydrogenase 6 (ND6)",
            "Mitochondrially Encoded 12S RNA (MT-RNR1)",
            "Mitochondrially Encoded 16S RNA (MT-RNR2)",
            "Mitochondrially Encoded tRNA Phenylalanine (MT-TF)",
            "Mitochondrially Encoded tRNA Leucine 1 (MT-TL1)",
            "Mitochondrially Encoded tRNA Leucine 2 (MT-TL2)",
            "Mitochondrially Encoded tRNA Isoleucine (MT-TI)",
            "Mitochondrially Encoded tRNA Methionine (MT-TM)",
            "Mitochondrially Encoded tRNA Valine (MT-TV)",
            "Mitochondrially Encoded tRNA Serine 1 (MT-TS1)",
            "Mitochondrially Encoded tRNA Serine 2 (MT-TS2)",
            "Mitochondrially Encoded tRNA Proline (MT-TP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase F0 subunit 6 (ATP6)",
                "ATP synthase F0 subunit 8 (ATP8)",
                "Cytochrome c oxidase I (COX1)",
                "Cytochrome c oxidase II (COX2)",
                "Cytochrome c oxidase III (COX3)",
                "Cytochrome b (CYTB)",
                "NADH dehydrogenase 1 (ND1)",
                "NADH dehydrogenase 2 (ND2)",
                "NADH dehydrogenase 3 (ND3)",
                "NADH dehydrogenase 4 (ND4)",
                "NADH dehydrogenase 4L (ND4L)",
                "NADH dehydrogenase 5 (ND5)",
                "NADH dehydrogenase 6 (ND6)",
                "Mitochondrially Encoded 12S RNA (MT-RNR1)",
                "Mitochondrially Encoded 16S RNA (MT-RNR2)",
                "Mitochondrially Encoded tRNA Phenylalanine (MT-TF)",
                "Mitochondrially Encoded tRNA Leucine 1 (MT-TL1)",
                "Mitochondrially Encoded tRNA Leucine 2 (MT-TL2)",
                "Mitochondrially Encoded tRNA Isoleucine (MT-TI)",
                "Mitochondrially Encoded tRNA Methionine (MT-TM)",
                "Mitochondrially Encoded tRNA Valine (MT-TV)",
                "Mitochondrially Encoded tRNA Serine 1 (MT-TS1)",
                "Mitochondrially Encoded tRNA Serine 2 (MT-TS2)",
                "Mitochondrially Encoded tRNA Proline (MT-TP)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase F0 subunit 6 (ATP6)",
                "ATP synthase F0 subunit 8 (ATP8)",
                "Cytochrome b (CYTB)",
                "Cytochrome c oxidase I (COX1)",
                "Cytochrome c oxidase II (COX2)",
                "Cytochrome c oxidase III (COX3)",
                "Mitochondrially Encoded 12S RNA (MT-RNR1)",
                "Mitochondrially Encoded 16S RNA (MT-RNR2)",
                "Mitochondrially Encoded tRNA Isoleucine (MT-TI)",
                "Mitochondrially Encoded tRNA Leucine 1 (MT-TL1)",
                "Mitochondrially Encoded tRNA Leucine 2 (MT-TL2)",
                "Mitochondrially Encoded tRNA Methionine (MT-TM)",
                "Mitochondrially Encoded tRNA Phenylalanine (MT-TF)",
                "Mitochondrially Encoded tRNA Proline (MT-TP)",
                "Mitochondrially Encoded tRNA Serine 1 (MT-TS1)",
                "Mitochondrially Encoded tRNA Serine 2 (MT-TS2)",
                "Mitochondrially Encoded tRNA Valine (MT-TV)",
                "NADH dehydrogenase 1 (ND1)",
                "NADH dehydrogenase 2 (ND2)",
                "NADH dehydrogenase 3 (ND3)",
                "NADH dehydrogenase 4 (ND4)",
                "NADH dehydrogenase 4L (ND4L)",
                "NADH dehydrogenase 5 (ND5)",
                "NADH dehydrogenase 6 (ND6)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-CO1 (cytochrome c oxidase subunit 1)",
            "MT-CO2 (cytochrome c oxidase subunit 2)",
            "MT-CO3 (cytochrome c oxidase subunit 3)",
            "MT-CYB (cytochrome b)",
            "MT-ND1 (NADH dehydrogenase subunit 1)",
            "MT-ND2 (NADH dehydrogenase subunit 2)",
            "MT-ND3 (NADH dehydrogenase subunit 3)",
            "MT-ND4 (NADH dehydrogenase subunit 4)",
            "MT-ND4L (NADH dehydrogenase subunit 4L)",
            "MT-ND5 (NADH dehydrogenase subunit 5)",
            "MT-ND6 (NADH dehydrogenase subunit 6)",
            "MT-ATP6 (ATP synthase F0 subunit 6)",
            "MT-ATP8 (ATP synthase F0 subunit 8)",
            "MT-RNR1 (12S ribosomal RNA)",
            "MT-RNR2 (16S ribosomal RNA)",
            "MT-TC (tRNA-Cys)",
            "MT-TD (tRNA-Asp)",
            "MT-TE (tRNA-Glu)",
            "MT-TF (tRNA-Phe)",
            "MT-TG (tRNA-Gly)",
            "MT-TH (tRNA-His)",
            "MT-TI (tRNA-Ile)",
            "MT-TK (tRNA-Lys)",
            "MT-TL1 (tRNA-Leu(CUN))",
            "MT-TL2 (tRNA-Leu(UUR))"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-CO1 (cytochrome c oxidase subunit 1)",
                "MT-CO2 (cytochrome c oxidase subunit 2)",
                "MT-CO3 (cytochrome c oxidase subunit 3)",
                "MT-CYB (cytochrome b)",
                "MT-ND1 (NADH dehydrogenase subunit 1)",
                "MT-ND2 (NADH dehydrogenase subunit 2)",
                "MT-ND3 (NADH dehydrogenase subunit 3)",
                "MT-ND4 (NADH dehydrogenase subunit 4)",
                "MT-ND4L (NADH dehydrogenase subunit 4L)",
                "MT-ND5 (NADH dehydrogenase subunit 5)",
                "MT-ND6 (NADH dehydrogenase subunit 6)",
                "MT-ATP6 (ATP synthase F0 subunit 6)",
                "MT-ATP8 (ATP synthase F0 subunit 8)",
                "MT-RNR1 (12S ribosomal RNA)",
                "MT-RNR2 (16S ribosomal RNA)",
                "MT-TC (tRNA-Cys)",
                "MT-TD (tRNA-Asp)",
                "MT-TE (tRNA-Glu)",
                "MT-TF (tRNA-Phe)",
                "MT-TG (tRNA-Gly)",
                "MT-TH (tRNA-His)",
                "MT-TI (tRNA-Ile)",
                "MT-TK (tRNA-Lys)",
                "MT-TL1 (tRNA-Leu(CUN))"
            ],
            "mismatches": [
                "MT-TL2 (tRNA-Leu(UUR))"
            ],
            "true_referents": [
                "MT-ATP6 (ATP synthase F0 subunit 6)",
                "MT-ATP8 (ATP synthase F0 subunit 8)",
                "MT-CO1 (cytochrome c oxidase subunit 1)",
                "MT-CO2 (cytochrome c oxidase subunit 2)",
                "MT-CO3 (cytochrome c oxidase subunit 3)",
                "MT-CYB (cytochrome b)",
                "MT-ND1 (NADH dehydrogenase subunit 1)",
                "MT-ND2 (NADH dehydrogenase subunit 2)",
                "MT-ND3 (NADH dehydrogenase subunit 3)",
                "MT-ND4 (NADH dehydrogenase subunit 4)",
                "MT-ND4L (NADH dehydrogenase subunit 4L)",
                "MT-ND5 (NADH dehydrogenase subunit 5)",
                "MT-ND6 (NADH dehydrogenase subunit 6)",
                "MT-RNR1 (12S ribosomal RNA)",
                "MT-RNR2 (16S ribosomal RNA)",
                "MT-TC (tRNA-Cys)",
                "MT-TD (tRNA-Asp)",
                "MT-TE (tRNA-Glu)",
                "MT-TF (tRNA-Phe)",
                "MT-TG (tRNA-Gly)",
                "MT-TH (tRNA-His)",
                "MT-TI (tRNA-Ile)",
                "MT-TK (tRNA-Lys)",
                "MT-TL1 (tRNA-Leu(CUN))"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-ATP6 (ATP synthase F0 subunit 6)",
            "MT-ATP8 (ATP synthase F0 subunit 8)",
            "MT-CO1 (Cytochrome c oxidase subunit I)",
            "MT-CO2 (Cytochrome c oxidase subunit II)",
            "MT-CO3 (Cytochrome c oxidase subunit III)",
            "MT-CYB (Cytochrome b)",
            "MT-ND1 (NADH dehydrogenase 1)",
            "MT-ND2 (NADH dehydrogenase 2)",
            "MT-ND3 (NADH dehydrogenase 3)",
            "MT-ND4 (NADH dehydrogenase 4)",
            "MT-ND4L (NADH dehydrogenase 4L)",
            "MT-ND5 (NADH dehydrogenase 5)",
            "MT-ND6 (NADH dehydrogenase 6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-ATP6 (ATP synthase F0 subunit 6)",
                "MT-ATP8 (ATP synthase F0 subunit 8)",
                "MT-CO1 (Cytochrome c oxidase subunit I)",
                "MT-CO2 (Cytochrome c oxidase subunit II)",
                "MT-CO3 (Cytochrome c oxidase subunit III)",
                "MT-CYB (Cytochrome b)",
                "MT-ND1 (NADH dehydrogenase 1)",
                "MT-ND2 (NADH dehydrogenase 2)",
                "MT-ND3 (NADH dehydrogenase 3)",
                "MT-ND4 (NADH dehydrogenase 4)",
                "MT-ND4L (NADH dehydrogenase 4L)",
                "MT-ND5 (NADH dehydrogenase 5)",
                "MT-ND6 (NADH dehydrogenase 6)"
            ],
            "mismatches": [],
            "true_referents": [
                "MT-ATP6 (ATP synthase F0 subunit 6)",
                "MT-ATP8 (ATP synthase F0 subunit 8)",
                "MT-CO1 (Cytochrome c oxidase subunit I)",
                "MT-CO2 (Cytochrome c oxidase subunit II)",
                "MT-CO3 (Cytochrome c oxidase subunit III)",
                "MT-CYB (Cytochrome b)",
                "MT-ND1 (NADH dehydrogenase 1)",
                "MT-ND2 (NADH dehydrogenase 2)",
                "MT-ND3 (NADH dehydrogenase 3)",
                "MT-ND4 (NADH dehydrogenase 4)",
                "MT-ND4L (NADH dehydrogenase 4L)",
                "MT-ND5 (NADH dehydrogenase 5)",
                "MT-ND6 (NADH dehydrogenase 6)"
            ],
            "TP": 13,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "ATP6 (MT-ATP6)",
            "ATP8 (MT-ATP8)",
            "COX1 (MT-CO1)",
            "COX2 (MT-CO2)",
            "COX3 (MT-CO3)",
            "CYTB (MT-CYB)",
            "ND1 (MT-ND1)",
            "ND2 (MT-ND2)",
            "ND3 (MT-ND3)",
            "ND4 (MT-ND4)",
            "ND4L (MT-ND4L)",
            "ND5 (MT-ND5)",
            "ND6 (MT-ND6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP6 (MT-ATP6)",
                "ATP8 (MT-ATP8)",
                "COX1 (MT-CO1)",
                "COX2 (MT-CO2)",
                "COX3 (MT-CO3)",
                "CYTB (MT-CYB)",
                "ND1 (MT-ND1)",
                "ND2 (MT-ND2)",
                "ND3 (MT-ND3)",
                "ND4 (MT-ND4)",
                "ND4L (MT-ND4L)",
                "ND5 (MT-ND5)",
                "ND6 (MT-ND6)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP6 (MT-ATP6)",
                "ATP8 (MT-ATP8)",
                "COX1 (MT-CO1)",
                "COX2 (MT-CO2)",
                "COX3 (MT-CO3)",
                "CYTB (MT-CYB)",
                "ND1 (MT-ND1)",
                "ND2 (MT-ND2)",
                "ND3 (MT-ND3)",
                "ND4 (MT-ND4)",
                "ND4L (MT-ND4L)",
                "ND5 (MT-ND5)",
                "ND6 (MT-ND6)"
            ],
            "TP": 13,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-ATP6 (ATP6)",
            "MT-ATP8 (ATP8)",
            "MT-CO1 (COX1)",
            "MT-CO2 (COX2)",
            "MT-CO3 (COX3)",
            "MT-CYB (CYTB)",
            "MT-ND1 (ND1)",
            "MT-ND2 (ND2)",
            "MT-ND3 (ND3)",
            "MT-ND4 (ND4)",
            "MT-ND4L (ND4L)",
            "MT-ND5 (ND5)",
            "MT-ND6 (ND6)",
            "MT-RNR1 (12S rRNA)",
            "MT-RNR2 (16S rRNA)",
            "MT-TA (tRNA-Ala)",
            "MT-TC (tRNA-Cys)",
            "MT-TD (tRNA-Asp)",
            "MT-TE (tRNA-Glu)",
            "MT-TF (tRNA-Phe)",
            "MT-TG (tRNA-Gly)",
            "MT-TH (tRNA-His)",
            "MT-TI (tRNA-Ile)",
            "MT-TK (tRNA-Lys)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-ATP6 (ATP6)",
                "MT-ATP8 (ATP8)",
                "MT-CO1 (COX1)",
                "MT-CO2 (COX2)",
                "MT-CO3 (COX3)",
                "MT-CYB (CYTB)",
                "MT-ND1 (ND1)",
                "MT-ND2 (ND2)",
                "MT-ND3 (ND3)",
                "MT-ND4 (ND4)",
                "MT-ND4L (ND4L)",
                "MT-ND5 (ND5)",
                "MT-ND6 (ND6)",
                "MT-RNR1 (12S rRNA)",
                "MT-RNR2 (16S rRNA)",
                "MT-TA (tRNA-Ala)",
                "MT-TC (tRNA-Cys)",
                "MT-TD (tRNA-Asp)",
                "MT-TE (tRNA-Glu)",
                "MT-TF (tRNA-Phe)",
                "MT-TG (tRNA-Gly)",
                "MT-TH (tRNA-His)",
                "MT-TI (tRNA-Ile)",
                "MT-TK (tRNA-Lys)"
            ],
            "mismatches": [],
            "true_referents": [
                "MT-ATP6 (ATP6)",
                "MT-ATP8 (ATP8)",
                "MT-CO1 (COX1)",
                "MT-CO2 (COX2)",
                "MT-CO3 (COX3)",
                "MT-CYB (CYTB)",
                "MT-ND1 (ND1)",
                "MT-ND2 (ND2)",
                "MT-ND3 (ND3)",
                "MT-ND4 (ND4)",
                "MT-ND4L (ND4L)",
                "MT-ND5 (ND5)",
                "MT-ND6 (ND6)",
                "MT-RNR1 (12S rRNA)",
                "MT-RNR2 (16S rRNA)",
                "MT-TA (tRNA-Ala)",
                "MT-TC (tRNA-Cys)",
                "MT-TD (tRNA-Asp)",
                "MT-TE (tRNA-Glu)",
                "MT-TF (tRNA-Phe)",
                "MT-TG (tRNA-Gly)",
                "MT-TH (tRNA-His)",
                "MT-TI (tRNA-Ile)",
                "MT-TK (tRNA-Lys)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "NADH dehydrogenase subunit 1 (ND1)",
            "NADH dehydrogenase subunit 2 (ND2)",
            "NADH dehydrogenase subunit 3 (ND3)",
            "NADH dehydrogenase subunit 4 (ND4)",
            "NADH dehydrogenase subunit 4L (ND4L)",
            "NADH dehydrogenase subunit 5 (ND5)",
            "NADH dehydrogenase subunit 6 (ND6)",
            "Cytochrome b (CYTB)",
            "Cytochrome c oxidase subunit 1 (COX1)",
            "Cytochrome c oxidase subunit 2 (COX2)",
            "Cytochrome c oxidase subunit 3 (COX3)",
            "ATP synthase F0 subunit 6 (ATP6)",
            "ATP synthase F0 subunit 8 (ATP8)",
            "Cytochrome c oxidase subunit 4 (COX4)",
            "Cytochrome c oxidase subunit 5A (COX5A)",
            "Cytochrome c oxidase subunit 5B (COX5B)",
            "Cytochrome c oxidase subunit 6A (COX6A)",
            "Cytochrome c oxidase subunit 6B (COX6B)",
            "Cytochrome c oxidase subunit 7A (COX7A)",
            "Cytochrome c oxidase subunit 7B (COX7B)",
            "Cytochrome c oxidase subunit 7C (COX7C)",
            "Cytochrome c oxidase subunit 8A (COX8A)",
            "Cytochrome c oxidase subunit 8B (COX8B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NADH dehydrogenase subunit 1 (ND1)",
                "NADH dehydrogenase subunit 2 (ND2)",
                "NADH dehydrogenase subunit 3 (ND3)",
                "NADH dehydrogenase subunit 4 (ND4)",
                "NADH dehydrogenase subunit 4L (ND4L)",
                "NADH dehydrogenase subunit 5 (ND5)",
                "NADH dehydrogenase subunit 6 (ND6)",
                "Cytochrome b (CYTB)",
                "Cytochrome c oxidase subunit 1 (COX1)",
                "Cytochrome c oxidase subunit 2 (COX2)",
                "Cytochrome c oxidase subunit 3 (COX3)",
                "ATP synthase F0 subunit 6 (ATP6)",
                "ATP synthase F0 subunit 8 (ATP8)",
                "Cytochrome c oxidase subunit 4 (COX4)",
                "Cytochrome c oxidase subunit 5A (COX5A)",
                "Cytochrome c oxidase subunit 5B (COX5B)",
                "Cytochrome c oxidase subunit 6A (COX6A)",
                "Cytochrome c oxidase subunit 6B (COX6B)",
                "Cytochrome c oxidase subunit 7A (COX7A)",
                "Cytochrome c oxidase subunit 7B (COX7B)",
                "Cytochrome c oxidase subunit 7C (COX7C)",
                "Cytochrome c oxidase subunit 8A (COX8A)",
                "Cytochrome c oxidase subunit 8B (COX8B)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase F0 subunit 6 (ATP6)",
                "ATP synthase F0 subunit 8 (ATP8)",
                "Cytochrome b (CYTB)",
                "Cytochrome c oxidase subunit 1 (COX1)",
                "Cytochrome c oxidase subunit 2 (COX2)",
                "Cytochrome c oxidase subunit 3 (COX3)",
                "Cytochrome c oxidase subunit 4 (COX4)",
                "Cytochrome c oxidase subunit 5A (COX5A)",
                "Cytochrome c oxidase subunit 5B (COX5B)",
                "Cytochrome c oxidase subunit 6A (COX6A)",
                "Cytochrome c oxidase subunit 6B (COX6B)",
                "Cytochrome c oxidase subunit 7A (COX7A)",
                "Cytochrome c oxidase subunit 7B (COX7B)",
                "Cytochrome c oxidase subunit 7C (COX7C)",
                "Cytochrome c oxidase subunit 8A (COX8A)",
                "Cytochrome c oxidase subunit 8B (COX8B)",
                "NADH dehydrogenase subunit 1 (ND1)",
                "NADH dehydrogenase subunit 2 (ND2)",
                "NADH dehydrogenase subunit 3 (ND3)",
                "NADH dehydrogenase subunit 4 (ND4)",
                "NADH dehydrogenase subunit 4L (ND4L)",
                "NADH dehydrogenase subunit 5 (ND5)",
                "NADH dehydrogenase subunit 6 (ND6)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "Cytochrome c Oxidase Subunit I (COX1)",
            "Cytochrome c Oxidase Subunit II (COX2)",
            "Cytochrome c Oxidase Subunit III (COX3)",
            "NADH Dehydrogenase Subunit 1 (ND1)",
            "NADH Dehydrogenase Subunit 2 (ND2)",
            "NADH Dehydrogenase Subunit 3 (ND3)",
            "NADH Dehydrogenase Subunit 4 (ND4)",
            "NADH Dehydrogenase Subunit 4L (ND4L)",
            "NADH Dehydrogenase Subunit 5 (ND5)",
            "NADH Dehydrogenase Subunit 6 (ND6)",
            "ATP Synthase F0 Subunit 6 (ATP6)",
            "ATP Synthase F0 Subunit 8 (ATP8)",
            "Cytochrome b (CYTB)",
            "12S Ribosomal RNA (12S rRNA)",
            "16S Ribosomal RNA (16S rRNA)",
            "Displacement Loop (D-Loop)",
            "Mitochondrial Transcription Factor A (TFAM)",
            "Mitochondrial Transcription Termination Factor (mTERF)",
            "Mitochondrial DNA Polymerase Gamma (POLG)",
            "Mitochondrial Transcription Factor B1 (TFB1M)",
            "Mitochondrial Transcription Factor B2 (TFB2M)",
            "Mitochondrial Ribosomal Protein L12 (MRPL12)",
            "Mitochondrial Ribosomal Protein S12 (MRPS12)",
            "Mitochondrial Ribosomal Protein L3 (MRPL3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytochrome c Oxidase Subunit I (COX1)",
                "Cytochrome c Oxidase Subunit II (COX2)",
                "Cytochrome c Oxidase Subunit III (COX3)",
                "NADH Dehydrogenase Subunit 1 (ND1)",
                "NADH Dehydrogenase Subunit 2 (ND2)",
                "NADH Dehydrogenase Subunit 3 (ND3)",
                "NADH Dehydrogenase Subunit 4 (ND4)",
                "NADH Dehydrogenase Subunit 4L (ND4L)",
                "NADH Dehydrogenase Subunit 5 (ND5)",
                "NADH Dehydrogenase Subunit 6 (ND6)",
                "ATP Synthase F0 Subunit 6 (ATP6)",
                "ATP Synthase F0 Subunit 8 (ATP8)",
                "Cytochrome b (CYTB)",
                "12S Ribosomal RNA (12S rRNA)",
                "16S Ribosomal RNA (16S rRNA)",
                "Displacement Loop (D-Loop)",
                "Mitochondrial Transcription Factor A (TFAM)",
                "Mitochondrial Transcription Termination Factor (mTERF)",
                "Mitochondrial DNA Polymerase Gamma (POLG)",
                "Mitochondrial Transcription Factor B1 (TFB1M)",
                "Mitochondrial Transcription Factor B2 (TFB2M)",
                "Mitochondrial Ribosomal Protein L12 (MRPL12)",
                "Mitochondrial Ribosomal Protein S12 (MRPS12)",
                "Mitochondrial Ribosomal Protein L3 (MRPL3)"
            ],
            "mismatches": [],
            "true_referents": [
                "12S Ribosomal RNA (12S rRNA)",
                "16S Ribosomal RNA (16S rRNA)",
                "ATP Synthase F0 Subunit 6 (ATP6)",
                "ATP Synthase F0 Subunit 8 (ATP8)",
                "Cytochrome b (CYTB)",
                "Cytochrome c Oxidase Subunit I (COX1)",
                "Cytochrome c Oxidase Subunit II (COX2)",
                "Cytochrome c Oxidase Subunit III (COX3)",
                "Displacement Loop (D-Loop)",
                "Mitochondrial DNA Polymerase Gamma (POLG)",
                "Mitochondrial Ribosomal Protein L12 (MRPL12)",
                "Mitochondrial Ribosomal Protein L3 (MRPL3)",
                "Mitochondrial Ribosomal Protein S12 (MRPS12)",
                "Mitochondrial Transcription Factor A (TFAM)",
                "Mitochondrial Transcription Factor B1 (TFB1M)",
                "Mitochondrial Transcription Factor B2 (TFB2M)",
                "Mitochondrial Transcription Termination Factor (mTERF)",
                "NADH Dehydrogenase Subunit 1 (ND1)",
                "NADH Dehydrogenase Subunit 2 (ND2)",
                "NADH Dehydrogenase Subunit 3 (ND3)",
                "NADH Dehydrogenase Subunit 4 (ND4)",
                "NADH Dehydrogenase Subunit 4L (ND4L)",
                "NADH Dehydrogenase Subunit 5 (ND5)",
                "NADH Dehydrogenase Subunit 6 (ND6)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "Mitochondrial DNA gene MT-RNR1 (Mitochondrial RNA Ribosomal Protein 1) (MT-RNR1)",
            "Mitochondrial DNA gene MT-TL1 (Mitochondrial Transfer RNA Leucine 1) (MT-TL1)",
            "Mitochondrial DNA gene MT-TK (Mitochondrial Thymidine Kinase) (MT-TK)",
            "Mitochondrial DNA gene MT-ND1 (Mitochondrial NADH Dehydrogenase 1) (MT-ND1)",
            "Mitochondrial DNA gene MT-ND2 (Mitochondrial NADH Dehydrogenase 2) (MT-ND2)",
            "Mitochondrial DNA gene MT-ND3 (Mitochondrial NADH Dehydrogenase 3) (MT-ND3)",
            "Mitochondrial DNA gene MT-ND4 (Mitochondrial NADH Dehydrogenase 4) (MT-ND4)",
            "Mitochondrial DNA gene MT-ND4L (Mitochondrial NADH Dehydrogenase 4L) (MT-ND4L)",
            "Mitochondrial DNA gene MT-ND5 (Mitochondrial NADH Dehydrogenase 5) (MT-ND5)",
            "Mitochondrial DNA gene MT-ND6 (Mitochondrial NADH Dehydrogenase 6) (MT-ND6)",
            "Mitochondrial DNA gene MT-CO1 (Mitochondrial Cytochrome Oxidase 1) (MT-CO1)",
            "Mitochondrial DNA gene MT-CO2 (Mitochondrial Cytochrome Oxidase 2) (MT-CO2)",
            "Mitochondrial DNA gene MT-CO3 (Mitochondrial Cytochrome Oxidase 3) (MT-CO3)",
            "Mitochondrial DNA gene MT-CYB (Mitochondrial Cytochrome B) (MT-CYB)",
            "Mitochondrial DNA gene MT-ATP6 (Mitochondrial ATP Synthase 6) (MT-ATP6)",
            "Mitochondrial DNA gene MT-ATP8 (Mitochondrial ATP Synthase 8) (MT-ATP8)",
            "Mitochondrial DNA gene MT-TW (Mitochondrial T-RNA Tyrosine) (MT-TW)",
            "Mitochondrial DNA gene MT-TV (Mitochondrial T-RNA Valine) (MT-TV)",
            "Mitochondrial DNA gene MT-TH (Mitochondrial T-RNA Histidine) (MT-TH)",
            "Mitochondrial DNA gene MT-TM (Mitochondrial T-RNA Methionine) (MT-TM)",
            "Mitochondrial DNA gene MT-TK2 (Mitochondrial Thymidine Kinase 2) (MT-TK2)",
            "Mitochondrial DNA gene MT-RNR2 (Mitochondrial RNA Ribosomal Protein 2) (MT-RNR2)",
            "Mitochondrial DNA gene MT-RNR3 (Mitochondrial RNA Ribosomal Protein 3) (MT-RNR3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Mitochondrial DNA gene MT-RNR1 (Mitochondrial RNA Ribosomal Protein 1) (MT-RNR1)",
                "Mitochondrial DNA gene MT-TL1 (Mitochondrial Transfer RNA Leucine 1) (MT-TL1)",
                "Mitochondrial DNA gene MT-TK (Mitochondrial Thymidine Kinase) (MT-TK)",
                "Mitochondrial DNA gene MT-ND1 (Mitochondrial NADH Dehydrogenase 1) (MT-ND1)",
                "Mitochondrial DNA gene MT-ND2 (Mitochondrial NADH Dehydrogenase 2) (MT-ND2)",
                "Mitochondrial DNA gene MT-ND3 (Mitochondrial NADH Dehydrogenase 3) (MT-ND3)",
                "Mitochondrial DNA gene MT-ND4 (Mitochondrial NADH Dehydrogenase 4) (MT-ND4)",
                "Mitochondrial DNA gene MT-ND4L (Mitochondrial NADH Dehydrogenase 4L) (MT-ND4L)",
                "Mitochondrial DNA gene MT-ND5 (Mitochondrial NADH Dehydrogenase 5) (MT-ND5)",
                "Mitochondrial DNA gene MT-ND6 (Mitochondrial NADH Dehydrogenase 6) (MT-ND6)",
                "Mitochondrial DNA gene MT-CO1 (Mitochondrial Cytochrome Oxidase 1) (MT-CO1)",
                "Mitochondrial DNA gene MT-CO2 (Mitochondrial Cytochrome Oxidase 2) (MT-CO2)",
                "Mitochondrial DNA gene MT-CO3 (Mitochondrial Cytochrome Oxidase 3) (MT-CO3)",
                "Mitochondrial DNA gene MT-CYB (Mitochondrial Cytochrome B) (MT-CYB)",
                "Mitochondrial DNA gene MT-ATP6 (Mitochondrial ATP Synthase 6) (MT-ATP6)",
                "Mitochondrial DNA gene MT-ATP8 (Mitochondrial ATP Synthase 8) (MT-ATP8)",
                "Mitochondrial DNA gene MT-TW (Mitochondrial T-RNA Tyrosine) (MT-TW)",
                "Mitochondrial DNA gene MT-TV (Mitochondrial T-RNA Valine) (MT-TV)",
                "Mitochondrial DNA gene MT-TH (Mitochondrial T-RNA Histidine) (MT-TH)",
                "Mitochondrial DNA gene MT-TM (Mitochondrial T-RNA Methionine) (MT-TM)",
                "Mitochondrial DNA gene MT-TK2 (Mitochondrial Thymidine Kinase 2) (MT-TK2)",
                "Mitochondrial DNA gene MT-RNR2 (Mitochondrial RNA Ribosomal Protein 2) (MT-RNR2)",
                "Mitochondrial DNA gene MT-RNR3 (Mitochondrial RNA Ribosomal Protein 3) (MT-RNR3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Mitochondrial DNA gene MT-ATP6 (Mitochondrial ATP Synthase 6) (MT-ATP6)",
                "Mitochondrial DNA gene MT-ATP8 (Mitochondrial ATP Synthase 8) (MT-ATP8)",
                "Mitochondrial DNA gene MT-CO1 (Mitochondrial Cytochrome Oxidase 1) (MT-CO1)",
                "Mitochondrial DNA gene MT-CO2 (Mitochondrial Cytochrome Oxidase 2) (MT-CO2)",
                "Mitochondrial DNA gene MT-CO3 (Mitochondrial Cytochrome Oxidase 3) (MT-CO3)",
                "Mitochondrial DNA gene MT-CYB (Mitochondrial Cytochrome B) (MT-CYB)",
                "Mitochondrial DNA gene MT-ND1 (Mitochondrial NADH Dehydrogenase 1) (MT-ND1)",
                "Mitochondrial DNA gene MT-ND2 (Mitochondrial NADH Dehydrogenase 2) (MT-ND2)",
                "Mitochondrial DNA gene MT-ND3 (Mitochondrial NADH Dehydrogenase 3) (MT-ND3)",
                "Mitochondrial DNA gene MT-ND4 (Mitochondrial NADH Dehydrogenase 4) (MT-ND4)",
                "Mitochondrial DNA gene MT-ND4L (Mitochondrial NADH Dehydrogenase 4L) (MT-ND4L)",
                "Mitochondrial DNA gene MT-ND5 (Mitochondrial NADH Dehydrogenase 5) (MT-ND5)",
                "Mitochondrial DNA gene MT-ND6 (Mitochondrial NADH Dehydrogenase 6) (MT-ND6)",
                "Mitochondrial DNA gene MT-RNR1 (Mitochondrial RNA Ribosomal Protein 1) (MT-RNR1)",
                "Mitochondrial DNA gene MT-RNR2 (Mitochondrial RNA Ribosomal Protein 2) (MT-RNR2)",
                "Mitochondrial DNA gene MT-RNR3 (Mitochondrial RNA Ribosomal Protein 3) (MT-RNR3)",
                "Mitochondrial DNA gene MT-TH (Mitochondrial T-RNA Histidine) (MT-TH)",
                "Mitochondrial DNA gene MT-TK (Mitochondrial Thymidine Kinase) (MT-TK)",
                "Mitochondrial DNA gene MT-TK2 (Mitochondrial Thymidine Kinase 2) (MT-TK2)",
                "Mitochondrial DNA gene MT-TL1 (Mitochondrial Transfer RNA Leucine 1) (MT-TL1)",
                "Mitochondrial DNA gene MT-TM (Mitochondrial T-RNA Methionine) (MT-TM)",
                "Mitochondrial DNA gene MT-TV (Mitochondrial T-RNA Valine) (MT-TV)",
                "Mitochondrial DNA gene MT-TW (Mitochondrial T-RNA Tyrosine) (MT-TW)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            "MT-ATP6 (ATP6)",
            "MT-ATP8 (ATP8)",
            "MT-CO1 (CO1)",
            "MT-CO2 (CO2)",
            "MT-CO3 (CO3)",
            "MT-CYB (CYB)",
            "MT-ND1 (ND1)",
            "MT-ND2 (ND2)",
            "MT-ND3 (ND3)",
            "MT-ND4 (ND4)",
            "MT-ND4L (ND4L)",
            "MT-ND5 (ND5)",
            "MT-ND6 (ND6)",
            "MT-RNR1 (12S)",
            "MT-RNR2 (16S)",
            "MT-TA (tRNA-Ala)",
            "MT-TC (tRNA-Cys)",
            "MT-TD (tRNA-Asp)",
            "MT-TE (tRNA-Glu)",
            "MT-TF (tRNA-Phe)",
            "MT-TG (tRNA-Gly)",
            "MT-TH (tRNA-His)",
            "MT-TI (tRNA-Ile)",
            "MT-TK (tRNA-Lys)",
            "MT-TL1 (tRNA-Leu)",
            "MT-TL2 (tRNA-Leu)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "MT-ATP6 (ATP6)",
                "MT-ATP8 (ATP8)",
                "MT-CO1 (CO1)",
                "MT-CO2 (CO2)",
                "MT-CO3 (CO3)",
                "MT-CYB (CYB)",
                "MT-ND1 (ND1)",
                "MT-ND2 (ND2)",
                "MT-ND3 (ND3)",
                "MT-ND4 (ND4)",
                "MT-ND4L (ND4L)",
                "MT-ND5 (ND5)",
                "MT-ND6 (ND6)",
                "MT-RNR1 (12S)",
                "MT-RNR2 (16S)",
                "MT-TA (tRNA-Ala)",
                "MT-TC (tRNA-Cys)",
                "MT-TD (tRNA-Asp)",
                "MT-TE (tRNA-Glu)",
                "MT-TF (tRNA-Phe)",
                "MT-TG (tRNA-Gly)",
                "MT-TH (tRNA-His)",
                "MT-TI (tRNA-Ile)",
                "MT-TK (tRNA-Lys)"
            ],
            "mismatches": [
                "MT-TL1 (tRNA-Leu)",
                "MT-TL2 (tRNA-Leu)"
            ],
            "true_referents": [
                "MT-ATP6 (ATP6)",
                "MT-ATP8 (ATP8)",
                "MT-CO1 (CO1)",
                "MT-CO2 (CO2)",
                "MT-CO3 (CO3)",
                "MT-CYB (CYB)",
                "MT-ND1 (ND1)",
                "MT-ND2 (ND2)",
                "MT-ND3 (ND3)",
                "MT-ND4 (ND4)",
                "MT-ND4L (ND4L)",
                "MT-ND5 (ND5)",
                "MT-ND6 (ND6)",
                "MT-RNR1 (12S)",
                "MT-RNR2 (16S)",
                "MT-TA (tRNA-Ala)",
                "MT-TC (tRNA-Cys)",
                "MT-TD (tRNA-Asp)",
                "MT-TE (tRNA-Glu)",
                "MT-TF (tRNA-Phe)",
                "MT-TG (tRNA-Gly)",
                "MT-TH (tRNA-His)",
                "MT-TI (tRNA-Ile)",
                "MT-TK (tRNA-Lys)"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "mitochondrial DNA encoded protein-coding gene",
        "domain": "biology",
        "response": [
            {
                "Referent": "Gene A",
                "Canonical Name": "Gene A"
            },
            {
                "Referent": "Gene B",
                "Canonical Name": "Gene B"
            },
            {
                "Referent": "Gene C",
                "Canonical Name": "Gene C"
            },
            {
                "Referent": "Gene D",
                "Canonical Name": "Gene D"
            },
            {
                "Referent": "Gene E",
                "Canonical Name": "Gene E"
            },
            {
                "Referent": "Gene F",
                "Canonical Name": "Gene F"
            },
            {
                "Referent": "Gene G",
                "Canonical Name": "Gene G"
            },
            {
                "Referent": "Gene H",
                "Canonical Name": "Gene H"
            },
            {
                "Referent": "Gene I",
                "Canonical Name": "Gene I"
            },
            {
                "Referent": "Gene J",
                "Canonical Name": "Gene J"
            },
            {
                "Referent": "Gene K",
                "Canonical Name": "Gene K"
            },
            {
                "Referent": "Gene L",
                "Canonical Name": "Gene L"
            },
            {
                "Referent": "Gene M",
                "Canonical Name": "Gene M"
            },
            {
                "Referent": "Gene N",
                "Canonical Name": "Gene N"
            },
            {
                "Referent": "Gene O",
                "Canonical Name": "Gene O"
            },
            {
                "Referent": "Gene P",
                "Canonical Name": "Gene P"
            },
            {
                "Referent": "Gene Q",
                "Canonical Name": "Gene Q"
            },
            {
                "Referent": "Gene R",
                "Canonical Name": "Gene R"
            },
            {
                "Referent": "Gene S",
                "Canonical Name": "Gene S"
            },
            {
                "Referent": "Gene T",
                "Canonical Name": "Gene T"
            },
            {
                "Referent": "Gene U",
                "Canonical Name": "Gene U"
            },
            {
                "Referent": "Gene V",
                "Canonical Name": "Gene V"
            },
            {
                "Referent": "Gene W",
                "Canonical Name": "Gene W"
            },
            {
                "Referent": "Gene X",
                "Canonical Name": "Gene X"
            },
            {
                "Referent": "Gene Y",
                "Canonical Name": "Gene Y"
            },
            {
                "Referent": "Gene Z",
                "Canonical Name": "Gene Z"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gene A",
                "Gene B",
                "Gene C",
                "Gene D",
                "Gene E",
                "Gene F",
                "Gene G",
                "Gene H",
                "Gene I",
                "Gene J",
                "Gene K",
                "Gene L",
                "Gene M",
                "Gene N",
                "Gene O",
                "Gene P",
                "Gene Q",
                "Gene R",
                "Gene S",
                "Gene T",
                "Gene U",
                "Gene V",
                "Gene W",
                "Gene X"
            ],
            "mismatches": [
                "Gene Y",
                "Gene Z"
            ],
            "true_referents": [
                "{\"Referent\": \"Gene A\", \"Canonical Name\": \"Gene A\"}",
                "{\"Referent\": \"Gene B\", \"Canonical Name\": \"Gene B\"}",
                "{\"Referent\": \"Gene C\", \"Canonical Name\": \"Gene C\"}",
                "{\"Referent\": \"Gene D\", \"Canonical Name\": \"Gene D\"}",
                "{\"Referent\": \"Gene E\", \"Canonical Name\": \"Gene E\"}",
                "{\"Referent\": \"Gene F\", \"Canonical Name\": \"Gene F\"}",
                "{\"Referent\": \"Gene G\", \"Canonical Name\": \"Gene G\"}",
                "{\"Referent\": \"Gene H\", \"Canonical Name\": \"Gene H\"}",
                "{\"Referent\": \"Gene I\", \"Canonical Name\": \"Gene I\"}",
                "{\"Referent\": \"Gene J\", \"Canonical Name\": \"Gene J\"}",
                "{\"Referent\": \"Gene K\", \"Canonical Name\": \"Gene K\"}",
                "{\"Referent\": \"Gene L\", \"Canonical Name\": \"Gene L\"}",
                "{\"Referent\": \"Gene M\", \"Canonical Name\": \"Gene M\"}",
                "{\"Referent\": \"Gene N\", \"Canonical Name\": \"Gene N\"}",
                "{\"Referent\": \"Gene O\", \"Canonical Name\": \"Gene O\"}",
                "{\"Referent\": \"Gene P\", \"Canonical Name\": \"Gene P\"}",
                "{\"Referent\": \"Gene Q\", \"Canonical Name\": \"Gene Q\"}",
                "{\"Referent\": \"Gene R\", \"Canonical Name\": \"Gene R\"}",
                "{\"Referent\": \"Gene S\", \"Canonical Name\": \"Gene S\"}",
                "{\"Referent\": \"Gene T\", \"Canonical Name\": \"Gene T\"}",
                "{\"Referent\": \"Gene U\", \"Canonical Name\": \"Gene U\"}",
                "{\"Referent\": \"Gene V\", \"Canonical Name\": \"Gene V\"}",
                "{\"Referent\": \"Gene W\", \"Canonical Name\": \"Gene W\"}",
                "{\"Referent\": \"Gene X\", \"Canonical Name\": \"Gene X\"}"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    }
]