[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "Complex I (NADH:ubiquinone oxidoreductase)",
            "Complex II (Succinate dehydrogenase)",
            "Complex III (Ubiquinol-cytochrome c reductase)",
            "Complex IV (Cytochrome c oxidase)",
            "ATP synthase",
            "Voltage-dependent anion channel (VDAC)",
            "Adenine nucleotide translocator (ANT)",
            "Pyruvate dehydrogenase complex",
            "Fumarate hydratase",
            "Malate dehydrogenase",
            "Isocitrate dehydrogenase",
            "Ketoglutarate dehydrogenase",
            "Mitochondrial glycerol-3-phosphate dehydrogenase",
            "Mitochondrial aldehyde dehydrogenase",
            "Mitochondrial acetyl-CoA synthetase",
            "Mitochondrial citrate synthase",
            "Mitochondrial aconitase",
            "Mitochondrial isocitrate dehydrogenase",
            "Mitochondrial malate dehydrogenase",
            "Mitochondrial fumarase",
            "Mitochondrial succinate dehydrogenase",
            "Mitochondrial glutamate dehydrogenase",
            "Mitochondrial malic enzyme"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Complex I (NADH:ubiquinone oxidoreductase)",
                "Complex II (Succinate dehydrogenase)",
                "Complex III (Ubiquinol-cytochrome c reductase)",
                "Complex IV (Cytochrome c oxidase)",
                "ATP synthase",
                "Voltage-dependent anion channel (VDAC)",
                "Adenine nucleotide translocator (ANT)",
                "Pyruvate dehydrogenase complex",
                "Fumarate hydratase",
                "Malate dehydrogenase",
                "Isocitrate dehydrogenase",
                "Ketoglutarate dehydrogenase",
                "Mitochondrial glycerol-3-phosphate dehydrogenase",
                "Mitochondrial aldehyde dehydrogenase",
                "Mitochondrial acetyl-CoA synthetase",
                "Mitochondrial citrate synthase",
                "Mitochondrial aconitase",
                "Mitochondrial isocitrate dehydrogenase",
                "Mitochondrial malate dehydrogenase",
                "Mitochondrial fumarase",
                "Mitochondrial succinate dehydrogenase",
                "Mitochondrial glutamate dehydrogenase",
                "Mitochondrial malic enzyme"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase",
                "Adenine nucleotide translocator (ANT)",
                "Complex I (NADH:ubiquinone oxidoreductase)",
                "Complex II (Succinate dehydrogenase)",
                "Complex III (Ubiquinol-cytochrome c reductase)",
                "Complex IV (Cytochrome c oxidase)",
                "Fumarate hydratase",
                "Isocitrate dehydrogenase",
                "Ketoglutarate dehydrogenase",
                "Malate dehydrogenase",
                "Mitochondrial acetyl-CoA synthetase",
                "Mitochondrial aconitase",
                "Mitochondrial aldehyde dehydrogenase",
                "Mitochondrial citrate synthase",
                "Mitochondrial fumarase",
                "Mitochondrial glutamate dehydrogenase",
                "Mitochondrial glycerol-3-phosphate dehydrogenase",
                "Mitochondrial isocitrate dehydrogenase",
                "Mitochondrial malate dehydrogenase",
                "Mitochondrial malic enzyme",
                "Mitochondrial succinate dehydrogenase",
                "Pyruvate dehydrogenase complex",
                "Voltage-dependent anion channel (VDAC)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP Synthase (Complex V)",
            "Cytochrome c Oxidase (Complex IV)",
            "NADH:Ubiquinone Oxidoreductase (Complex I)",
            "Succinate:Ubiquinone Oxidoreductase (Complex II)",
            "Ubiquinol:Cytochrome c Oxidoreductase (Complex III)",
            "ATP/ADP Translocase (ANT)",
            "Mitochondrial Carrier Family 1 Member 4 (SLC25A4)",
            "Mitochondrial Carrier Family 1 Member 5 (SLC25A5)",
            "Mitochondrial Carrier Family 1 Member 6 (SLC25A6)",
            "Mitochondrial Carrier Family 1 Member 7 (SLC25A7)",
            "Mitochondrial Carrier Family 1 Member 8 (SLC25A8)",
            "Mitochondrial Carrier Family 1 Member 9 (SLC25A9)",
            "Mitochondrial Carrier Family 1 Member 10 (SLC25A10)",
            "Mitochondrial Carrier Family 1 Member 11 (SLC25A11)",
            "Mitochondrial Carrier Family 1 Member 12 (SLC25A12)",
            "Mitochondrial Carrier Family 1 Member 13 (SLC25A13)",
            "Mitochondrial Carrier Family 1 Member 14 (SLC25A14)",
            "Mitochondrial Carrier Family 1 Member 15 (SLC25A15)",
            "Mitochondrial Carrier Family 1 Member 16 (SLC25A16)",
            "Mitochondrial Carrier Family 1 Member 17 (SLC25A17)",
            "Mitochondrial Carrier Family 1 Member 18 (SLC25A18)",
            "Mitochondrial Carrier Family 1 Member 19 (SLC25A19)",
            "Mitochondrial Carrier Family 1 Member 20 (SLC25A20)",
            "Mitochondrial Carrier Family 1 Member 21 (SLC25A21)",
            "Mitochondrial Carrier Family 1 Member 22 (SLC25A22)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP Synthase (Complex V)",
                "Cytochrome c Oxidase (Complex IV)",
                "NADH:Ubiquinone Oxidoreductase (Complex I)",
                "Succinate:Ubiquinone Oxidoreductase (Complex II)",
                "Ubiquinol:Cytochrome c Oxidoreductase (Complex III)",
                "ATP/ADP Translocase (ANT)",
                "Mitochondrial Carrier Family 1 Member 4 (SLC25A4)",
                "Mitochondrial Carrier Family 1 Member 5 (SLC25A5)",
                "Mitochondrial Carrier Family 1 Member 6 (SLC25A6)",
                "Mitochondrial Carrier Family 1 Member 7 (SLC25A7)",
                "Mitochondrial Carrier Family 1 Member 8 (SLC25A8)",
                "Mitochondrial Carrier Family 1 Member 9 (SLC25A9)",
                "Mitochondrial Carrier Family 1 Member 10 (SLC25A10)",
                "Mitochondrial Carrier Family 1 Member 11 (SLC25A11)",
                "Mitochondrial Carrier Family 1 Member 12 (SLC25A12)",
                "Mitochondrial Carrier Family 1 Member 13 (SLC25A13)",
                "Mitochondrial Carrier Family 1 Member 14 (SLC25A14)",
                "Mitochondrial Carrier Family 1 Member 15 (SLC25A15)",
                "Mitochondrial Carrier Family 1 Member 16 (SLC25A16)",
                "Mitochondrial Carrier Family 1 Member 17 (SLC25A17)",
                "Mitochondrial Carrier Family 1 Member 18 (SLC25A18)",
                "Mitochondrial Carrier Family 1 Member 19 (SLC25A19)",
                "Mitochondrial Carrier Family 1 Member 20 (SLC25A20)",
                "Mitochondrial Carrier Family 1 Member 21 (SLC25A21)"
            ],
            "mismatches": [
                "Mitochondrial Carrier Family 1 Member 22 (SLC25A22)"
            ],
            "true_referents": [
                "ATP Synthase (Complex V)",
                "ATP/ADP Translocase (ANT)",
                "Cytochrome c Oxidase (Complex IV)",
                "Mitochondrial Carrier Family 1 Member 10 (SLC25A10)",
                "Mitochondrial Carrier Family 1 Member 11 (SLC25A11)",
                "Mitochondrial Carrier Family 1 Member 12 (SLC25A12)",
                "Mitochondrial Carrier Family 1 Member 13 (SLC25A13)",
                "Mitochondrial Carrier Family 1 Member 14 (SLC25A14)",
                "Mitochondrial Carrier Family 1 Member 15 (SLC25A15)",
                "Mitochondrial Carrier Family 1 Member 16 (SLC25A16)",
                "Mitochondrial Carrier Family 1 Member 17 (SLC25A17)",
                "Mitochondrial Carrier Family 1 Member 18 (SLC25A18)",
                "Mitochondrial Carrier Family 1 Member 19 (SLC25A19)",
                "Mitochondrial Carrier Family 1 Member 20 (SLC25A20)",
                "Mitochondrial Carrier Family 1 Member 21 (SLC25A21)",
                "Mitochondrial Carrier Family 1 Member 4 (SLC25A4)",
                "Mitochondrial Carrier Family 1 Member 5 (SLC25A5)",
                "Mitochondrial Carrier Family 1 Member 6 (SLC25A6)",
                "Mitochondrial Carrier Family 1 Member 7 (SLC25A7)",
                "Mitochondrial Carrier Family 1 Member 8 (SLC25A8)",
                "Mitochondrial Carrier Family 1 Member 9 (SLC25A9)",
                "NADH:Ubiquinone Oxidoreductase (Complex I)",
                "Succinate:Ubiquinone Oxidoreductase (Complex II)",
                "Ubiquinol:Cytochrome c Oxidoreductase (Complex III)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (Complex V)",
            "Complex I (NADH dehydrogenase)",
            "Complex II (Succinate dehydrogenase)",
            "Complex III (Coenzyme Q-cytochrome c reductase)",
            "Complex IV (Cytochrome c oxidase)",
            "Mitochondrial inner membrane protein 1 (MIM1)",
            "Mitochondrial inner membrane protein 2 (MIM2)",
            "Mitochondrial inner membrane protein 3 (MIM3)",
            "Mitochondrial inner membrane protein 4 (MIM4)",
            "Mitochondrial inner membrane protein 5 (MIM5)",
            "Mitochondrial inner membrane protein 6 (MIM6)",
            "Mitochondrial inner membrane protein 7 (MIM7)",
            "Mitochondrial inner membrane protein 8 (MIM8)",
            "Mitochondrial inner membrane protein 9 (MIM9)",
            "Mitochondrial inner membrane protein 10 (MIM10)",
            "Mitochondrial inner membrane protein 11 (MIM11)",
            "Mitochondrial inner membrane protein 12 (MIM12)",
            "Mitochondrial inner membrane protein 13 (MIM13)",
            "Mitochondrial inner membrane protein 14 (MIM14)",
            "Mitochondrial inner membrane protein 15 (MIM15)",
            "Mitochondrial inner membrane protein 16 (MIM16)",
            "Mitochondrial inner membrane protein 17 (MIM17)",
            "Mitochondrial inner membrane protein 18 (MIM18)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (Complex V)",
                "Complex I (NADH dehydrogenase)",
                "Complex II (Succinate dehydrogenase)",
                "Complex III (Coenzyme Q-cytochrome c reductase)",
                "Complex IV (Cytochrome c oxidase)",
                "Mitochondrial inner membrane protein 1 (MIM1)",
                "Mitochondrial inner membrane protein 2 (MIM2)",
                "Mitochondrial inner membrane protein 3 (MIM3)",
                "Mitochondrial inner membrane protein 4 (MIM4)",
                "Mitochondrial inner membrane protein 5 (MIM5)",
                "Mitochondrial inner membrane protein 6 (MIM6)",
                "Mitochondrial inner membrane protein 7 (MIM7)",
                "Mitochondrial inner membrane protein 8 (MIM8)",
                "Mitochondrial inner membrane protein 9 (MIM9)",
                "Mitochondrial inner membrane protein 10 (MIM10)",
                "Mitochondrial inner membrane protein 11 (MIM11)",
                "Mitochondrial inner membrane protein 12 (MIM12)",
                "Mitochondrial inner membrane protein 13 (MIM13)",
                "Mitochondrial inner membrane protein 14 (MIM14)",
                "Mitochondrial inner membrane protein 15 (MIM15)",
                "Mitochondrial inner membrane protein 16 (MIM16)",
                "Mitochondrial inner membrane protein 17 (MIM17)",
                "Mitochondrial inner membrane protein 18 (MIM18)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "Complex I (NADH dehydrogenase)",
                "Complex II (Succinate dehydrogenase)",
                "Complex III (Coenzyme Q-cytochrome c reductase)",
                "Complex IV (Cytochrome c oxidase)",
                "Mitochondrial inner membrane protein 1 (MIM1)",
                "Mitochondrial inner membrane protein 10 (MIM10)",
                "Mitochondrial inner membrane protein 11 (MIM11)",
                "Mitochondrial inner membrane protein 12 (MIM12)",
                "Mitochondrial inner membrane protein 13 (MIM13)",
                "Mitochondrial inner membrane protein 14 (MIM14)",
                "Mitochondrial inner membrane protein 15 (MIM15)",
                "Mitochondrial inner membrane protein 16 (MIM16)",
                "Mitochondrial inner membrane protein 17 (MIM17)",
                "Mitochondrial inner membrane protein 18 (MIM18)",
                "Mitochondrial inner membrane protein 2 (MIM2)",
                "Mitochondrial inner membrane protein 3 (MIM3)",
                "Mitochondrial inner membrane protein 4 (MIM4)",
                "Mitochondrial inner membrane protein 5 (MIM5)",
                "Mitochondrial inner membrane protein 6 (MIM6)",
                "Mitochondrial inner membrane protein 7 (MIM7)",
                "Mitochondrial inner membrane protein 8 (MIM8)",
                "Mitochondrial inner membrane protein 9 (MIM9)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "Complex I (NADH dehydrogenase)",
            "Complex II (Succinate dehydrogenase)",
            "Complex III (Cytochrome bc1 complex)",
            "Complex IV (Cytochrome c oxidase)",
            "Complex V (ATP synthase)",
            "NADH:ubiquinone oxidoreductase",
            "Succinate:ubiquinone oxidoreductase",
            "Ubiquinol-cytochrome c reductase",
            "Cytochrome c oxidase",
            "ATP synthase F0F1",
            "Mitochondrial respiratory chain complex I",
            "Mitochondrial respiratory chain complex II",
            "Mitochondrial respiratory chain complex III",
            "Mitochondrial respiratory chain complex IV",
            "Mitochondrial respiratory chain complex V",
            "NADH dehydrogenase complex",
            "Succinate dehydrogenase complex",
            "Cytochrome bc1 complex",
            "Cytochrome c oxidase complex",
            "ATP synthase complex",
            "Proton-pumping ATPase",
            "F1F0-ATP synthase",
            "Inner mitochondrial membrane protein complex",
            "Electron transport chain complex"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Complex I (NADH dehydrogenase)",
                "Complex II (Succinate dehydrogenase)",
                "Complex III (Cytochrome bc1 complex)",
                "Complex IV (Cytochrome c oxidase)",
                "Complex V (ATP synthase)",
                "NADH:ubiquinone oxidoreductase",
                "Succinate:ubiquinone oxidoreductase",
                "Ubiquinol-cytochrome c reductase",
                "Cytochrome c oxidase",
                "ATP synthase F0F1",
                "Mitochondrial respiratory chain complex I",
                "Mitochondrial respiratory chain complex II",
                "Mitochondrial respiratory chain complex III",
                "Mitochondrial respiratory chain complex IV",
                "Mitochondrial respiratory chain complex V",
                "NADH dehydrogenase complex",
                "Succinate dehydrogenase complex",
                "Cytochrome bc1 complex",
                "Cytochrome c oxidase complex",
                "ATP synthase complex",
                "Proton-pumping ATPase",
                "F1F0-ATP synthase",
                "Inner mitochondrial membrane protein complex",
                "Electron transport chain complex"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase F0F1",
                "ATP synthase complex",
                "Complex I (NADH dehydrogenase)",
                "Complex II (Succinate dehydrogenase)",
                "Complex III (Cytochrome bc1 complex)",
                "Complex IV (Cytochrome c oxidase)",
                "Complex V (ATP synthase)",
                "Cytochrome bc1 complex",
                "Cytochrome c oxidase",
                "Cytochrome c oxidase complex",
                "Electron transport chain complex",
                "F1F0-ATP synthase",
                "Inner mitochondrial membrane protein complex",
                "Mitochondrial respiratory chain complex I",
                "Mitochondrial respiratory chain complex II",
                "Mitochondrial respiratory chain complex III",
                "Mitochondrial respiratory chain complex IV",
                "Mitochondrial respiratory chain complex V",
                "NADH dehydrogenase complex",
                "NADH:ubiquinone oxidoreductase",
                "Proton-pumping ATPase",
                "Succinate dehydrogenase complex",
                "Succinate:ubiquinone oxidoreductase",
                "Ubiquinol-cytochrome c reductase"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "NADH:ubiquinone oxidoreductase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Ubiquinol:cytochrome c oxidoreductase (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "ATP synthase (Complex V)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NADH:ubiquinone oxidoreductase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol:cytochrome c oxidoreductase (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "ATP synthase (Complex V)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "Cytochrome c oxidase (Complex IV)",
                "NADH:ubiquinone oxidoreductase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol:cytochrome c oxidoreductase (Complex III)"
            ],
            "TP": 5,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (ATPS)",
            "NADH dehydrogenase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Cytochrome b-c1 complex (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "NADH:ubiquinone oxidoreductase (Complex I)",
            "Ubiquinol-cytochrome c reductase (Complex III)",
            "Cytochrome c (Cyt c)",
            "F0F1 ATP synthase (F0F1)",
            "Respiratory complex I (RCI)",
            "Respiratory complex II (RCII)",
            "Respiratory complex III (RCIII)",
            "Respiratory complex IV (RCIV)",
            "Mitochondrial ATP synthase (mATPase)",
            "Mitochondrial respiratory chain complex I (MRCI)",
            "Mitochondrial respiratory chain complex II (MRCII)",
            "Mitochondrial respiratory chain complex III (MRCIII)",
            "Mitochondrial respiratory chain complex IV (MRCIV)",
            "NADH-ubiquinone oxidoreductase (NDU)",
            "Succinate-ubiquinone oxidoreductase (SDH)",
            "Ubiquinone-cytochrome c reductase (UQCR)",
            "Cytochrome c oxidase complex (CCO)",
            "Complex I NADH-ubiquinone oxidoreductase (CIN)",
            "Complex II succinate-ubiquinone oxidoreductase (CIIN)",
            "Complex III cytochrome bc1 complex (CIIIN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (ATPS)",
                "NADH dehydrogenase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Cytochrome b-c1 complex (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "NADH:ubiquinone oxidoreductase (Complex I)",
                "Ubiquinol-cytochrome c reductase (Complex III)",
                "Cytochrome c (Cyt c)",
                "F0F1 ATP synthase (F0F1)",
                "Respiratory complex I (RCI)",
                "Respiratory complex II (RCII)",
                "Respiratory complex III (RCIII)",
                "Respiratory complex IV (RCIV)",
                "Mitochondrial ATP synthase (mATPase)",
                "Mitochondrial respiratory chain complex I (MRCI)",
                "Mitochondrial respiratory chain complex II (MRCII)",
                "Mitochondrial respiratory chain complex III (MRCIII)",
                "Mitochondrial respiratory chain complex IV (MRCIV)",
                "NADH-ubiquinone oxidoreductase (NDU)",
                "Succinate-ubiquinone oxidoreductase (SDH)",
                "Ubiquinone-cytochrome c reductase (UQCR)",
                "Cytochrome c oxidase complex (CCO)",
                "Complex I NADH-ubiquinone oxidoreductase (CIN)",
                "Complex II succinate-ubiquinone oxidoreductase (CIIN)"
            ],
            "mismatches": [
                "Complex III cytochrome bc1 complex (CIIIN)"
            ],
            "true_referents": [
                "ATP synthase (ATPS)",
                "Complex I NADH-ubiquinone oxidoreductase (CIN)",
                "Complex II succinate-ubiquinone oxidoreductase (CIIN)",
                "Cytochrome b-c1 complex (Complex III)",
                "Cytochrome c (Cyt c)",
                "Cytochrome c oxidase (Complex IV)",
                "Cytochrome c oxidase complex (CCO)",
                "F0F1 ATP synthase (F0F1)",
                "Mitochondrial ATP synthase (mATPase)",
                "Mitochondrial respiratory chain complex I (MRCI)",
                "Mitochondrial respiratory chain complex II (MRCII)",
                "Mitochondrial respiratory chain complex III (MRCIII)",
                "Mitochondrial respiratory chain complex IV (MRCIV)",
                "NADH dehydrogenase (Complex I)",
                "NADH-ubiquinone oxidoreductase (NDU)",
                "NADH:ubiquinone oxidoreductase (Complex I)",
                "Respiratory complex I (RCI)",
                "Respiratory complex II (RCII)",
                "Respiratory complex III (RCIII)",
                "Respiratory complex IV (RCIV)",
                "Succinate dehydrogenase (Complex II)",
                "Succinate-ubiquinone oxidoreductase (SDH)",
                "Ubiquinol-cytochrome c reductase (Complex III)",
                "Ubiquinone-cytochrome c reductase (UQCR)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "NADH dehydrogenase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Ubiquinol-cytochrome c reductase (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "ATP synthase (Complex V)",
            "Adenine nucleotide translocase (ANT)",
            "Phosphate carrier (PiC)",
            "Uncoupling protein 1 (UCP1)",
            "Uncoupling protein 2 (UCP2)",
            "Uncoupling protein 3 (UCP3)",
            "Uncoupling protein 4 (UCP4)",
            "Uncoupling protein 5 (UCP5)",
            "Mitochondrial carrier homolog 2 (MTCH2)",
            "Mitochondrial carrier homolog 1 (MTCH1)",
            "Mitochondrial phosphate carrier protein (SLC25A3)",
            "Mitochondrial dicarboxylate carrier (SLC25A10)",
            "Mitochondrial 2-oxoglutarate/malate carrier protein (SLC25A11)",
            "Mitochondrial glutamate carrier 1 (SLC25A22)",
            "Mitochondrial glutamate carrier 2 (SLC25A18)",
            "Mitochondrial aspartate/glutamate carrier 1 (SLC25A12)",
            "Mitochondrial aspartate/glutamate carrier 2 (SLC25A13)",
            "Mitochondrial ADP/ATP carrier protein 1 (SLC25A4)",
            "Mitochondrial ADP/ATP carrier protein 2 (SLC25A5)",
            "Mitochondrial ADP/ATP carrier protein 3 (SLC25A6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NADH dehydrogenase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol-cytochrome c reductase (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "ATP synthase (Complex V)",
                "Adenine nucleotide translocase (ANT)",
                "Phosphate carrier (PiC)",
                "Uncoupling protein 1 (UCP1)",
                "Uncoupling protein 2 (UCP2)",
                "Uncoupling protein 3 (UCP3)",
                "Uncoupling protein 4 (UCP4)",
                "Uncoupling protein 5 (UCP5)",
                "Mitochondrial carrier homolog 2 (MTCH2)",
                "Mitochondrial carrier homolog 1 (MTCH1)",
                "Mitochondrial phosphate carrier protein (SLC25A3)",
                "Mitochondrial dicarboxylate carrier (SLC25A10)",
                "Mitochondrial 2-oxoglutarate/malate carrier protein (SLC25A11)",
                "Mitochondrial glutamate carrier 1 (SLC25A22)",
                "Mitochondrial glutamate carrier 2 (SLC25A18)",
                "Mitochondrial aspartate/glutamate carrier 1 (SLC25A12)",
                "Mitochondrial aspartate/glutamate carrier 2 (SLC25A13)",
                "Mitochondrial ADP/ATP carrier protein 1 (SLC25A4)",
                "Mitochondrial ADP/ATP carrier protein 2 (SLC25A5)",
                "Mitochondrial ADP/ATP carrier protein 3 (SLC25A6)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "Adenine nucleotide translocase (ANT)",
                "Cytochrome c oxidase (Complex IV)",
                "Mitochondrial 2-oxoglutarate/malate carrier protein (SLC25A11)",
                "Mitochondrial ADP/ATP carrier protein 1 (SLC25A4)",
                "Mitochondrial ADP/ATP carrier protein 2 (SLC25A5)",
                "Mitochondrial ADP/ATP carrier protein 3 (SLC25A6)",
                "Mitochondrial aspartate/glutamate carrier 1 (SLC25A12)",
                "Mitochondrial aspartate/glutamate carrier 2 (SLC25A13)",
                "Mitochondrial carrier homolog 1 (MTCH1)",
                "Mitochondrial carrier homolog 2 (MTCH2)",
                "Mitochondrial dicarboxylate carrier (SLC25A10)",
                "Mitochondrial glutamate carrier 1 (SLC25A22)",
                "Mitochondrial glutamate carrier 2 (SLC25A18)",
                "Mitochondrial phosphate carrier protein (SLC25A3)",
                "NADH dehydrogenase (Complex I)",
                "Phosphate carrier (PiC)",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol-cytochrome c reductase (Complex III)",
                "Uncoupling protein 1 (UCP1)",
                "Uncoupling protein 2 (UCP2)",
                "Uncoupling protein 3 (UCP3)",
                "Uncoupling protein 4 (UCP4)",
                "Uncoupling protein 5 (UCP5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (ATPase)",
            "Cytochrome c oxidase (COX)",
            "NADH dehydrogenase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Ubiquinol-cytochrome c reductase (Complex III)",
            "ATP synthase (Complex V)",
            "Cytochrome bc1 complex",
            "Adenine nucleotide translocase (ANT)",
            "Mitochondrial electron transport chain",
            "Electron transport chain complex",
            "Respiratory chain",
            "Mitochondrial ATPase",
            "Complex IV",
            "Complex I",
            "Complex II",
            "Complex III",
            "Complex V",
            "Complexes of oxidative phosphorylation",
            "Proton pump",
            "Oxidative phosphorylation complexes",
            "Mitochondrial protein complexes",
            "Mitochondrial respiratory chain",
            "Mitochondrial ATP synthase",
            "Mitochondrial electron transport system"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (ATPase)",
                "Cytochrome c oxidase (COX)",
                "NADH dehydrogenase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol-cytochrome c reductase (Complex III)",
                "ATP synthase (Complex V)",
                "Cytochrome bc1 complex",
                "Adenine nucleotide translocase (ANT)",
                "Mitochondrial electron transport chain",
                "Electron transport chain complex",
                "Respiratory chain",
                "Mitochondrial ATPase",
                "Complex IV",
                "Complex I",
                "Complex II",
                "Complex III",
                "Complex V",
                "Complexes of oxidative phosphorylation",
                "Proton pump",
                "Oxidative phosphorylation complexes",
                "Mitochondrial protein complexes",
                "Mitochondrial respiratory chain",
                "Mitochondrial ATP synthase",
                "Mitochondrial electron transport system"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (ATPase)",
                "ATP synthase (Complex V)",
                "Adenine nucleotide translocase (ANT)",
                "Complex I",
                "Complex II",
                "Complex III",
                "Complex IV",
                "Complex V",
                "Complexes of oxidative phosphorylation",
                "Cytochrome bc1 complex",
                "Cytochrome c oxidase (COX)",
                "Electron transport chain complex",
                "Mitochondrial ATP synthase",
                "Mitochondrial ATPase",
                "Mitochondrial electron transport chain",
                "Mitochondrial electron transport system",
                "Mitochondrial protein complexes",
                "Mitochondrial respiratory chain",
                "NADH dehydrogenase (Complex I)",
                "Oxidative phosphorylation complexes",
                "Proton pump",
                "Respiratory chain",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol-cytochrome c reductase (Complex III)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "NADH:ubiquinone oxidoreductase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Ubiquinol-cytochrome c oxidoreductase (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "ATP synthase (Complex V)",
            "Respirasome (Supercomplex I+III+IV)",
            "Supercomplex I+III",
            "Supercomplex III+IV",
            "Supercomplex I+III\u2082",
            "Supercomplex II+III",
            "Mitochondrial ATP synthase dimer",
            "Mitochondrial ATP synthase monomer",
            "Mitochondrial respiratory supercomplex II+III+IV",
            "Mitochondrial Complex I subcomplex",
            "Mitochondrial Complex III dimer",
            "Mitochondrial Complex IV tetramer",
            "Mitochondrial supercomplex assembly factor",
            "Mitochondrial cytochrome bc\u2081 complex",
            "Mitochondrial iron-sulfur protein complex",
            "Mitochondrial ubiquinone-binding complex",
            "Mitochondrial cytochrome c complex",
            "Mitochondrial Rieske protein complex",
            "Mitochondrial COX7A2 complex",
            "Mitochondrial COX4I1 complex"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NADH:ubiquinone oxidoreductase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Ubiquinol-cytochrome c oxidoreductase (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "ATP synthase (Complex V)",
                "Respirasome (Supercomplex I+III+IV)",
                "Supercomplex I+III",
                "Supercomplex III+IV",
                "Supercomplex I+III\u2082",
                "Supercomplex II+III",
                "Mitochondrial ATP synthase dimer",
                "Mitochondrial ATP synthase monomer",
                "Mitochondrial respiratory supercomplex II+III+IV",
                "Mitochondrial Complex I subcomplex",
                "Mitochondrial Complex III dimer",
                "Mitochondrial Complex IV tetramer",
                "Mitochondrial supercomplex assembly factor",
                "Mitochondrial cytochrome bc\u2081 complex",
                "Mitochondrial iron-sulfur protein complex",
                "Mitochondrial ubiquinone-binding complex",
                "Mitochondrial cytochrome c complex",
                "Mitochondrial Rieske protein complex",
                "Mitochondrial COX7A2 complex",
                "Mitochondrial COX4I1 complex"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "Cytochrome c oxidase (Complex IV)",
                "Mitochondrial ATP synthase dimer",
                "Mitochondrial ATP synthase monomer",
                "Mitochondrial COX4I1 complex",
                "Mitochondrial COX7A2 complex",
                "Mitochondrial Complex I subcomplex",
                "Mitochondrial Complex III dimer",
                "Mitochondrial Complex IV tetramer",
                "Mitochondrial Rieske protein complex",
                "Mitochondrial cytochrome bc\u2081 complex",
                "Mitochondrial cytochrome c complex",
                "Mitochondrial iron-sulfur protein complex",
                "Mitochondrial respiratory supercomplex II+III+IV",
                "Mitochondrial supercomplex assembly factor",
                "Mitochondrial ubiquinone-binding complex",
                "NADH:ubiquinone oxidoreductase (Complex I)",
                "Respirasome (Supercomplex I+III+IV)",
                "Succinate dehydrogenase (Complex II)",
                "Supercomplex I+III",
                "Supercomplex I+III\u2082",
                "Supercomplex II+III",
                "Supercomplex III+IV",
                "Ubiquinol-cytochrome c oxidoreductase (Complex III)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (Complex V)",
            "F1F0-ATPase",
            "H+-ATPase",
            "Mitochondrial ATPase",
            "FOF1 ATP synthase",
            "Respiratory chain complex V",
            "Mitochondrial ATP synthetase",
            "Proton-translocating ATPase",
            "Mitochondrial F1F0-ATPase",
            "Electron transport chain complex V",
            "Mitochondrial H+-ATPase",
            "F-type ATPase",
            "F-ATPase",
            "ETC complex V",
            "OXPHOS complex V",
            "Mitochondrial proton pump",
            "ATP synthase F0F1",
            "Mitochondrial F-type ATP synthase",
            "Rotary ATP synthase",
            "Mitochondrial rotary ATPase",
            "F-type rotary ATPase",
            "Inner mitochondrial membrane ATPase",
            "Proton-motive force-driven ATP synthase",
            "Chemiosmotic ATP synthase"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (Complex V)",
                "F1F0-ATPase",
                "H+-ATPase",
                "Mitochondrial ATPase",
                "FOF1 ATP synthase",
                "Respiratory chain complex V",
                "Mitochondrial ATP synthetase",
                "Proton-translocating ATPase",
                "Mitochondrial F1F0-ATPase",
                "Electron transport chain complex V",
                "Mitochondrial H+-ATPase",
                "F-type ATPase",
                "F-ATPase",
                "ETC complex V",
                "OXPHOS complex V",
                "Mitochondrial proton pump",
                "ATP synthase F0F1",
                "Mitochondrial F-type ATP synthase",
                "Rotary ATP synthase",
                "Mitochondrial rotary ATPase",
                "F-type rotary ATPase",
                "Inner mitochondrial membrane ATPase",
                "Proton-motive force-driven ATP synthase",
                "Chemiosmotic ATP synthase"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "ATP synthase F0F1",
                "Chemiosmotic ATP synthase",
                "ETC complex V",
                "Electron transport chain complex V",
                "F-ATPase",
                "F-type ATPase",
                "F-type rotary ATPase",
                "F1F0-ATPase",
                "FOF1 ATP synthase",
                "H+-ATPase",
                "Inner mitochondrial membrane ATPase",
                "Mitochondrial ATP synthetase",
                "Mitochondrial ATPase",
                "Mitochondrial F-type ATP synthase",
                "Mitochondrial F1F0-ATPase",
                "Mitochondrial H+-ATPase",
                "Mitochondrial proton pump",
                "Mitochondrial rotary ATPase",
                "OXPHOS complex V",
                "Proton-motive force-driven ATP synthase",
                "Proton-translocating ATPase",
                "Respiratory chain complex V",
                "Rotary ATP synthase"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (Complex V)",
            "NADH dehydrogenase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Coenzyme Q10 - cytochrome c reductase (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "Electron-transferring flavoprotein dehydrogenase (ETFDH)",
            "Electron transfer flavoprotein-ubiquinone oxidoreductase (ETF-QO)",
            "Glycerol-3-phosphate dehydrogenase (GPD2)",
            "Dihydroorotate dehydrogenase (DHODH)",
            "Choline dehydrogenase (CHDH)",
            "Sulfide:quinone oxidoreductase (SQOR)",
            "Proline dehydrogenase (PRODH)",
            "Electron transfer flavoprotein (ETF)",
            "Sarcosine dehydrogenase (SARDH)",
            "Dimethylglycine dehydrogenase (DMGDH)",
            "Hydroxyacyl-CoA dehydrogenase (HADH)",
            "Electron-transferring-flavoprotein dehydrogenase (ETFDH)",
            "Dihydrolipoamide dehydrogenase (DLD)",
            "Branched-chain alpha-keto acid dehydrogenase complex (BCKDC)",
            "Pyruvate dehydrogenase complex (PDC)",
            "Alpha-ketoglutarate dehydrogenase complex (KGDC)",
            "Malate dehydrogenase (MDH2)",
            "Isocitrate dehydrogenase (IDH2)",
            "Glycerol-3-phosphate dehydrogenase 2 (GPD2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (Complex V)",
                "NADH dehydrogenase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Coenzyme Q10 - cytochrome c reductase (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "Electron-transferring flavoprotein dehydrogenase (ETFDH)",
                "Electron transfer flavoprotein-ubiquinone oxidoreductase (ETF-QO)",
                "Glycerol-3-phosphate dehydrogenase (GPD2)",
                "Dihydroorotate dehydrogenase (DHODH)",
                "Choline dehydrogenase (CHDH)",
                "Sulfide:quinone oxidoreductase (SQOR)",
                "Proline dehydrogenase (PRODH)",
                "Electron transfer flavoprotein (ETF)",
                "Sarcosine dehydrogenase (SARDH)",
                "Dimethylglycine dehydrogenase (DMGDH)",
                "Hydroxyacyl-CoA dehydrogenase (HADH)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Branched-chain alpha-keto acid dehydrogenase complex (BCKDC)",
                "Pyruvate dehydrogenase complex (PDC)",
                "Alpha-ketoglutarate dehydrogenase complex (KGDC)",
                "Malate dehydrogenase (MDH2)",
                "Isocitrate dehydrogenase (IDH2)",
                "Glycerol-3-phosphate dehydrogenase 2 (GPD2)"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "Alpha-ketoglutarate dehydrogenase complex (KGDC)",
                "Branched-chain alpha-keto acid dehydrogenase complex (BCKDC)",
                "Choline dehydrogenase (CHDH)",
                "Coenzyme Q10 - cytochrome c reductase (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Dihydroorotate dehydrogenase (DHODH)",
                "Dimethylglycine dehydrogenase (DMGDH)",
                "Electron transfer flavoprotein (ETF)",
                "Electron transfer flavoprotein-ubiquinone oxidoreductase (ETF-QO)",
                "Electron-transferring flavoprotein dehydrogenase (ETFDH)",
                "Electron-transferring-flavoprotein dehydrogenase (ETFDH)",
                "Glycerol-3-phosphate dehydrogenase (GPD2)",
                "Glycerol-3-phosphate dehydrogenase 2 (GPD2)",
                "Hydroxyacyl-CoA dehydrogenase (HADH)",
                "Isocitrate dehydrogenase (IDH2)",
                "Malate dehydrogenase (MDH2)",
                "NADH dehydrogenase (Complex I)",
                "Proline dehydrogenase (PRODH)",
                "Pyruvate dehydrogenase complex (PDC)",
                "Sarcosine dehydrogenase (SARDH)",
                "Succinate dehydrogenase (Complex II)",
                "Sulfide:quinone oxidoreductase (SQOR)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "NADH dehydrogenase (Complex I)",
            "Succinate dehydrogenase (Complex II)",
            "Cytochrome bc1 complex (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "ATP synthase (Complex V)",
            "Ubiquinol-cytochrome c reductase",
            "Cytochrome c reductase",
            "Cytochrome c1",
            "Rieske iron-sulfur protein",
            "Cytochrome b",
            "Ubiquinone-binding protein",
            "Ubiquinol oxidase",
            "Succinate-coenzyme Q reductase",
            "Fumarate reductase",
            "Quinol oxidase",
            "Cytochrome aa3",
            "Cytochrome bo3",
            "Cytochrome bd",
            "Cytochrome o",
            "Cytochrome c peroxidase",
            "Cytochrome c nitrite reductase",
            "Cytochrome c553",
            "Cytochrome c552",
            "Cytochrome c551"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NADH dehydrogenase (Complex I)",
                "Succinate dehydrogenase (Complex II)",
                "Cytochrome bc1 complex (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "ATP synthase (Complex V)",
                "Ubiquinol-cytochrome c reductase",
                "Cytochrome c reductase",
                "Cytochrome c1",
                "Rieske iron-sulfur protein",
                "Cytochrome b",
                "Ubiquinone-binding protein",
                "Ubiquinol oxidase",
                "Succinate-coenzyme Q reductase",
                "Fumarate reductase",
                "Quinol oxidase",
                "Cytochrome aa3",
                "Cytochrome bo3",
                "Cytochrome bd",
                "Cytochrome o",
                "Cytochrome c peroxidase",
                "Cytochrome c nitrite reductase",
                "Cytochrome c553",
                "Cytochrome c552",
                "Cytochrome c551"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (Complex V)",
                "Cytochrome aa3",
                "Cytochrome b",
                "Cytochrome bc1 complex (Complex III)",
                "Cytochrome bd",
                "Cytochrome bo3",
                "Cytochrome c nitrite reductase",
                "Cytochrome c oxidase (Complex IV)",
                "Cytochrome c peroxidase",
                "Cytochrome c reductase",
                "Cytochrome c1",
                "Cytochrome c551",
                "Cytochrome c552",
                "Cytochrome c553",
                "Cytochrome o",
                "Fumarate reductase",
                "NADH dehydrogenase (Complex I)",
                "Quinol oxidase",
                "Rieske iron-sulfur protein",
                "Succinate dehydrogenase (Complex II)",
                "Succinate-coenzyme Q reductase",
                "Ubiquinol oxidase",
                "Ubiquinol-cytochrome c reductase",
                "Ubiquinone-binding protein"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (ATP)",
            "Complex V (CV)",
            "F1F0-ATP synthase",
            "Mitochondrial ATP synthase",
            "Mitochondrial F1F0-ATP synthase",
            "Oxidative phosphorylation complex V",
            "Respiratory complex V",
            "Rotary ATPase",
            "Rotary ATP synthase",
            "Mitochondrial proton-translocating ATPase",
            "Mitochondrial H+-transporting ATP synthase",
            "Mitochondrial H+-transporting two-sector ATPase",
            "Mitochondrial membrane ATP synthase",
            "Mitochondrial membrane ATPase",
            "Mitochondrial membrane ATP synthase complex",
            "Mitochondrial membrane ATP synthase enzyme complex",
            "Mitochondrial membrane ATP synthase protein complex",
            "Mitochondrial membrane ATP synthase subunit complex",
            "Mitochondrial membrane ATP synthase holoenzyme",
            "Mitochondrial membrane ATP synthase holoenzyme complex",
            "Mitochondrial membrane ATP synthase multisubunit complex",
            "Mitochondrial membrane ATP synthase oligomeric complex",
            "Mitochondrial membrane ATP synthase oligomeric holoenzyme",
            "Mitochondrial membrane ATP synthase oligomeric protein complex"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (ATP)",
                "Complex V (CV)",
                "F1F0-ATP synthase",
                "Mitochondrial ATP synthase",
                "Mitochondrial F1F0-ATP synthase",
                "Oxidative phosphorylation complex V",
                "Respiratory complex V",
                "Rotary ATPase",
                "Rotary ATP synthase",
                "Mitochondrial proton-translocating ATPase",
                "Mitochondrial H+-transporting ATP synthase",
                "Mitochondrial H+-transporting two-sector ATPase",
                "Mitochondrial membrane ATP synthase",
                "Mitochondrial membrane ATPase",
                "Mitochondrial membrane ATP synthase complex",
                "Mitochondrial membrane ATP synthase enzyme complex",
                "Mitochondrial membrane ATP synthase protein complex",
                "Mitochondrial membrane ATP synthase subunit complex",
                "Mitochondrial membrane ATP synthase holoenzyme",
                "Mitochondrial membrane ATP synthase holoenzyme complex",
                "Mitochondrial membrane ATP synthase multisubunit complex",
                "Mitochondrial membrane ATP synthase oligomeric complex",
                "Mitochondrial membrane ATP synthase oligomeric holoenzyme",
                "Mitochondrial membrane ATP synthase oligomeric protein complex"
            ],
            "mismatches": [],
            "true_referents": [
                "ATP synthase (ATP)",
                "Complex V (CV)",
                "F1F0-ATP synthase",
                "Mitochondrial ATP synthase",
                "Mitochondrial F1F0-ATP synthase",
                "Mitochondrial H+-transporting ATP synthase",
                "Mitochondrial H+-transporting two-sector ATPase",
                "Mitochondrial membrane ATP synthase",
                "Mitochondrial membrane ATP synthase complex",
                "Mitochondrial membrane ATP synthase enzyme complex",
                "Mitochondrial membrane ATP synthase holoenzyme",
                "Mitochondrial membrane ATP synthase holoenzyme complex",
                "Mitochondrial membrane ATP synthase multisubunit complex",
                "Mitochondrial membrane ATP synthase oligomeric complex",
                "Mitochondrial membrane ATP synthase oligomeric holoenzyme",
                "Mitochondrial membrane ATP synthase oligomeric protein complex",
                "Mitochondrial membrane ATP synthase protein complex",
                "Mitochondrial membrane ATP synthase subunit complex",
                "Mitochondrial membrane ATPase",
                "Mitochondrial proton-translocating ATPase",
                "Oxidative phosphorylation complex V",
                "Respiratory complex V",
                "Rotary ATP synthase",
                "Rotary ATPase"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "ATP synthase (Complex V)",
            "F1F0 ATP synthase",
            "Mitochondrial ATP synthase",
            "ATPase",
            "Proton-translocating ATPase",
            "Mitochondrial proton-translocating ATPase",
            "F1-ATPase",
            "F0-ATPase",
            "ATP synthase complex",
            "Mitochondrial inner membrane ATP synthase",
            "Complex V of the electron transport chain",
            "Mitochondrial electron transport chain",
            "Oxidative phosphorylation complex",
            "Mitochondrial oxidative phosphorylation complex",
            "ATP generating complex",
            "Mitochondrial ATP generating complex",
            "Proton pumping ATPase",
            "Mitochondrial proton pumping ATPase",
            "Mitochondrial electron transport chain complex",
            "Mitochondrial ATP synthase enzyme",
            "Mitochondrial inner membrane enzyme",
            "Mitochondrial oxidative phosphorylation enzyme",
            "Mitochondrial electron transport chain enzyme",
            "Mitochondrial ATP generating enzyme",
            "Mitochondrial proton pumping enzyme"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase (Complex V)",
                "F1F0 ATP synthase",
                "Mitochondrial ATP synthase",
                "ATPase",
                "Proton-translocating ATPase",
                "Mitochondrial proton-translocating ATPase",
                "F1-ATPase",
                "F0-ATPase",
                "ATP synthase complex",
                "Mitochondrial inner membrane ATP synthase",
                "Complex V of the electron transport chain",
                "Mitochondrial electron transport chain",
                "Oxidative phosphorylation complex",
                "Mitochondrial oxidative phosphorylation complex",
                "ATP generating complex",
                "Mitochondrial ATP generating complex",
                "Proton pumping ATPase",
                "Mitochondrial proton pumping ATPase",
                "Mitochondrial electron transport chain complex",
                "Mitochondrial ATP synthase enzyme",
                "Mitochondrial inner membrane enzyme",
                "Mitochondrial oxidative phosphorylation enzyme",
                "Mitochondrial electron transport chain enzyme",
                "Mitochondrial ATP generating enzyme"
            ],
            "mismatches": [
                "Mitochondrial proton pumping enzyme"
            ],
            "true_referents": [
                "ATP generating complex",
                "ATP synthase (Complex V)",
                "ATP synthase complex",
                "ATPase",
                "Complex V of the electron transport chain",
                "F0-ATPase",
                "F1-ATPase",
                "F1F0 ATP synthase",
                "Mitochondrial ATP generating complex",
                "Mitochondrial ATP generating enzyme",
                "Mitochondrial ATP synthase",
                "Mitochondrial ATP synthase enzyme",
                "Mitochondrial electron transport chain",
                "Mitochondrial electron transport chain complex",
                "Mitochondrial electron transport chain enzyme",
                "Mitochondrial inner membrane ATP synthase",
                "Mitochondrial inner membrane enzyme",
                "Mitochondrial oxidative phosphorylation complex",
                "Mitochondrial oxidative phosphorylation enzyme",
                "Mitochondrial proton pumping ATPase",
                "Mitochondrial proton-translocating ATPase",
                "Oxidative phosphorylation complex",
                "Proton pumping ATPase",
                "Proton-translocating ATPase"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            "NADH dehydrogenase (Complex I)",
            "Cytochrome b-c1 complex (Complex III)",
            "Cytochrome c oxidase (Complex IV)",
            "Coenzyme Q - cytochrome c reductase",
            "F1F0-ATP synthase (Complex V)",
            "Succinate dehydrogenase (Complex II)",
            "Flavoprotein subcomplex",
            "Iron-sulfur subcomplex",
            "Hydrogenase subcomplex",
            "Proton-translocating NADH dehydrogenase",
            "Cytochrome b6f complex",
            "Rieske iron-sulfur protein subcomplex",
            "Cytochrome c1 subcomplex",
            "Q-cytochrome c oxidoreductase subcomplex",
            "Cytochrome a-a3 subcomplex",
            "CuA subcomplex",
            "CuB subcomplex",
            "Cytochrome a subcomplex",
            "Cytochrome c oxidase subcomplex",
            "Proton-translocating cytochrome c oxidase subcomplex",
            "Cytochrome c reductase subcomplex",
            "Cytochrome b subcomplex",
            "Cytochrome c1-cu subcomplex"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "NADH dehydrogenase (Complex I)",
                "Cytochrome b-c1 complex (Complex III)",
                "Cytochrome c oxidase (Complex IV)",
                "Coenzyme Q - cytochrome c reductase",
                "F1F0-ATP synthase (Complex V)",
                "Succinate dehydrogenase (Complex II)",
                "Flavoprotein subcomplex",
                "Iron-sulfur subcomplex",
                "Hydrogenase subcomplex",
                "Proton-translocating NADH dehydrogenase",
                "Cytochrome b6f complex",
                "Rieske iron-sulfur protein subcomplex",
                "Cytochrome c1 subcomplex",
                "Q-cytochrome c oxidoreductase subcomplex",
                "Cytochrome a-a3 subcomplex",
                "CuA subcomplex",
                "CuB subcomplex",
                "Cytochrome a subcomplex",
                "Cytochrome c oxidase subcomplex",
                "Proton-translocating cytochrome c oxidase subcomplex",
                "Cytochrome c reductase subcomplex",
                "Cytochrome b subcomplex",
                "Cytochrome c1-cu subcomplex"
            ],
            "mismatches": [],
            "true_referents": [
                "Coenzyme Q - cytochrome c reductase",
                "CuA subcomplex",
                "CuB subcomplex",
                "Cytochrome a subcomplex",
                "Cytochrome a-a3 subcomplex",
                "Cytochrome b subcomplex",
                "Cytochrome b-c1 complex (Complex III)",
                "Cytochrome b6f complex",
                "Cytochrome c oxidase (Complex IV)",
                "Cytochrome c oxidase subcomplex",
                "Cytochrome c reductase subcomplex",
                "Cytochrome c1 subcomplex",
                "Cytochrome c1-cu subcomplex",
                "F1F0-ATP synthase (Complex V)",
                "Flavoprotein subcomplex",
                "Hydrogenase subcomplex",
                "Iron-sulfur subcomplex",
                "NADH dehydrogenase (Complex I)",
                "Proton-translocating NADH dehydrogenase",
                "Proton-translocating cytochrome c oxidase subcomplex",
                "Q-cytochrome c oxidoreductase subcomplex",
                "Rieske iron-sulfur protein subcomplex",
                "Succinate dehydrogenase (Complex II)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "electron transport chain protein complex",
        "domain": "biology",
        "response": [
            [
                "Referent",
                "ATP synthase"
            ],
            [
                "Referent",
                "ATP synthase complex"
            ],
            [
                "Referent",
                "ATP synthase complex (F1-F0 complex)"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "ATP synthase",
                "ATP synthase complex",
                "ATP synthase complex (F1-F0 complex)"
            ],
            "mismatches": [],
            "true_referents": [
                "[\"Referent\", \"ATP synthase complex (F1-F0 complex)\"]",
                "[\"Referent\", \"ATP synthase complex\"]",
                "[\"Referent\", \"ATP synthase\"]"
            ],
            "TP": 3,
            "FP": 0,
            "FN": 0
        }
    }
]