[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Aconitase (ACO)",
            "Citrate synthase (CS)",
            "Isocitrate dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate dehydrogenase complex (KGD)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FH)",
            "Malate dehydrogenase (MDH)",
            "Mitochondrial citrate carrier (CIC)",
            "Mitochondrial glycerol-3-phosphate dehydrogenase (G3PDH)",
            "Mitochondrial malate dehydrogenase (MDH2)",
            "Mitochondrial NADP-dependent isocitrate dehydrogenase (IDH2)",
            "Mitochondrial succinate dehydrogenase complex (SDHC)",
            "Mitochondrial succinate-CoA ligase (SCL)",
            "Mitochondrial \u03b1-ketoglutarate dehydrogenase complex (KGD2)",
            "Mitochondrial isocitrate dehydrogenase 1 (IDH1)",
            "Mitochondrial isocitrate dehydrogenase 2 (IDH2)",
            "Mitochondrial citrate synthase (CS)",
            "Mitochondrial aconitase 1 (ACO1)",
            "Mitochondrial aconitase 2 (ACO2)",
            "Mitochondrial succinyl-CoA synthetase alpha subunit (SUCS2)",
            "Mitochondrial succinyl-CoA synthetase beta subunit (SUCS1)",
            "Mitochondrial fumarase (FH)",
            "Mitochondrial malate dehydrogenase (MDH2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aconitase (ACO)",
                "Citrate synthase (CS)",
                "Isocitrate dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate dehydrogenase complex (KGD)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FH)",
                "Malate dehydrogenase (MDH)",
                "Mitochondrial citrate carrier (CIC)",
                "Mitochondrial glycerol-3-phosphate dehydrogenase (G3PDH)",
                "Mitochondrial malate dehydrogenase (MDH2)",
                "Mitochondrial NADP-dependent isocitrate dehydrogenase (IDH2)",
                "Mitochondrial succinate dehydrogenase complex (SDHC)",
                "Mitochondrial succinate-CoA ligase (SCL)",
                "Mitochondrial \u03b1-ketoglutarate dehydrogenase complex (KGD2)",
                "Mitochondrial isocitrate dehydrogenase 1 (IDH1)",
                "Mitochondrial isocitrate dehydrogenase 2 (IDH2)",
                "Mitochondrial citrate synthase (CS)",
                "Mitochondrial aconitase 1 (ACO1)",
                "Mitochondrial aconitase 2 (ACO2)",
                "Mitochondrial succinyl-CoA synthetase alpha subunit (SUCS2)",
                "Mitochondrial succinyl-CoA synthetase beta subunit (SUCS1)",
                "Mitochondrial fumarase (FH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aconitase (ACO)",
                "Citrate synthase (CS)",
                "Fumarase (FH)",
                "Isocitrate dehydrogenase (IDH)",
                "Malate dehydrogenase (MDH)",
                "Mitochondrial NADP-dependent isocitrate dehydrogenase (IDH2)",
                "Mitochondrial aconitase 1 (ACO1)",
                "Mitochondrial aconitase 2 (ACO2)",
                "Mitochondrial citrate carrier (CIC)",
                "Mitochondrial citrate synthase (CS)",
                "Mitochondrial fumarase (FH)",
                "Mitochondrial glycerol-3-phosphate dehydrogenase (G3PDH)",
                "Mitochondrial isocitrate dehydrogenase 1 (IDH1)",
                "Mitochondrial isocitrate dehydrogenase 2 (IDH2)",
                "Mitochondrial malate dehydrogenase (MDH2)",
                "Mitochondrial succinate dehydrogenase complex (SDHC)",
                "Mitochondrial succinate-CoA ligase (SCL)",
                "Mitochondrial succinyl-CoA synthetase alpha subunit (SUCS2)",
                "Mitochondrial succinyl-CoA synthetase beta subunit (SUCS1)",
                "Mitochondrial \u03b1-ketoglutarate dehydrogenase complex (KGD2)",
                "Succinate dehydrogenase (SDH)",
                "Succinyl-CoA synthetase (SCS)",
                "\u03b1-Ketoglutarate dehydrogenase complex (KGD)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate Synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate Dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate Dehydrogenase Complex (\u03b1-KGDH)",
            "Succinyl-CoA Synthetase (SCS)",
            "Succinate Dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate Dehydrogenase (MDH)",
            "NAD+-Isocitrate Dehydrogenase (NAD+-IDH)",
            "NADP+-Isocitrate Dehydrogenase (NADP+-IDH)",
            "Succinate Dehydrogenase (Complex II) (SDH)",
            "Fumarate Hydratase (Fumarase) (FH)",
            "Malate Dehydrogenase (NAD+) (MDH1)",
            "Malate Dehydrogenase (NADP+) (MDH2)",
            "Aconitase (aconitate hydratase) (ACO2)",
            "Succinyl-CoA Ligase (ADP-forming) (SUCLA2)",
            "Succinyl-CoA Ligase (GDP-forming) (SUCLG1)",
            "Isocitrate Dehydrogenase [NADP] (Cytosolic) (IDH3)",
            "Isocitrate Dehydrogenase [NADP] (Mitochondrial) (IDH1)",
            "Isocitrate Dehydrogenase [NAD] (Mitochondrial) (IDH2)",
            "\u03b1-Ketoglutarate Dehydrogenase (E1 Component) (OGDH)",
            "\u03b1-Ketoglutarate Dehydrogenase (E2 Component) (DLST)",
            "\u03b1-Ketoglutarate Dehydrogenase (E3 Component) (DLD)",
            "Citrate Synthase (CIT)",
            "Succinate Dehydrogenase [Flavoprotein] Subunit A (SDHA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate Synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate Dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate Dehydrogenase Complex (\u03b1-KGDH)",
                "Succinyl-CoA Synthetase (SCS)",
                "Succinate Dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate Dehydrogenase (MDH)",
                "NAD+-Isocitrate Dehydrogenase (NAD+-IDH)",
                "NADP+-Isocitrate Dehydrogenase (NADP+-IDH)",
                "Succinate Dehydrogenase (Complex II) (SDH)",
                "Fumarate Hydratase (Fumarase) (FH)",
                "Malate Dehydrogenase (NAD+) (MDH1)",
                "Malate Dehydrogenase (NADP+) (MDH2)",
                "Aconitase (aconitate hydratase) (ACO2)",
                "Succinyl-CoA Ligase (ADP-forming) (SUCLA2)",
                "Succinyl-CoA Ligase (GDP-forming) (SUCLG1)",
                "Isocitrate Dehydrogenase [NADP] (Cytosolic) (IDH3)",
                "Isocitrate Dehydrogenase [NADP] (Mitochondrial) (IDH1)",
                "Isocitrate Dehydrogenase [NAD] (Mitochondrial) (IDH2)",
                "\u03b1-Ketoglutarate Dehydrogenase (E1 Component) (OGDH)",
                "\u03b1-Ketoglutarate Dehydrogenase (E2 Component) (DLST)",
                "\u03b1-Ketoglutarate Dehydrogenase (E3 Component) (DLD)",
                "Citrate Synthase (CIT)"
            ],
            "mismatches": [
                "Succinate Dehydrogenase [Flavoprotein] Subunit A (SDHA)"
            ],
            "true_referents": [
                "Aconitase (ACO)",
                "Aconitase (aconitate hydratase) (ACO2)",
                "Citrate Synthase (CIT)",
                "Citrate Synthase (CS)",
                "Fumarase (FUM)",
                "Fumarate Hydratase (Fumarase) (FH)",
                "Isocitrate Dehydrogenase (IDH)",
                "Isocitrate Dehydrogenase [NADP] (Cytosolic) (IDH3)",
                "Isocitrate Dehydrogenase [NADP] (Mitochondrial) (IDH1)",
                "Isocitrate Dehydrogenase [NAD] (Mitochondrial) (IDH2)",
                "Malate Dehydrogenase (MDH)",
                "Malate Dehydrogenase (NAD+) (MDH1)",
                "Malate Dehydrogenase (NADP+) (MDH2)",
                "NAD+-Isocitrate Dehydrogenase (NAD+-IDH)",
                "NADP+-Isocitrate Dehydrogenase (NADP+-IDH)",
                "Succinate Dehydrogenase (Complex II) (SDH)",
                "Succinate Dehydrogenase (SDH)",
                "Succinyl-CoA Ligase (ADP-forming) (SUCLA2)",
                "Succinyl-CoA Ligase (GDP-forming) (SUCLG1)",
                "Succinyl-CoA Synthetase (SCS)",
                "\u03b1-Ketoglutarate Dehydrogenase (E1 Component) (OGDH)",
                "\u03b1-Ketoglutarate Dehydrogenase (E2 Component) (DLST)",
                "\u03b1-Ketoglutarate Dehydrogenase (E3 Component) (DLD)",
                "\u03b1-Ketoglutarate Dehydrogenase Complex (\u03b1-KGDH)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate dehydrogenase (\u03b1-KGDH)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate dehydrogenase (MDH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate dehydrogenase (\u03b1-KGDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate dehydrogenase (MDH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aconitase (ACO)",
                "Citrate synthase (CS)",
                "Fumarase (FUM)",
                "Isocitrate dehydrogenase (IDH)",
                "Malate dehydrogenase (MDH)",
                "Succinate dehydrogenase (SDH)",
                "Succinyl-CoA synthetase (SCS)",
                "\u03b1-Ketoglutarate dehydrogenase (\u03b1-KGDH)"
            ],
            "TP": 8,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate Synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate Dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate Dehydrogenase Complex (\u03b1-KGDH)",
            "Succinyl-CoA Synthetase (SCS)",
            "Succinate Dehydrogenase (SDH)",
            "Fumarate Hydratase (FH)",
            "Malate Dehydrogenase (MDH)",
            "Citrate Lyase (CLY)",
            "Aconitate Hydratase (ACH)",
            "Isocitrate Lyase (ICL)",
            "2-Oxoglutarate Ferredoxin Oxidoreductase (OGOR)",
            "Succinyl-CoA Reductase (SCR)",
            "Fumarate Reductase (FRD)",
            "Malic Enzyme (ME)",
            "Pyruvate Carboxylase (PYC)",
            "Phosphoenolpyruvate Carboxykinase (PEPCK)",
            "Glutamate Dehydrogenase (GDH)",
            "NAD+ dependent isocitrate dehydrogenase",
            "NADH dependent isocitrate dehydrogenase",
            "Succinate-ubiquinone oxidoreductase",
            "Fumarase",
            "Mitochondrial matrix malate dehydrogenase",
            "Cytosolic malate dehydrogenase"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate Synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate Dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate Dehydrogenase Complex (\u03b1-KGDH)",
                "Succinyl-CoA Synthetase (SCS)",
                "Succinate Dehydrogenase (SDH)",
                "Fumarate Hydratase (FH)",
                "Malate Dehydrogenase (MDH)",
                "Citrate Lyase (CLY)",
                "Aconitate Hydratase (ACH)",
                "Isocitrate Lyase (ICL)",
                "2-Oxoglutarate Ferredoxin Oxidoreductase (OGOR)",
                "Succinyl-CoA Reductase (SCR)",
                "Fumarate Reductase (FRD)",
                "Malic Enzyme (ME)",
                "Pyruvate Carboxylase (PYC)",
                "Phosphoenolpyruvate Carboxykinase (PEPCK)",
                "Glutamate Dehydrogenase (GDH)",
                "NAD+ dependent isocitrate dehydrogenase",
                "NADH dependent isocitrate dehydrogenase",
                "Succinate-ubiquinone oxidoreductase",
                "Fumarase",
                "Mitochondrial matrix malate dehydrogenase",
                "Cytosolic malate dehydrogenase"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Oxoglutarate Ferredoxin Oxidoreductase (OGOR)",
                "Aconitase (ACO)",
                "Aconitate Hydratase (ACH)",
                "Citrate Lyase (CLY)",
                "Citrate Synthase (CS)",
                "Cytosolic malate dehydrogenase",
                "Fumarase",
                "Fumarate Hydratase (FH)",
                "Fumarate Reductase (FRD)",
                "Glutamate Dehydrogenase (GDH)",
                "Isocitrate Dehydrogenase (IDH)",
                "Isocitrate Lyase (ICL)",
                "Malate Dehydrogenase (MDH)",
                "Malic Enzyme (ME)",
                "Mitochondrial matrix malate dehydrogenase",
                "NAD+ dependent isocitrate dehydrogenase",
                "NADH dependent isocitrate dehydrogenase",
                "Phosphoenolpyruvate Carboxykinase (PEPCK)",
                "Pyruvate Carboxylase (PYC)",
                "Succinate Dehydrogenase (SDH)",
                "Succinate-ubiquinone oxidoreductase",
                "Succinyl-CoA Reductase (SCR)",
                "Succinyl-CoA Synthetase (SCS)",
                "\u03b1-Ketoglutarate Dehydrogenase Complex (\u03b1-KGDH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "Alpha-ketoglutarate dehydrogenase (OGDH)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate dehydrogenase (MDH)",
            "NAD+-dependent isocitrate dehydrogenase (IDH3)",
            "NADP+-dependent isocitrate dehydrogenase (IDH1)",
            "NADP+-dependent isocitrate dehydrogenase (IDH2)",
            "Dihydrolipoamide dehydrogenase (DLD)",
            "Aconitate hydratase (ACO2)",
            "Fumarate hydratase (FH)",
            "Succinate-coenzyme Q reductase (SQR)",
            "Citrate (Si)-synthase",
            "2-Oxoglutarate dehydrogenase complex (OGDC)",
            "Aconitase 1 (ACO1)",
            "Aconitase 2 (ACO2)",
            "Isocitrate lyase (ICL)",
            "Malate synthase (MS)",
            "Succinyl-CoA ligase (SUCL)",
            "Malic enzyme (ME)",
            "Pyruvate dehydrogenase (PDH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "Alpha-ketoglutarate dehydrogenase (OGDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate dehydrogenase (MDH)",
                "NAD+-dependent isocitrate dehydrogenase (IDH3)",
                "NADP+-dependent isocitrate dehydrogenase (IDH1)",
                "NADP+-dependent isocitrate dehydrogenase (IDH2)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Aconitate hydratase (ACO2)",
                "Fumarate hydratase (FH)",
                "Succinate-coenzyme Q reductase (SQR)",
                "Citrate (Si)-synthase",
                "2-Oxoglutarate dehydrogenase complex (OGDC)",
                "Aconitase 1 (ACO1)",
                "Aconitase 2 (ACO2)",
                "Isocitrate lyase (ICL)",
                "Malate synthase (MS)",
                "Succinyl-CoA ligase (SUCL)",
                "Malic enzyme (ME)",
                "Pyruvate dehydrogenase (PDH)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Oxoglutarate dehydrogenase complex (OGDC)",
                "Aconitase (ACO)",
                "Aconitase 1 (ACO1)",
                "Aconitase 2 (ACO2)",
                "Aconitate hydratase (ACO2)",
                "Alpha-ketoglutarate dehydrogenase (OGDH)",
                "Citrate (Si)-synthase",
                "Citrate synthase (CS)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Fumarase (FUM)",
                "Fumarate hydratase (FH)",
                "Isocitrate dehydrogenase (IDH)",
                "Isocitrate lyase (ICL)",
                "Malate dehydrogenase (MDH)",
                "Malate synthase (MS)",
                "Malic enzyme (ME)",
                "NAD+-dependent isocitrate dehydrogenase (IDH3)",
                "NADP+-dependent isocitrate dehydrogenase (IDH1)",
                "NADP+-dependent isocitrate dehydrogenase (IDH2)",
                "Pyruvate dehydrogenase (PDH)",
                "Succinate dehydrogenase (SDH)",
                "Succinate-coenzyme Q reductase (SQR)",
                "Succinyl-CoA ligase (SUCL)",
                "Succinyl-CoA synthetase (SCS)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "Alpha-ketoglutarate dehydrogenase (KGDH)",
            "Succinyl-CoA synthetase (SUCLG)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FH)",
            "Malate dehydrogenase (MDH)",
            "NAD+-dependent isocitrate dehydrogenase (IDH1)",
            "NADP+-dependent isocitrate dehydrogenase (IDH2)",
            "Alpha-ketoglutarate dehydrogenase complex (KGDHC)",
            "Succinate-CoA ligase (SUCL)",
            "Fumarate hydratase (FH)",
            "NADH dehydrogenase (complex I)",
            "Succinate-ubiquinone oxidoreductase (complex II)",
            "Malate synthase (MLS)",
            "Citrate lyase (ACL)",
            "Pyruvate dehydrogenase (PDH)",
            "Pyruvate carboxylase (PC)",
            "Acetyl-CoA carboxylase (ACC)",
            "Citrate transporter (SLC25A1)",
            "Malate-aspartate shuttle enzymes (MDH, GOT)",
            "NADH oxidase (Nox)",
            "GTP-dependent succinate synthase (GTP-SS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "Alpha-ketoglutarate dehydrogenase (KGDH)",
                "Succinyl-CoA synthetase (SUCLG)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FH)",
                "Malate dehydrogenase (MDH)",
                "NAD+-dependent isocitrate dehydrogenase (IDH1)",
                "NADP+-dependent isocitrate dehydrogenase (IDH2)",
                "Alpha-ketoglutarate dehydrogenase complex (KGDHC)",
                "Succinate-CoA ligase (SUCL)",
                "Fumarate hydratase (FH)",
                "NADH dehydrogenase (complex I)",
                "Succinate-ubiquinone oxidoreductase (complex II)",
                "Malate synthase (MLS)",
                "Citrate lyase (ACL)",
                "Pyruvate dehydrogenase (PDH)",
                "Pyruvate carboxylase (PC)",
                "Acetyl-CoA carboxylase (ACC)",
                "Citrate transporter (SLC25A1)",
                "Malate-aspartate shuttle enzymes (MDH, GOT)",
                "NADH oxidase (Nox)",
                "GTP-dependent succinate synthase (GTP-SS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl-CoA carboxylase (ACC)",
                "Aconitase (ACO)",
                "Alpha-ketoglutarate dehydrogenase (KGDH)",
                "Alpha-ketoglutarate dehydrogenase complex (KGDHC)",
                "Citrate lyase (ACL)",
                "Citrate synthase (CS)",
                "Citrate transporter (SLC25A1)",
                "Fumarase (FH)",
                "Fumarate hydratase (FH)",
                "GTP-dependent succinate synthase (GTP-SS)",
                "Isocitrate dehydrogenase (IDH)",
                "Malate dehydrogenase (MDH)",
                "Malate synthase (MLS)",
                "Malate-aspartate shuttle enzymes (MDH, GOT)",
                "NAD+-dependent isocitrate dehydrogenase (IDH1)",
                "NADH dehydrogenase (complex I)",
                "NADH oxidase (Nox)",
                "NADP+-dependent isocitrate dehydrogenase (IDH2)",
                "Pyruvate carboxylase (PC)",
                "Pyruvate dehydrogenase (PDH)",
                "Succinate dehydrogenase (SDH)",
                "Succinate-CoA ligase (SUCL)",
                "Succinate-ubiquinone oxidoreductase (complex II)",
                "Succinyl-CoA synthetase (SUCLG)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "Alpha-ketoglutarate dehydrogenase (\u03b1-KGDH)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate dehydrogenase (MDH)",
            "Dihydrolipoyl dehydrogenase (DLD)",
            "Dihydrolipoyl transsuccinylase (DLST)",
            "Dihydrolipoyl transacetylase (DLAT)",
            "Flavoprotein subunit of succinate dehydrogenase (SDHA)",
            "Iron-sulfur subunit of succinate dehydrogenase (SDHB)",
            "Succinate dehydrogenase cytochrome b560 subunit (SDHC)",
            "Succinate dehydrogenase assembly factor 1 (SDHAF1)",
            "Succinate dehydrogenase assembly factor 2 (SDHAF2)",
            "Iron-sulfur cluster assembly enzyme (ISCU)",
            "NADH dehydrogenase (ubiquinone) flavoprotein 1 (NDUFV1)",
            "NADH dehydrogenase (ubiquinone) iron-sulfur protein 2 (NDUFS2)",
            "NADH dehydrogenase (ubiquinone) iron-sulfur protein 7 (NDUFS7)",
            "NADH dehydrogenase (ubiquinone) iron-sulfur protein 8 (NDUFS8)",
            "Electron transfer flavoprotein-ubiquinone oxidoreductase (ETFQO)",
            "2-oxoglutarate dehydrogenase E1 component (OGDH)",
            "2-oxoglutarate dehydrogenase E2 component (DLST)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "Alpha-ketoglutarate dehydrogenase (\u03b1-KGDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate dehydrogenase (MDH)",
                "Dihydrolipoyl dehydrogenase (DLD)",
                "Dihydrolipoyl transsuccinylase (DLST)",
                "Dihydrolipoyl transacetylase (DLAT)",
                "Flavoprotein subunit of succinate dehydrogenase (SDHA)",
                "Iron-sulfur subunit of succinate dehydrogenase (SDHB)",
                "Succinate dehydrogenase cytochrome b560 subunit (SDHC)",
                "Succinate dehydrogenase assembly factor 1 (SDHAF1)",
                "Succinate dehydrogenase assembly factor 2 (SDHAF2)",
                "Iron-sulfur cluster assembly enzyme (ISCU)",
                "NADH dehydrogenase (ubiquinone) flavoprotein 1 (NDUFV1)",
                "NADH dehydrogenase (ubiquinone) iron-sulfur protein 2 (NDUFS2)",
                "NADH dehydrogenase (ubiquinone) iron-sulfur protein 7 (NDUFS7)",
                "NADH dehydrogenase (ubiquinone) iron-sulfur protein 8 (NDUFS8)",
                "Electron transfer flavoprotein-ubiquinone oxidoreductase (ETFQO)",
                "2-oxoglutarate dehydrogenase E1 component (OGDH)",
                "2-oxoglutarate dehydrogenase E2 component (DLST)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-oxoglutarate dehydrogenase E1 component (OGDH)",
                "2-oxoglutarate dehydrogenase E2 component (DLST)",
                "Aconitase (ACO)",
                "Alpha-ketoglutarate dehydrogenase (\u03b1-KGDH)",
                "Citrate synthase (CS)",
                "Dihydrolipoyl dehydrogenase (DLD)",
                "Dihydrolipoyl transacetylase (DLAT)",
                "Dihydrolipoyl transsuccinylase (DLST)",
                "Electron transfer flavoprotein-ubiquinone oxidoreductase (ETFQO)",
                "Flavoprotein subunit of succinate dehydrogenase (SDHA)",
                "Fumarase (FUM)",
                "Iron-sulfur cluster assembly enzyme (ISCU)",
                "Iron-sulfur subunit of succinate dehydrogenase (SDHB)",
                "Isocitrate dehydrogenase (IDH)",
                "Malate dehydrogenase (MDH)",
                "NADH dehydrogenase (ubiquinone) flavoprotein 1 (NDUFV1)",
                "NADH dehydrogenase (ubiquinone) iron-sulfur protein 2 (NDUFS2)",
                "NADH dehydrogenase (ubiquinone) iron-sulfur protein 7 (NDUFS7)",
                "NADH dehydrogenase (ubiquinone) iron-sulfur protein 8 (NDUFS8)",
                "Succinate dehydrogenase (SDH)",
                "Succinate dehydrogenase assembly factor 1 (SDHAF1)",
                "Succinate dehydrogenase assembly factor 2 (SDHAF2)",
                "Succinate dehydrogenase cytochrome b560 subunit (SDHC)",
                "Succinyl-CoA synthetase (SCS)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "Alpha-ketoglutarate dehydrogenase (\u03b1-KGDH)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate dehydrogenase (MDH)",
            "Pyruvate dehydrogenase (PDH)",
            "Citrate (cis-aconitate) isomerase",
            "Citrate transporter",
            "Isocitrate lyase (ICL)",
            "Isocitrate dehydrogenase kinase (IDHK)",
            "Isocitrate dehydrogenase phosphatase (IDHP)",
            "Alpha-ketoglutarate transporter",
            "Alpha-ketoglutarate dehydrogenase kinase (\u03b1-KGDHK)",
            "Alpha-ketoglutarate dehydrogenase phosphatase (\u03b1-KGDHP)",
            "Succinyl-CoA transporter",
            "Succinate dehydrogenase kinase (SDHK)",
            "Succinate dehydrogenase phosphatase (SDHP)",
            "Fumarase hydratase",
            "Malate transporter",
            "Malate dehydrogenase kinase (MDHK)",
            "Malate dehydrogenase phosphatase (MDHP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "Alpha-ketoglutarate dehydrogenase (\u03b1-KGDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate dehydrogenase (MDH)",
                "Pyruvate dehydrogenase (PDH)",
                "Citrate (cis-aconitate) isomerase",
                "Citrate transporter",
                "Isocitrate lyase (ICL)",
                "Isocitrate dehydrogenase kinase (IDHK)",
                "Isocitrate dehydrogenase phosphatase (IDHP)",
                "Alpha-ketoglutarate transporter",
                "Alpha-ketoglutarate dehydrogenase kinase (\u03b1-KGDHK)",
                "Alpha-ketoglutarate dehydrogenase phosphatase (\u03b1-KGDHP)",
                "Succinyl-CoA transporter",
                "Succinate dehydrogenase kinase (SDHK)",
                "Succinate dehydrogenase phosphatase (SDHP)",
                "Fumarase hydratase",
                "Malate transporter",
                "Malate dehydrogenase kinase (MDHK)",
                "Malate dehydrogenase phosphatase (MDHP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aconitase (ACO)",
                "Alpha-ketoglutarate dehydrogenase (\u03b1-KGDH)",
                "Alpha-ketoglutarate dehydrogenase kinase (\u03b1-KGDHK)",
                "Alpha-ketoglutarate dehydrogenase phosphatase (\u03b1-KGDHP)",
                "Alpha-ketoglutarate transporter",
                "Citrate (cis-aconitate) isomerase",
                "Citrate synthase (CS)",
                "Citrate transporter",
                "Fumarase (FUM)",
                "Fumarase hydratase",
                "Isocitrate dehydrogenase (IDH)",
                "Isocitrate dehydrogenase kinase (IDHK)",
                "Isocitrate dehydrogenase phosphatase (IDHP)",
                "Isocitrate lyase (ICL)",
                "Malate dehydrogenase (MDH)",
                "Malate dehydrogenase kinase (MDHK)",
                "Malate dehydrogenase phosphatase (MDHP)",
                "Malate transporter",
                "Pyruvate dehydrogenase (PDH)",
                "Succinate dehydrogenase (SDH)",
                "Succinate dehydrogenase kinase (SDHK)",
                "Succinate dehydrogenase phosphatase (SDHP)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinyl-CoA transporter"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate Synthase (CS)",
            "Aconitase 1 (ACO1)",
            "Aconitase 2 (ACO2)",
            "Isocitrate Dehydrogenase 1 (IDH1)",
            "Isocitrate Dehydrogenase 2 (IDH2)",
            "Isocitrate Dehydrogenase 3 alpha (IDH3A)",
            "Isocitrate Dehydrogenase 3 beta (IDH3B)",
            "Isocitrate Dehydrogenase 3 gamma (IDH3G)",
            "Alpha-Ketoglutarate Dehydrogenase (KGDH)",
            "E1 Component of Alpha-Ketoglutarate Dehydrogenase (OGDH)",
            "E2 Component of Alpha-Ketoglutarate Dehydrogenase (DLST)",
            "E3 Component of Alpha-Ketoglutarate Dehydrogenase (DLD)",
            "Succinyl-CoA Synthetase Subunit Alpha (SUCLA)",
            "Succinyl-CoA Synthetase Subunit Beta (SUCLG)",
            "Succinate Dehydrogenase Subunit A (SDHA)",
            "Succinate Dehydrogenase Subunit B (SDHB)",
            "Succinate Dehydrogenase Subunit C (SDHC)",
            "Succinate Dehydrogenase Subunit D (SDHD)",
            "Fumarase (FH)",
            "Malate Dehydrogenase 1 (MDH1)",
            "Malate Dehydrogenase 2 (MDH2)",
            "Malate Dehydrogenase 3 (MDH3)",
            "Malate Dehydrogenase 4 (MDH4)",
            "Succinate-CoA Ligase (SUCL)",
            "Succinic Dehydrogenase (SDH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate Synthase (CS)",
                "Aconitase 1 (ACO1)",
                "Aconitase 2 (ACO2)",
                "Isocitrate Dehydrogenase 1 (IDH1)",
                "Isocitrate Dehydrogenase 2 (IDH2)",
                "Isocitrate Dehydrogenase 3 alpha (IDH3A)",
                "Isocitrate Dehydrogenase 3 beta (IDH3B)",
                "Isocitrate Dehydrogenase 3 gamma (IDH3G)",
                "Alpha-Ketoglutarate Dehydrogenase (KGDH)",
                "E1 Component of Alpha-Ketoglutarate Dehydrogenase (OGDH)",
                "E2 Component of Alpha-Ketoglutarate Dehydrogenase (DLST)",
                "E3 Component of Alpha-Ketoglutarate Dehydrogenase (DLD)",
                "Succinyl-CoA Synthetase Subunit Alpha (SUCLA)",
                "Succinyl-CoA Synthetase Subunit Beta (SUCLG)",
                "Succinate Dehydrogenase Subunit A (SDHA)",
                "Succinate Dehydrogenase Subunit B (SDHB)",
                "Succinate Dehydrogenase Subunit C (SDHC)",
                "Succinate Dehydrogenase Subunit D (SDHD)",
                "Fumarase (FH)",
                "Malate Dehydrogenase 1 (MDH1)",
                "Malate Dehydrogenase 2 (MDH2)",
                "Malate Dehydrogenase 3 (MDH3)",
                "Malate Dehydrogenase 4 (MDH4)",
                "Succinate-CoA Ligase (SUCL)"
            ],
            "mismatches": [
                "Succinic Dehydrogenase (SDH)"
            ],
            "true_referents": [
                "Aconitase 1 (ACO1)",
                "Aconitase 2 (ACO2)",
                "Alpha-Ketoglutarate Dehydrogenase (KGDH)",
                "Citrate Synthase (CS)",
                "E1 Component of Alpha-Ketoglutarate Dehydrogenase (OGDH)",
                "E2 Component of Alpha-Ketoglutarate Dehydrogenase (DLST)",
                "E3 Component of Alpha-Ketoglutarate Dehydrogenase (DLD)",
                "Fumarase (FH)",
                "Isocitrate Dehydrogenase 1 (IDH1)",
                "Isocitrate Dehydrogenase 2 (IDH2)",
                "Isocitrate Dehydrogenase 3 alpha (IDH3A)",
                "Isocitrate Dehydrogenase 3 beta (IDH3B)",
                "Isocitrate Dehydrogenase 3 gamma (IDH3G)",
                "Malate Dehydrogenase 1 (MDH1)",
                "Malate Dehydrogenase 2 (MDH2)",
                "Malate Dehydrogenase 3 (MDH3)",
                "Malate Dehydrogenase 4 (MDH4)",
                "Succinate Dehydrogenase Subunit A (SDHA)",
                "Succinate Dehydrogenase Subunit B (SDHB)",
                "Succinate Dehydrogenase Subunit C (SDHC)",
                "Succinate Dehydrogenase Subunit D (SDHD)",
                "Succinate-CoA Ligase (SUCL)",
                "Succinyl-CoA Synthetase Subunit Alpha (SUCLA)",
                "Succinyl-CoA Synthetase Subunit Beta (SUCLG)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate dehydrogenase complex (OGDC)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FH)",
            "Malate dehydrogenase (MDH)",
            "Pyruvate dehydrogenase complex (PDC)",
            "Dihydrolipoyl dehydrogenase (DLD)",
            "Dihydrolipoyl transacetylase (DLAT)",
            "Succinyl-CoA:3-ketoacid coenzyme A transferase (SCOT)",
            "2-oxoglutarate dehydrogenase (OGDH)",
            "Dihydrolipoyllysine-residue succinyltransferase (DLST)",
            "Isocitrate dehydrogenase [NAD] subunit alpha (IDH3A)",
            "Isocitrate dehydrogenase [NAD] subunit beta (IDH3B)",
            "Isocitrate dehydrogenase [NAD] subunit gamma (IDH3G)",
            "Succinate-CoA ligase [ADP-forming] subunit beta (SUCLA2)",
            "Succinate-CoA ligase [GDP-forming] subunit beta (SUCLG2)",
            "Succinate-CoA ligase [ADP/GDP-forming] subunit alpha (SUCLG1)",
            "Succinate dehydrogenase cytochrome b560 subunit (SDHC)",
            "Succinate dehydrogenase [ubiquinone] iron-sulfur subunit (SDHB)",
            "Succinate dehydrogenase [ubiquinone] flavoprotein subunit (SDHA)",
            "Succinate dehydrogenase assembly factor 2 (SDHAF2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate dehydrogenase complex (OGDC)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FH)",
                "Malate dehydrogenase (MDH)",
                "Pyruvate dehydrogenase complex (PDC)",
                "Dihydrolipoyl dehydrogenase (DLD)",
                "Dihydrolipoyl transacetylase (DLAT)",
                "Succinyl-CoA:3-ketoacid coenzyme A transferase (SCOT)",
                "2-oxoglutarate dehydrogenase (OGDH)",
                "Dihydrolipoyllysine-residue succinyltransferase (DLST)",
                "Isocitrate dehydrogenase [NAD] subunit alpha (IDH3A)",
                "Isocitrate dehydrogenase [NAD] subunit beta (IDH3B)",
                "Isocitrate dehydrogenase [NAD] subunit gamma (IDH3G)",
                "Succinate-CoA ligase [ADP-forming] subunit beta (SUCLA2)",
                "Succinate-CoA ligase [GDP-forming] subunit beta (SUCLG2)",
                "Succinate-CoA ligase [ADP/GDP-forming] subunit alpha (SUCLG1)",
                "Succinate dehydrogenase cytochrome b560 subunit (SDHC)",
                "Succinate dehydrogenase [ubiquinone] iron-sulfur subunit (SDHB)",
                "Succinate dehydrogenase [ubiquinone] flavoprotein subunit (SDHA)",
                "Succinate dehydrogenase assembly factor 2 (SDHAF2)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-oxoglutarate dehydrogenase (OGDH)",
                "Aconitase (ACO)",
                "Citrate synthase (CS)",
                "Dihydrolipoyl dehydrogenase (DLD)",
                "Dihydrolipoyl transacetylase (DLAT)",
                "Dihydrolipoyllysine-residue succinyltransferase (DLST)",
                "Fumarase (FH)",
                "Isocitrate dehydrogenase (IDH)",
                "Isocitrate dehydrogenase [NAD] subunit alpha (IDH3A)",
                "Isocitrate dehydrogenase [NAD] subunit beta (IDH3B)",
                "Isocitrate dehydrogenase [NAD] subunit gamma (IDH3G)",
                "Malate dehydrogenase (MDH)",
                "Pyruvate dehydrogenase complex (PDC)",
                "Succinate dehydrogenase (SDH)",
                "Succinate dehydrogenase [ubiquinone] flavoprotein subunit (SDHA)",
                "Succinate dehydrogenase [ubiquinone] iron-sulfur subunit (SDHB)",
                "Succinate dehydrogenase assembly factor 2 (SDHAF2)",
                "Succinate dehydrogenase cytochrome b560 subunit (SDHC)",
                "Succinate-CoA ligase [ADP-forming] subunit beta (SUCLA2)",
                "Succinate-CoA ligase [ADP/GDP-forming] subunit alpha (SUCLG1)",
                "Succinate-CoA ligase [GDP-forming] subunit beta (SUCLG2)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinyl-CoA:3-ketoacid coenzyme A transferase (SCOT)",
                "\u03b1-Ketoglutarate dehydrogenase complex (OGDC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate dehydrogenase complex (KGDHC)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FH)",
            "Malate dehydrogenase (MDH)",
            "Pyruvate dehydrogenase complex (PDHC)",
            "Pyruvate carboxylase (PC)",
            "Phosphoenolpyruvate carboxykinase (PEPCK)",
            "Malic enzyme (ME)",
            "Glutamate dehydrogenase (GLUD)",
            "Aspartate aminotransferase (AST)",
            "Alanine aminotransferase (ALT)",
            "Dihydrolipoamide dehydrogenase (DLD)",
            "Dihydrolipoamide acetyltransferase (DLAT)",
            "Dihydrolipoamide succinyltransferase (DLST)",
            "Oxoglutarate dehydrogenase (OGDH)",
            "Succinyl-CoA ligase (SUCLG)",
            "Succinate-CoA ligase (SUCL)",
            "2-Oxoglutarate dehydrogenase (OGDH)",
            "Isocitrate lyase (ICL)",
            "Malate synthase (MS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate dehydrogenase complex (KGDHC)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FH)",
                "Malate dehydrogenase (MDH)",
                "Pyruvate dehydrogenase complex (PDHC)",
                "Pyruvate carboxylase (PC)",
                "Phosphoenolpyruvate carboxykinase (PEPCK)",
                "Malic enzyme (ME)",
                "Glutamate dehydrogenase (GLUD)",
                "Aspartate aminotransferase (AST)",
                "Alanine aminotransferase (ALT)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Dihydrolipoamide acetyltransferase (DLAT)",
                "Dihydrolipoamide succinyltransferase (DLST)",
                "Oxoglutarate dehydrogenase (OGDH)",
                "Succinyl-CoA ligase (SUCLG)",
                "Succinate-CoA ligase (SUCL)",
                "2-Oxoglutarate dehydrogenase (OGDH)",
                "Isocitrate lyase (ICL)",
                "Malate synthase (MS)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Oxoglutarate dehydrogenase (OGDH)",
                "Aconitase (ACO)",
                "Alanine aminotransferase (ALT)",
                "Aspartate aminotransferase (AST)",
                "Citrate synthase (CS)",
                "Dihydrolipoamide acetyltransferase (DLAT)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Dihydrolipoamide succinyltransferase (DLST)",
                "Fumarase (FH)",
                "Glutamate dehydrogenase (GLUD)",
                "Isocitrate dehydrogenase (IDH)",
                "Isocitrate lyase (ICL)",
                "Malate dehydrogenase (MDH)",
                "Malate synthase (MS)",
                "Malic enzyme (ME)",
                "Oxoglutarate dehydrogenase (OGDH)",
                "Phosphoenolpyruvate carboxykinase (PEPCK)",
                "Pyruvate carboxylase (PC)",
                "Pyruvate dehydrogenase complex (PDHC)",
                "Succinate dehydrogenase (SDH)",
                "Succinate-CoA ligase (SUCL)",
                "Succinyl-CoA ligase (SUCLG)",
                "Succinyl-CoA synthetase (SCS)",
                "\u03b1-Ketoglutarate dehydrogenase complex (KGDHC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate dehydrogenase complex (\u03b1-KGDHC)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate dehydrogenase (MDH)",
            "Pyruvate dehydrogenase complex (PDC)",
            "Pyruvate carboxylase (PC)",
            "Isocitrate lyase (ICL)",
            "Malate synthase (MS)",
            "2-Oxoglutarate dehydrogenase complex (OGDC)",
            "Succinate-semialdehyde dehydrogenase (SSADH)",
            "Succinyl-CoA:3-ketoacid-coenzyme A transferase (SCOT)",
            "Methylcitrate dehydratase (MCD)",
            "Methylcitrate synthase (MCS)",
            "Methylisocitrate lyase (MCL)",
            "Citramalate synthase (CMS)",
            "Mesaconyl-CoA hydratase (MCH)",
            "\u03b2-Methylmalyl-CoA lyase (MMCL)",
            "Glutaconyl-CoA decarboxylase (GCD)",
            "Crotonyl-CoA carboxylase/reductase (CCR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate dehydrogenase complex (\u03b1-KGDHC)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate dehydrogenase (MDH)",
                "Pyruvate dehydrogenase complex (PDC)",
                "Pyruvate carboxylase (PC)",
                "Isocitrate lyase (ICL)",
                "Malate synthase (MS)",
                "2-Oxoglutarate dehydrogenase complex (OGDC)",
                "Succinate-semialdehyde dehydrogenase (SSADH)",
                "Succinyl-CoA:3-ketoacid-coenzyme A transferase (SCOT)",
                "Methylcitrate dehydratase (MCD)",
                "Methylcitrate synthase (MCS)",
                "Methylisocitrate lyase (MCL)",
                "Citramalate synthase (CMS)",
                "Mesaconyl-CoA hydratase (MCH)",
                "\u03b2-Methylmalyl-CoA lyase (MMCL)",
                "Glutaconyl-CoA decarboxylase (GCD)",
                "Crotonyl-CoA carboxylase/reductase (CCR)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Oxoglutarate dehydrogenase complex (OGDC)",
                "Aconitase (ACO)",
                "Citramalate synthase (CMS)",
                "Citrate synthase (CS)",
                "Crotonyl-CoA carboxylase/reductase (CCR)",
                "Fumarase (FUM)",
                "Glutaconyl-CoA decarboxylase (GCD)",
                "Isocitrate dehydrogenase (IDH)",
                "Isocitrate lyase (ICL)",
                "Malate dehydrogenase (MDH)",
                "Malate synthase (MS)",
                "Mesaconyl-CoA hydratase (MCH)",
                "Methylcitrate dehydratase (MCD)",
                "Methylcitrate synthase (MCS)",
                "Methylisocitrate lyase (MCL)",
                "Pyruvate carboxylase (PC)",
                "Pyruvate dehydrogenase complex (PDC)",
                "Succinate dehydrogenase (SDH)",
                "Succinate-semialdehyde dehydrogenase (SSADH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinyl-CoA:3-ketoacid-coenzyme A transferase (SCOT)",
                "\u03b1-Ketoglutarate dehydrogenase complex (\u03b1-KGDHC)",
                "\u03b2-Methylmalyl-CoA lyase (MMCL)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate Synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate Dehydrogenase (IDH)",
            "\u03b1-Ketoglutarate Dehydrogenase (OGDH)",
            "Succinyl-CoA Synthetase (SUCLG)",
            "Succinate Dehydrogenase (SDH)",
            "Fumarase (FH)",
            "Malate Dehydrogenase (MDH)",
            "Pyruvate Dehydrogenase (PDH)",
            "Dihydrolipoyl Dehydrogenase (DLD)",
            "Dihydrolipoyl Transacetylase (DLAT)",
            "Dihydrolipoyl Lysine-Residue Acetyltransferase (DLAT)",
            "Pyruvate Carboxylase (PC)",
            "Phosphoenolpyruvate Carboxykinase (PEPCK)",
            "Malic Enzyme (ME)",
            "Glutamate Dehydrogenase (GDH)",
            "Isocitrate Lyase (ICL)",
            "Malate Synthase (MS)",
            "Oxoglutarate Dehydrogenase (OGDH)",
            "Oxoglutarate Decarboxylase (OGDC)",
            "Oxoglutarate Dehydrogenase Complex (OGDC)",
            "Succinyl-CoA Ligase (SUCL)",
            "Succinate-CoA Ligase (SUCL)",
            "Succinate Thiokinase (SUCL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate Synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate Dehydrogenase (IDH)",
                "\u03b1-Ketoglutarate Dehydrogenase (OGDH)",
                "Succinyl-CoA Synthetase (SUCLG)",
                "Succinate Dehydrogenase (SDH)",
                "Fumarase (FH)",
                "Malate Dehydrogenase (MDH)",
                "Pyruvate Dehydrogenase (PDH)",
                "Dihydrolipoyl Dehydrogenase (DLD)",
                "Dihydrolipoyl Transacetylase (DLAT)",
                "Dihydrolipoyl Lysine-Residue Acetyltransferase (DLAT)",
                "Pyruvate Carboxylase (PC)",
                "Phosphoenolpyruvate Carboxykinase (PEPCK)",
                "Malic Enzyme (ME)",
                "Glutamate Dehydrogenase (GDH)",
                "Isocitrate Lyase (ICL)",
                "Malate Synthase (MS)",
                "Oxoglutarate Dehydrogenase (OGDH)",
                "Oxoglutarate Decarboxylase (OGDC)",
                "Oxoglutarate Dehydrogenase Complex (OGDC)",
                "Succinyl-CoA Ligase (SUCL)",
                "Succinate-CoA Ligase (SUCL)",
                "Succinate Thiokinase (SUCL)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aconitase (ACO)",
                "Citrate Synthase (CS)",
                "Dihydrolipoyl Dehydrogenase (DLD)",
                "Dihydrolipoyl Lysine-Residue Acetyltransferase (DLAT)",
                "Dihydrolipoyl Transacetylase (DLAT)",
                "Fumarase (FH)",
                "Glutamate Dehydrogenase (GDH)",
                "Isocitrate Dehydrogenase (IDH)",
                "Isocitrate Lyase (ICL)",
                "Malate Dehydrogenase (MDH)",
                "Malate Synthase (MS)",
                "Malic Enzyme (ME)",
                "Oxoglutarate Decarboxylase (OGDC)",
                "Oxoglutarate Dehydrogenase (OGDH)",
                "Oxoglutarate Dehydrogenase Complex (OGDC)",
                "Phosphoenolpyruvate Carboxykinase (PEPCK)",
                "Pyruvate Carboxylase (PC)",
                "Pyruvate Dehydrogenase (PDH)",
                "Succinate Dehydrogenase (SDH)",
                "Succinate Thiokinase (SUCL)",
                "Succinate-CoA Ligase (SUCL)",
                "Succinyl-CoA Ligase (SUCL)",
                "Succinyl-CoA Synthetase (SUCLG)",
                "\u03b1-Ketoglutarate Dehydrogenase (OGDH)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "Alpha-ketoglutarate dehydrogenase (AKGDH)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FUM)",
            "Malate dehydrogenase (MDH)",
            "Citrate lyase (CLY)",
            "Citrate lyase alpha subunit (CLYA)",
            "Citrate lyase beta subunit (CLYB)",
            "Aconitase 1 (ACO1)",
            "Aconitase 2 (ACO2)",
            "Isocitrate dehydrogenase 1 (IDH1)",
            "Isocitrate dehydrogenase 2 (IDH2)",
            "Isocitrate dehydrogenase 3 (IDH3)",
            "Alpha-ketoglutarate dehydrogenase complex (AKGDHC)",
            "Succinyl-CoA synthetase alpha subunit (SCSA)",
            "Succinyl-CoA synthetase beta subunit (SCSB)",
            "Succinate dehydrogenase flavoprotein subunit (SDHF)",
            "Succinate dehydrogenase iron-sulfur subunit (SDHIS)",
            "Fumarase cytosolic (FUMC)",
            "Fumarase mitochondrial (FUMM)",
            "Malate dehydrogenase cytosolic (MDHC)",
            "Malate dehydrogenase mitochondrial (MDHM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "Alpha-ketoglutarate dehydrogenase (AKGDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FUM)",
                "Malate dehydrogenase (MDH)",
                "Citrate lyase (CLY)",
                "Citrate lyase alpha subunit (CLYA)",
                "Citrate lyase beta subunit (CLYB)",
                "Aconitase 1 (ACO1)",
                "Aconitase 2 (ACO2)",
                "Isocitrate dehydrogenase 1 (IDH1)",
                "Isocitrate dehydrogenase 2 (IDH2)",
                "Isocitrate dehydrogenase 3 (IDH3)",
                "Alpha-ketoglutarate dehydrogenase complex (AKGDHC)",
                "Succinyl-CoA synthetase alpha subunit (SCSA)",
                "Succinyl-CoA synthetase beta subunit (SCSB)",
                "Succinate dehydrogenase flavoprotein subunit (SDHF)",
                "Succinate dehydrogenase iron-sulfur subunit (SDHIS)",
                "Fumarase cytosolic (FUMC)",
                "Fumarase mitochondrial (FUMM)",
                "Malate dehydrogenase cytosolic (MDHC)"
            ],
            "mismatches": [
                "Malate dehydrogenase mitochondrial (MDHM)"
            ],
            "true_referents": [
                "Aconitase (ACO)",
                "Aconitase 1 (ACO1)",
                "Aconitase 2 (ACO2)",
                "Alpha-ketoglutarate dehydrogenase (AKGDH)",
                "Alpha-ketoglutarate dehydrogenase complex (AKGDHC)",
                "Citrate lyase (CLY)",
                "Citrate lyase alpha subunit (CLYA)",
                "Citrate lyase beta subunit (CLYB)",
                "Citrate synthase (CS)",
                "Fumarase (FUM)",
                "Fumarase cytosolic (FUMC)",
                "Fumarase mitochondrial (FUMM)",
                "Isocitrate dehydrogenase (IDH)",
                "Isocitrate dehydrogenase 1 (IDH1)",
                "Isocitrate dehydrogenase 2 (IDH2)",
                "Isocitrate dehydrogenase 3 (IDH3)",
                "Malate dehydrogenase (MDH)",
                "Malate dehydrogenase cytosolic (MDHC)",
                "Succinate dehydrogenase (SDH)",
                "Succinate dehydrogenase flavoprotein subunit (SDHF)",
                "Succinate dehydrogenase iron-sulfur subunit (SDHIS)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinyl-CoA synthetase alpha subunit (SCSA)",
                "Succinyl-CoA synthetase beta subunit (SCSB)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            "aconitase (ACO2)",
            "citrate synthase (CS)",
            "isocitrate dehydrogenase (IDH)",
            "isocitrate dehydrogenase 3 (NAD+) (IDH3)",
            "2-oxoglutarate dehydrogenase (OGDH)",
            "oxoglutarate dehydrogenase complex (OGDC)",
            "dihydrolipoyl dehydrogenase (DLD)",
            "dihydrolipoyl transsuccinylase (DLST)",
            "alpha-ketoglutarate dehydrogenase kinase (MAT1A)",
            "oxoglutarate dehydrogenase inhibitor (OGDI)",
            "citrate (Si)-synthase (CITRS)",
            "aconitate hydratase (AH)",
            "aconitase 1 (ACO1)",
            "isocitrate dehydrogenase 1 (NADP+) (IDH1)",
            "isocitrate dehydrogenase 2 (NADP+) (IDH2)",
            "2-oxoglutarate dehydrogenase E1 component (OGDH-E1)",
            "2-oxoglutarate dehydrogenase E2 component (OGDH-E2)",
            "2-oxoglutarate dehydrogenase E3 component (OGDH-E3)",
            "dihydrolipoyl transketolase (DLTK)",
            "dihydrolipoyl dehydrogenase (DLD)",
            "oxoglutarate dehydrogenase complex component E1 (OGDC-E1)",
            "oxoglutarate dehydrogenase complex component E2 (OGDC-E2)",
            "oxoglutarate dehydrogenase complex component E3 (OGDC-E3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "aconitase (ACO2)",
                "citrate synthase (CS)",
                "isocitrate dehydrogenase (IDH)",
                "isocitrate dehydrogenase 3 (NAD+) (IDH3)",
                "2-oxoglutarate dehydrogenase (OGDH)",
                "oxoglutarate dehydrogenase complex (OGDC)",
                "dihydrolipoyl dehydrogenase (DLD)",
                "dihydrolipoyl transsuccinylase (DLST)",
                "alpha-ketoglutarate dehydrogenase kinase (MAT1A)",
                "oxoglutarate dehydrogenase inhibitor (OGDI)",
                "citrate (Si)-synthase (CITRS)",
                "aconitate hydratase (AH)",
                "aconitase 1 (ACO1)",
                "isocitrate dehydrogenase 1 (NADP+) (IDH1)",
                "isocitrate dehydrogenase 2 (NADP+) (IDH2)",
                "2-oxoglutarate dehydrogenase E1 component (OGDH-E1)",
                "2-oxoglutarate dehydrogenase E2 component (OGDH-E2)",
                "2-oxoglutarate dehydrogenase E3 component (OGDH-E3)",
                "dihydrolipoyl transketolase (DLTK)",
                "oxoglutarate dehydrogenase complex component E1 (OGDC-E1)",
                "oxoglutarate dehydrogenase complex component E2 (OGDC-E2)",
                "oxoglutarate dehydrogenase complex component E3 (OGDC-E3)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-oxoglutarate dehydrogenase (OGDH)",
                "2-oxoglutarate dehydrogenase E1 component (OGDH-E1)",
                "2-oxoglutarate dehydrogenase E2 component (OGDH-E2)",
                "2-oxoglutarate dehydrogenase E3 component (OGDH-E3)",
                "aconitase (ACO2)",
                "aconitase 1 (ACO1)",
                "aconitate hydratase (AH)",
                "alpha-ketoglutarate dehydrogenase kinase (MAT1A)",
                "citrate (Si)-synthase (CITRS)",
                "citrate synthase (CS)",
                "dihydrolipoyl dehydrogenase (DLD)",
                "dihydrolipoyl transketolase (DLTK)",
                "dihydrolipoyl transsuccinylase (DLST)",
                "isocitrate dehydrogenase (IDH)",
                "isocitrate dehydrogenase 1 (NADP+) (IDH1)",
                "isocitrate dehydrogenase 2 (NADP+) (IDH2)",
                "isocitrate dehydrogenase 3 (NAD+) (IDH3)",
                "oxoglutarate dehydrogenase complex (OGDC)",
                "oxoglutarate dehydrogenase complex component E1 (OGDC-E1)",
                "oxoglutarate dehydrogenase complex component E2 (OGDC-E2)",
                "oxoglutarate dehydrogenase complex component E3 (OGDC-E3)",
                "oxoglutarate dehydrogenase inhibitor (OGDI)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "TCA cycle enzyme",
        "domain": "biology",
        "response": [
            {
                "Referent": "Aconitase",
                "Canonical Name": "ACO2"
            },
            {
                "Referent": "Isocitrate dehydrogenase",
                "Canonical Name": "IDH1"
            },
            {
                "Referent": "Alpha-ketoglutarate dehydrogenase",
                "Canonical Name": "OGDH"
            },
            {
                "Referent": "Succinyl-CoA synthetase",
                "Canonical Name": "SUCLG1"
            },
            {
                "Referent": "Fumarase",
                "Canonical Name": "FH"
            },
            {
                "Referent": "Malate dehydrogenase",
                "Canonical Name": "MDH1"
            },
            {
                "Referent": "Citrate synthase",
                "Canonical Name": "CS"
            },
            {
                "Referent": "Isocitrate lyase",
                "Canonical Name": "ICL1"
            },
            {
                "Referent": "Succinate dehydrogenase",
                "Canonical Name": "SDH"
            },
            {
                "Referent": "Dihydrolipoamide dehydrogenase",
                "Canonical Name": "DLD"
            },
            {
                "Referent": "Succinyl-CoA ligase",
                "Canonical Name": "SUCLG2"
            },
            {
                "Referent": "2-oxoglutarate dehydrogenase",
                "Canonical Name": "OGDH2"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit A",
                "Canonical Name": "SDHA"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit B",
                "Canonical Name": "SDHB"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit C",
                "Canonical Name": "SDHC"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit D",
                "Canonical Name": "SDHD"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit E",
                "Canonical Name": "SDHE"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit F",
                "Canonical Name": "SDHF"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit G",
                "Canonical Name": "SDHG"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit H",
                "Canonical Name": "SDHH"
            },
            {
                "Referent": "Succinate dehydrogenase complex, subunit I",
                "Canonical Name": "SDHI"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aconitase",
                "Isocitrate dehydrogenase",
                "Alpha-ketoglutarate dehydrogenase",
                "Succinyl-CoA synthetase",
                "Fumarase",
                "Malate dehydrogenase",
                "Citrate synthase",
                "Isocitrate lyase",
                "Succinate dehydrogenase",
                "Dihydrolipoamide dehydrogenase",
                "Succinyl-CoA ligase",
                "2-oxoglutarate dehydrogenase",
                "Succinate dehydrogenase complex, subunit A",
                "Succinate dehydrogenase complex, subunit B",
                "Succinate dehydrogenase complex, subunit C",
                "Succinate dehydrogenase complex, subunit D",
                "Succinate dehydrogenase complex, subunit E",
                "Succinate dehydrogenase complex, subunit F",
                "Succinate dehydrogenase complex, subunit G",
                "Succinate dehydrogenase complex, subunit H",
                "Succinate dehydrogenase complex, subunit I"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"2-oxoglutarate dehydrogenase\", \"Canonical Name\": \"OGDH2\"}",
                "{\"Referent\": \"Aconitase\", \"Canonical Name\": \"ACO2\"}",
                "{\"Referent\": \"Alpha-ketoglutarate dehydrogenase\", \"Canonical Name\": \"OGDH\"}",
                "{\"Referent\": \"Citrate synthase\", \"Canonical Name\": \"CS\"}",
                "{\"Referent\": \"Dihydrolipoamide dehydrogenase\", \"Canonical Name\": \"DLD\"}",
                "{\"Referent\": \"Fumarase\", \"Canonical Name\": \"FH\"}",
                "{\"Referent\": \"Isocitrate dehydrogenase\", \"Canonical Name\": \"IDH1\"}",
                "{\"Referent\": \"Isocitrate lyase\", \"Canonical Name\": \"ICL1\"}",
                "{\"Referent\": \"Malate dehydrogenase\", \"Canonical Name\": \"MDH1\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit A\", \"Canonical Name\": \"SDHA\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit B\", \"Canonical Name\": \"SDHB\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit C\", \"Canonical Name\": \"SDHC\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit D\", \"Canonical Name\": \"SDHD\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit E\", \"Canonical Name\": \"SDHE\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit F\", \"Canonical Name\": \"SDHF\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit G\", \"Canonical Name\": \"SDHG\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit H\", \"Canonical Name\": \"SDHH\"}",
                "{\"Referent\": \"Succinate dehydrogenase complex, subunit I\", \"Canonical Name\": \"SDHI\"}",
                "{\"Referent\": \"Succinate dehydrogenase\", \"Canonical Name\": \"SDH\"}",
                "{\"Referent\": \"Succinyl-CoA ligase\", \"Canonical Name\": \"SUCLG2\"}",
                "{\"Referent\": \"Succinyl-CoA synthetase\", \"Canonical Name\": \"SUCLG1\"}"
            ],
            "TP": 21,
            "FP": 0,
            "FN": 0
        }
    }
]