[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Glucokinase (GCK)",
            "Phosphoglycerate Kinase 1 (PGK1)",
            "Pyruvate Kinase (PKM)",
            "Phosphofructokinase 1 (PFK1)",
            "Phosphoglycerate Mutase 1 (PGAM1)",
            "Pyruvate Dehydrogenase E1 Subunit Alpha (PDHA1)",
            "Triosephosphate Isomerase 1 (TPI1)",
            "Aldolase A (ALDOA)",
            "Enolase 1 (ENO1)",
            "Phosphoglycerate Dehydrogenase (PHGDH)",
            "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
            "Lactate Dehydrogenase A (LDHA)",
            "Pyruvate Dehydrogenase Kinase 1 (PDK1)",
            "Pyruvate Dehydrogenase Kinase 4 (PDK4)",
            "Pyruvate Dehydrogenase E1 Subunit Beta (PDHB)",
            "Pyruvate Dehydrogenase E1-Activating Kinase 1 (PDK2)",
            "Pyruvate Dehydrogenase Phosphatase Catalytic Subunit 1 (PDP1)",
            "Pyruvate Dehydrogenase Phosphatase Catalytic Subunit 2 (PDP2)",
            "Pyruvate Dehydrogenase E1-Activating Kinase 3 (PDK3)",
            "Pyruvate Dehydrogenase E1-Activating Kinase 4 (PDK4)",
            "Phosphoglycerate Dehydrogenase (PHGDH)",
            "Pyruvate Kinase M2 (PKM2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Glucokinase (GCK)",
                "Phosphoglycerate Kinase 1 (PGK1)",
                "Pyruvate Kinase (PKM)",
                "Phosphofructokinase 1 (PFK1)",
                "Phosphoglycerate Mutase 1 (PGAM1)",
                "Pyruvate Dehydrogenase E1 Subunit Alpha (PDHA1)",
                "Triosephosphate Isomerase 1 (TPI1)",
                "Aldolase A (ALDOA)",
                "Enolase 1 (ENO1)",
                "Phosphoglycerate Dehydrogenase (PHGDH)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Lactate Dehydrogenase A (LDHA)",
                "Pyruvate Dehydrogenase Kinase 1 (PDK1)",
                "Pyruvate Dehydrogenase Kinase 4 (PDK4)",
                "Pyruvate Dehydrogenase E1 Subunit Beta (PDHB)",
                "Pyruvate Dehydrogenase E1-Activating Kinase 1 (PDK2)",
                "Pyruvate Dehydrogenase Phosphatase Catalytic Subunit 1 (PDP1)",
                "Pyruvate Dehydrogenase Phosphatase Catalytic Subunit 2 (PDP2)",
                "Pyruvate Dehydrogenase E1-Activating Kinase 3 (PDK3)",
                "Pyruvate Dehydrogenase E1-Activating Kinase 4 (PDK4)",
                "Pyruvate Kinase M2 (PKM2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Enolase 1 (ENO1)",
                "Glucokinase (GCK)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Lactate Dehydrogenase A (LDHA)",
                "Phosphofructokinase 1 (PFK1)",
                "Phosphoglycerate Dehydrogenase (PHGDH)",
                "Phosphoglycerate Kinase 1 (PGK1)",
                "Phosphoglycerate Mutase 1 (PGAM1)",
                "Pyruvate Dehydrogenase E1 Subunit Alpha (PDHA1)",
                "Pyruvate Dehydrogenase E1 Subunit Beta (PDHB)",
                "Pyruvate Dehydrogenase E1-Activating Kinase 1 (PDK2)",
                "Pyruvate Dehydrogenase E1-Activating Kinase 3 (PDK3)",
                "Pyruvate Dehydrogenase E1-Activating Kinase 4 (PDK4)",
                "Pyruvate Dehydrogenase Kinase 1 (PDK1)",
                "Pyruvate Dehydrogenase Kinase 4 (PDK4)",
                "Pyruvate Dehydrogenase Phosphatase Catalytic Subunit 1 (PDP1)",
                "Pyruvate Dehydrogenase Phosphatase Catalytic Subunit 2 (PDP2)",
                "Pyruvate Kinase (PKM)",
                "Pyruvate Kinase M2 (PKM2)",
                "Triosephosphate Isomerase 1 (TPI1)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Glucokinase (GCK)",
            "Phosphoglucose isomerase (PGI)",
            "Phosphofructokinase-1 (PFK1)",
            "Fructose-bisphosphate aldolase A (ALDOA)",
            "Triosephosphate isomerase (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Enolase 1 (ENO1)",
            "Lactate dehydrogenase A (LDHA)",
            "Lactate dehydrogenase B (LDHB)",
            "Pyruvate kinase muscle isozyme (PKM)",
            "Pyruvate kinase liver and red cell (PKLR)",
            "Pyruvate kinase M2 (PKM2)",
            "Pyruvate kinase R (PKLR)",
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "Phosphoglucomutase 1 (PGM1)",
            "Phosphoglucomutase 3 (PGM3)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Enolase 2 (ENO2)",
            "Glycogen synthase (GYS1)",
            "Phosphoglycerate kinase 2 (PGK2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Glucokinase (GCK)",
                "Phosphoglucose isomerase (PGI)",
                "Phosphofructokinase-1 (PFK1)",
                "Fructose-bisphosphate aldolase A (ALDOA)",
                "Triosephosphate isomerase (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Enolase 1 (ENO1)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Pyruvate kinase muscle isozyme (PKM)",
                "Pyruvate kinase liver and red cell (PKLR)",
                "Pyruvate kinase M2 (PKM2)",
                "Pyruvate kinase R (PKLR)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Phosphoglucomutase 1 (PGM1)",
                "Phosphoglucomutase 3 (PGM3)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Enolase 2 (ENO2)",
                "Glycogen synthase (GYS1)",
                "Phosphoglycerate kinase 2 (PGK2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Fructose-bisphosphate aldolase A (ALDOA)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Glycogen synthase (GYS1)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Phosphofructokinase-1 (PFK1)",
                "Phosphoglucomutase 1 (PGM1)",
                "Phosphoglucomutase 3 (PGM3)",
                "Phosphoglucose isomerase (PGI)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate kinase M2 (PKM2)",
                "Pyruvate kinase R (PKLR)",
                "Pyruvate kinase liver and red cell (PKLR)",
                "Pyruvate kinase muscle isozyme (PKM)",
                "Triosephosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Glucokinase (GCK)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Phosphofructokinase 1 (PFKL)",
            "Aldolase A (ALDOA)",
            "Triose phosphate isomerase (TPI1)",
            "Glyceraldehyde 3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Enolase 1 (ENO1)",
            "Pyruvate kinase M1/M2 (PKM)",
            "Lactate dehydrogenase A (LDHA)",
            "Lactate dehydrogenase B (LDHB)",
            "Pyruvate dehydrogenase E1 component subunit alpha 1 (PDHA1)",
            "Pyruvate dehydrogenase E1 component subunit beta (PDHB)",
            "Dihydrolipoamide S-succinyltransferase (DLST)",
            "Dihydrolipoamide dehydrogenase (DLD)",
            "Pyruvate dehydrogenase kinase 1 (PDK1)",
            "Pyruvate dehydrogenase kinase 2 (PDK2)",
            "Pyruvate dehydrogenase kinase 3 (PDK3)",
            "Pyruvate dehydrogenase kinase 4 (PDK4)",
            "Phosphoenolpyruvate carboxykinase 1 (PCK1)",
            "Phosphoenolpyruvate carboxykinase 2 (PCK2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Phosphofructokinase 1 (PFKL)",
                "Aldolase A (ALDOA)",
                "Triose phosphate isomerase (TPI1)",
                "Glyceraldehyde 3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Enolase 1 (ENO1)",
                "Pyruvate kinase M1/M2 (PKM)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Pyruvate dehydrogenase E1 component subunit alpha 1 (PDHA1)",
                "Pyruvate dehydrogenase E1 component subunit beta (PDHB)",
                "Dihydrolipoamide S-succinyltransferase (DLST)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Pyruvate dehydrogenase kinase 1 (PDK1)",
                "Pyruvate dehydrogenase kinase 2 (PDK2)",
                "Pyruvate dehydrogenase kinase 3 (PDK3)",
                "Pyruvate dehydrogenase kinase 4 (PDK4)",
                "Phosphoenolpyruvate carboxykinase 1 (PCK1)",
                "Phosphoenolpyruvate carboxykinase 2 (PCK2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Dihydrolipoamide S-succinyltransferase (DLST)",
                "Dihydrolipoamide dehydrogenase (DLD)",
                "Enolase 1 (ENO1)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glyceraldehyde 3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Phosphoenolpyruvate carboxykinase 1 (PCK1)",
                "Phosphoenolpyruvate carboxykinase 2 (PCK2)",
                "Phosphofructokinase 1 (PFKL)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Pyruvate dehydrogenase E1 component subunit alpha 1 (PDHA1)",
                "Pyruvate dehydrogenase E1 component subunit beta (PDHB)",
                "Pyruvate dehydrogenase kinase 1 (PDK1)",
                "Pyruvate dehydrogenase kinase 2 (PDK2)",
                "Pyruvate dehydrogenase kinase 3 (PDK3)",
                "Pyruvate dehydrogenase kinase 4 (PDK4)",
                "Pyruvate kinase M1/M2 (PKM)",
                "Triose phosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase (HK)",
            "Glucose-6-Phosphate Isomerase (GPI)",
            "Phosphofructokinase-1 (PFK1)",
            "Aldolase (ALDOA)",
            "Triose Phosphate Isomerase (TPI1)",
            "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
            "Phosphoglycerate Kinase 1 (PGK1)",
            "Phosphoglycerate Mutase (PGM1)",
            "Enolase (ENO1)",
            "Pyruvate Kinase M2 (PKM2)",
            "Pyruvate Kinase L (PKLR)",
            "Fructose-1,6-Bisphosphatase (FBP1)",
            "Phosphofructokinase-2/Fructose-2,6-Bisphosphatase 3 (PFKFB3)",
            "Aldolase B (ALDOB)",
            "Pyruvate Dehydrogenase Kinase 1 (PDK1)",
            "Lactate Dehydrogenase A (LDHA)",
            "Hexokinase 2 (HK2)",
            "Phosphoglycerate Mutase 2 (PGM2)",
            "Enolase 3 (ENO3)",
            "Triosephosphate Dehydrogenase (GAPDHS)",
            "Pyruvate Kinase M1 (PKM1)",
            "Glucose Transporter 1 (GLUT1)",
            "Phosphofructokinase-1 catalytic subunit (PFK-C)",
            "6-Phosphofructo-2-Kinase (PFK2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase (HK)",
                "Glucose-6-Phosphate Isomerase (GPI)",
                "Phosphofructokinase-1 (PFK1)",
                "Aldolase (ALDOA)",
                "Triose Phosphate Isomerase (TPI1)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Phosphoglycerate Kinase 1 (PGK1)",
                "Phosphoglycerate Mutase (PGM1)",
                "Enolase (ENO1)",
                "Pyruvate Kinase M2 (PKM2)",
                "Pyruvate Kinase L (PKLR)",
                "Fructose-1,6-Bisphosphatase (FBP1)",
                "Phosphofructokinase-2/Fructose-2,6-Bisphosphatase 3 (PFKFB3)",
                "Aldolase B (ALDOB)",
                "Pyruvate Dehydrogenase Kinase 1 (PDK1)",
                "Lactate Dehydrogenase A (LDHA)",
                "Hexokinase 2 (HK2)",
                "Phosphoglycerate Mutase 2 (PGM2)",
                "Enolase 3 (ENO3)",
                "Triosephosphate Dehydrogenase (GAPDHS)",
                "Pyruvate Kinase M1 (PKM1)",
                "Glucose Transporter 1 (GLUT1)",
                "Phosphofructokinase-1 catalytic subunit (PFK-C)",
                "6-Phosphofructo-2-Kinase (PFK2)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphofructo-2-Kinase (PFK2)",
                "Aldolase (ALDOA)",
                "Aldolase B (ALDOB)",
                "Enolase (ENO1)",
                "Enolase 3 (ENO3)",
                "Fructose-1,6-Bisphosphatase (FBP1)",
                "Glucose Transporter 1 (GLUT1)",
                "Glucose-6-Phosphate Isomerase (GPI)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Hexokinase (HK)",
                "Hexokinase 2 (HK2)",
                "Lactate Dehydrogenase A (LDHA)",
                "Phosphofructokinase-1 (PFK1)",
                "Phosphofructokinase-1 catalytic subunit (PFK-C)",
                "Phosphofructokinase-2/Fructose-2,6-Bisphosphatase 3 (PFKFB3)",
                "Phosphoglycerate Kinase 1 (PGK1)",
                "Phosphoglycerate Mutase (PGM1)",
                "Phosphoglycerate Mutase 2 (PGM2)",
                "Pyruvate Dehydrogenase Kinase 1 (PDK1)",
                "Pyruvate Kinase L (PKLR)",
                "Pyruvate Kinase M1 (PKM1)",
                "Pyruvate Kinase M2 (PKM2)",
                "Triose Phosphate Isomerase (TPI1)",
                "Triosephosphate Dehydrogenase (GAPDHS)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Hexokinase 3 (HK3)",
            "Hexokinase 4 (HK4 or GCK)",
            "Glucokinase (GCK)",
            "Phosphoglucose isomerase (GPI)",
            "Phosphofructokinase, liver type (PFKL)",
            "Phosphofructokinase, muscle type (PFKM)",
            "Phosphofructokinase, platelet (PFKP)",
            "Aldolase A (ALDOA)",
            "Aldolase B (ALDOB)",
            "Aldolase C (ALDOC)",
            "Triosephosphate isomerase 1 (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate kinase 2 (PGK2)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Enolase 1 (ENO1)",
            "Enolase 2 (ENO2)",
            "Enolase 3 (ENO3)",
            "Pyruvate kinase, liver and red blood cell (PKLR)",
            "Pyruvate kinase, muscle (PKM)",
            "Lactate dehydrogenase A (LDHA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Hexokinase 4 (HK4 or GCK)",
                "Glucokinase (GCK)",
                "Phosphoglucose isomerase (GPI)",
                "Phosphofructokinase, liver type (PFKL)",
                "Phosphofructokinase, muscle type (PFKM)",
                "Phosphofructokinase, platelet (PFKP)",
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Triosephosphate isomerase 1 (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Pyruvate kinase, liver and red blood cell (PKLR)",
                "Pyruvate kinase, muscle (PKM)",
                "Lactate dehydrogenase A (LDHA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Glucokinase (GCK)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Hexokinase 4 (HK4 or GCK)",
                "Lactate dehydrogenase A (LDHA)",
                "Phosphofructokinase, liver type (PFKL)",
                "Phosphofructokinase, muscle type (PFKM)",
                "Phosphofructokinase, platelet (PFKP)",
                "Phosphoglucose isomerase (GPI)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate kinase, liver and red blood cell (PKLR)",
                "Pyruvate kinase, muscle (PKM)",
                "Triosephosphate isomerase 1 (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Phosphofructokinase 1 (PFK1)",
            "Phosphofructokinase 2 (PFKFB1)",
            "Aldolase A (ALDOA)",
            "Aldolase B (ALDOB)",
            "Triosephosphate isomerase (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase (PGK1)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Enolase 1 (ENO1)",
            "Pyruvate kinase M1/2 (PKM)",
            "Lactate dehydrogenase A (LDHA)",
            "Lactate dehydrogenase B (LDHB)",
            "Glucose transporter type 1 (GLUT1)",
            "Glucose transporter type 4 (GLUT4)",
            "Fructose-bisphosphate aldolase (ALDOA)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Glycerol-3-phosphate dehydrogenase (GPD1)",
            "Dihydroxyacetone phosphate acyltransferase (DHAPAT)",
            "Pyruvate dehydrogenase (PDH)",
            "Pyruvate dehydrogenase kinase (PDK1)",
            "Pyruvate carboxylase (PC)",
            "Fructose-1,6-bisphosphatase (FBP1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Phosphofructokinase 1 (PFK1)",
                "Phosphofructokinase 2 (PFKFB1)",
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Triosephosphate isomerase (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase (PGK1)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Enolase 1 (ENO1)",
                "Pyruvate kinase M1/2 (PKM)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Glucose transporter type 1 (GLUT1)",
                "Glucose transporter type 4 (GLUT4)",
                "Fructose-bisphosphate aldolase (ALDOA)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Glycerol-3-phosphate dehydrogenase (GPD1)",
                "Dihydroxyacetone phosphate acyltransferase (DHAPAT)",
                "Pyruvate dehydrogenase (PDH)",
                "Pyruvate dehydrogenase kinase (PDK1)",
                "Pyruvate carboxylase (PC)",
                "Fructose-1,6-bisphosphatase (FBP1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Dihydroxyacetone phosphate acyltransferase (DHAPAT)",
                "Enolase 1 (ENO1)",
                "Fructose-1,6-bisphosphatase (FBP1)",
                "Fructose-bisphosphate aldolase (ALDOA)",
                "Glucose transporter type 1 (GLUT1)",
                "Glucose transporter type 4 (GLUT4)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Glycerol-3-phosphate dehydrogenase (GPD1)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Phosphofructokinase 1 (PFK1)",
                "Phosphofructokinase 2 (PFKFB1)",
                "Phosphoglycerate kinase (PGK1)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate carboxylase (PC)",
                "Pyruvate dehydrogenase (PDH)",
                "Pyruvate dehydrogenase kinase (PDK1)",
                "Pyruvate kinase M1/2 (PKM)",
                "Triosephosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Hexokinase 3 (HK3)",
            "Glucokinase (GCK)",
            "Glucose-6-Phosphate Isomerase (GPI)",
            "Phosphofructokinase, Liver Type (PFKL)",
            "Phosphofructokinase, Muscle Type (PFKM)",
            "Phosphofructokinase, Platelet Type (PFKP)",
            "Fructose-Bisphosphate Aldolase A (ALDOA)",
            "Fructose-Bisphosphate Aldolase B (ALDOB)",
            "Fructose-Bisphosphate Aldolase C (ALDOC)",
            "Triosephosphate Isomerase 1 (TPI1)",
            "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
            "Phosphoglycerate Kinase 1 (PGK1)",
            "Phosphoglycerate Mutase 1 (PGAM1)",
            "Phosphoglycerate Mutase 2 (PGAM2)",
            "Enolase 1, Alpha Non-Neuron (ENO1)",
            "Enolase 2, Gamma Neuron-Specific (ENO2)",
            "Enolase 3, Beta Muscle-Specific (ENO3)",
            "Pyruvate Kinase, Liver and RBC (PKLR)",
            "Pyruvate Kinase, Muscle (PKM)",
            "Lactate Dehydrogenase A (LDHA)",
            "Lactate Dehydrogenase B (LDHB)",
            "Lactate Dehydrogenase C (LDHC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Glucokinase (GCK)",
                "Glucose-6-Phosphate Isomerase (GPI)",
                "Phosphofructokinase, Liver Type (PFKL)",
                "Phosphofructokinase, Muscle Type (PFKM)",
                "Phosphofructokinase, Platelet Type (PFKP)",
                "Fructose-Bisphosphate Aldolase A (ALDOA)",
                "Fructose-Bisphosphate Aldolase B (ALDOB)",
                "Fructose-Bisphosphate Aldolase C (ALDOC)",
                "Triosephosphate Isomerase 1 (TPI1)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Phosphoglycerate Kinase 1 (PGK1)",
                "Phosphoglycerate Mutase 1 (PGAM1)",
                "Phosphoglycerate Mutase 2 (PGAM2)",
                "Enolase 1, Alpha Non-Neuron (ENO1)",
                "Enolase 2, Gamma Neuron-Specific (ENO2)",
                "Enolase 3, Beta Muscle-Specific (ENO3)",
                "Pyruvate Kinase, Liver and RBC (PKLR)",
                "Pyruvate Kinase, Muscle (PKM)",
                "Lactate Dehydrogenase A (LDHA)",
                "Lactate Dehydrogenase B (LDHB)",
                "Lactate Dehydrogenase C (LDHC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Enolase 1, Alpha Non-Neuron (ENO1)",
                "Enolase 2, Gamma Neuron-Specific (ENO2)",
                "Enolase 3, Beta Muscle-Specific (ENO3)",
                "Fructose-Bisphosphate Aldolase A (ALDOA)",
                "Fructose-Bisphosphate Aldolase B (ALDOB)",
                "Fructose-Bisphosphate Aldolase C (ALDOC)",
                "Glucokinase (GCK)",
                "Glucose-6-Phosphate Isomerase (GPI)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Lactate Dehydrogenase A (LDHA)",
                "Lactate Dehydrogenase B (LDHB)",
                "Lactate Dehydrogenase C (LDHC)",
                "Phosphofructokinase, Liver Type (PFKL)",
                "Phosphofructokinase, Muscle Type (PFKM)",
                "Phosphofructokinase, Platelet Type (PFKP)",
                "Phosphoglycerate Kinase 1 (PGK1)",
                "Phosphoglycerate Mutase 1 (PGAM1)",
                "Phosphoglycerate Mutase 2 (PGAM2)",
                "Pyruvate Kinase, Liver and RBC (PKLR)",
                "Pyruvate Kinase, Muscle (PKM)",
                "Triosephosphate Isomerase 1 (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase (HK)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Phosphofructokinase (PFK)",
            "Fructose-bisphosphate aldolase (ALDO)",
            "Triosephosphate isomerase (TPI)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase (PGK)",
            "Phosphoglycerate mutase (PGM)",
            "Enolase (ENO)",
            "Pyruvate kinase (PK)",
            "Pyruvate dehydrogenase (PDH)",
            "Lactate dehydrogenase (LDH)",
            "Pyruvate carboxylase (PC)",
            "Phosphoenolpyruvate carboxykinase (PEPCK)",
            "Fructose-1,6-bisphosphatase (FBP)",
            "Glucose-6-phosphatase (G6Pase)",
            "Phosphoglucomutase (PGM)",
            "Glucokinase (GCK)",
            "Pyruvate dehydrogenase kinase (PDK)",
            "Pyruvate dehydrogenase phosphatase (PDP)",
            "Phosphoenolpyruvate synthase (PEPS)",
            "Fructose-2,6-bisphosphatase (F2,6BPase)",
            "Phosphoglycerate dehydrogenase (PGDH)",
            "Phosphoglycerate phosphatase (PGP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase (HK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Phosphofructokinase (PFK)",
                "Fructose-bisphosphate aldolase (ALDO)",
                "Triosephosphate isomerase (TPI)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase (PGK)",
                "Phosphoglycerate mutase (PGM)",
                "Enolase (ENO)",
                "Pyruvate kinase (PK)",
                "Pyruvate dehydrogenase (PDH)",
                "Lactate dehydrogenase (LDH)",
                "Pyruvate carboxylase (PC)",
                "Phosphoenolpyruvate carboxykinase (PEPCK)",
                "Fructose-1,6-bisphosphatase (FBP)",
                "Glucose-6-phosphatase (G6Pase)",
                "Phosphoglucomutase (PGM)",
                "Glucokinase (GCK)",
                "Pyruvate dehydrogenase kinase (PDK)",
                "Pyruvate dehydrogenase phosphatase (PDP)",
                "Phosphoenolpyruvate synthase (PEPS)",
                "Fructose-2,6-bisphosphatase (F2,6BPase)",
                "Phosphoglycerate dehydrogenase (PGDH)",
                "Phosphoglycerate phosphatase (PGP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Enolase (ENO)",
                "Fructose-1,6-bisphosphatase (FBP)",
                "Fructose-2,6-bisphosphatase (F2,6BPase)",
                "Fructose-bisphosphate aldolase (ALDO)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphatase (G6Pase)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase (HK)",
                "Lactate dehydrogenase (LDH)",
                "Phosphoenolpyruvate carboxykinase (PEPCK)",
                "Phosphoenolpyruvate synthase (PEPS)",
                "Phosphofructokinase (PFK)",
                "Phosphoglucomutase (PGM)",
                "Phosphoglycerate dehydrogenase (PGDH)",
                "Phosphoglycerate kinase (PGK)",
                "Phosphoglycerate mutase (PGM)",
                "Phosphoglycerate phosphatase (PGP)",
                "Pyruvate carboxylase (PC)",
                "Pyruvate dehydrogenase (PDH)",
                "Pyruvate dehydrogenase kinase (PDK)",
                "Pyruvate dehydrogenase phosphatase (PDP)",
                "Pyruvate kinase (PK)",
                "Triosephosphate isomerase (TPI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Hexokinase 3 (HK3)",
            "Glucokinase (GCK)",
            "Phosphoglucose isomerase (PGI)",
            "Phosphofructokinase, liver type (PFKL)",
            "Phosphofructokinase, muscle type (PFKM)",
            "Phosphofructokinase, platelet type (PFKP)",
            "Aldolase A (ALDOA)",
            "Aldolase B (ALDOB)",
            "Aldolase C (ALDOC)",
            "Triose phosphate isomerase (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate kinase 2 (PGK2)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Enolase 1 (ENO1)",
            "Enolase 2 (ENO2)",
            "Enolase 3 (ENO3)",
            "Pyruvate kinase M (PKM)",
            "Pyruvate kinase L/R (PKLR)",
            "Pyruvate kinase muscle type (PKM2)",
            "Pyruvate dehydrogenase kinase 1 (PDK1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Glucokinase (GCK)",
                "Phosphoglucose isomerase (PGI)",
                "Phosphofructokinase, liver type (PFKL)",
                "Phosphofructokinase, muscle type (PFKM)",
                "Phosphofructokinase, platelet type (PFKP)",
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Triose phosphate isomerase (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Pyruvate kinase M (PKM)",
                "Pyruvate kinase L/R (PKLR)",
                "Pyruvate kinase muscle type (PKM2)",
                "Pyruvate dehydrogenase kinase 1 (PDK1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Glucokinase (GCK)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Phosphofructokinase, liver type (PFKL)",
                "Phosphofructokinase, muscle type (PFKM)",
                "Phosphofructokinase, platelet type (PFKP)",
                "Phosphoglucose isomerase (PGI)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate dehydrogenase kinase 1 (PDK1)",
                "Pyruvate kinase L/R (PKLR)",
                "Pyruvate kinase M (PKM)",
                "Pyruvate kinase muscle type (PKM2)",
                "Triose phosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase (HK)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Phosphofructokinase (PFK)",
            "Aldolase (ALDOA)",
            "Triosephosphate isomerase (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase (PGK)",
            "Phosphoglycerate mutase (PGAM)",
            "Enolase (ENO)",
            "Pyruvate kinase (PK)",
            "Glucose transporter 1 (GLUT1)",
            "Glucose transporter 4 (GLUT4)",
            "Fructose-2,6-bisphosphatase (PFKFB)",
            "Lactate dehydrogenase (LDH)",
            "Glucokinase (GCK)",
            "Phosphofructokinase-2 (PFKFB2)",
            "6-Phosphofructo-2-kinase/fructose-2,6-bisphosphatase 3 (PFKFB3)",
            "Pyruvate dehydrogenase kinase (PDK)",
            "Phosphoenolpyruvate carboxykinase (PCK)",
            "Fructose-1,6-bisphosphatase (FBP)",
            "Glucose-6-phosphatase (G6PC)",
            "Aldolase B (ALDOB)",
            "Aldolase C (ALDOC)",
            "Phosphoglucomutase (PGM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase (HK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Phosphofructokinase (PFK)",
                "Aldolase (ALDOA)",
                "Triosephosphate isomerase (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase (PGK)",
                "Phosphoglycerate mutase (PGAM)",
                "Enolase (ENO)",
                "Pyruvate kinase (PK)",
                "Glucose transporter 1 (GLUT1)",
                "Glucose transporter 4 (GLUT4)",
                "Fructose-2,6-bisphosphatase (PFKFB)",
                "Lactate dehydrogenase (LDH)",
                "Glucokinase (GCK)",
                "Phosphofructokinase-2 (PFKFB2)",
                "6-Phosphofructo-2-kinase/fructose-2,6-bisphosphatase 3 (PFKFB3)",
                "Pyruvate dehydrogenase kinase (PDK)",
                "Phosphoenolpyruvate carboxykinase (PCK)",
                "Fructose-1,6-bisphosphatase (FBP)",
                "Glucose-6-phosphatase (G6PC)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Phosphoglucomutase (PGM)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphofructo-2-kinase/fructose-2,6-bisphosphatase 3 (PFKFB3)",
                "Aldolase (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Enolase (ENO)",
                "Fructose-1,6-bisphosphatase (FBP)",
                "Fructose-2,6-bisphosphatase (PFKFB)",
                "Glucokinase (GCK)",
                "Glucose transporter 1 (GLUT1)",
                "Glucose transporter 4 (GLUT4)",
                "Glucose-6-phosphatase (G6PC)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase (HK)",
                "Lactate dehydrogenase (LDH)",
                "Phosphoenolpyruvate carboxykinase (PCK)",
                "Phosphofructokinase (PFK)",
                "Phosphofructokinase-2 (PFKFB2)",
                "Phosphoglucomutase (PGM)",
                "Phosphoglycerate kinase (PGK)",
                "Phosphoglycerate mutase (PGAM)",
                "Pyruvate dehydrogenase kinase (PDK)",
                "Pyruvate kinase (PK)",
                "Triosephosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Hexokinase 3 (HK3)",
            "Glucokinase (GCK)",
            "Glucose-6-phosphate isomerase (GPI)",
            "6-phosphofructokinase, liver type (PFKL)",
            "6-phosphofructokinase, muscle type (PFKM)",
            "6-phosphofructokinase, platelet type (PFKP)",
            "Fructose-bisphosphate aldolase A (ALDOA)",
            "Fructose-bisphosphate aldolase B (ALDOB)",
            "Fructose-bisphosphate aldolase C (ALDOC)",
            "Triosephosphate isomerase (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate kinase 2 (PGK2)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Enolase 1 (ENO1)",
            "Enolase 2 (ENO2)",
            "Enolase 3 (ENO3)",
            "Pyruvate kinase L/R (PKLR)",
            "Pyruvate kinase M1/2 (PKM)",
            "Lactate dehydrogenase A (LDHA)",
            "Lactate dehydrogenase B (LDHB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "6-phosphofructokinase, liver type (PFKL)",
                "6-phosphofructokinase, muscle type (PFKM)",
                "6-phosphofructokinase, platelet type (PFKP)",
                "Fructose-bisphosphate aldolase A (ALDOA)",
                "Fructose-bisphosphate aldolase B (ALDOB)",
                "Fructose-bisphosphate aldolase C (ALDOC)",
                "Triosephosphate isomerase (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Pyruvate kinase L/R (PKLR)",
                "Pyruvate kinase M1/2 (PKM)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphofructokinase, liver type (PFKL)",
                "6-phosphofructokinase, muscle type (PFKM)",
                "6-phosphofructokinase, platelet type (PFKP)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Fructose-bisphosphate aldolase A (ALDOA)",
                "Fructose-bisphosphate aldolase B (ALDOB)",
                "Fructose-bisphosphate aldolase C (ALDOC)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate kinase L/R (PKLR)",
                "Pyruvate kinase M1/2 (PKM)",
                "Triosephosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Phosphofructokinase 1 (PFK1)",
            "Aldolase A (ALDOA)",
            "Triose phosphate isomerase (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Enolase 1 (ENO1)",
            "Pyruvate kinase M1/2 (PKM)",
            "Lactate dehydrogenase A (LDHA)",
            "Hexokinase 3 (HK3)",
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "Phosphofructokinase, platelet (PFKP)",
            "Aldolase B (ALDOB)",
            "Glyceraldehyde-3-phosphate dehydrogenase, testis-specific (GAPDS)",
            "Phosphoglycerate kinase 2 (PGK2)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Enolase 2 (ENO2)",
            "Pyruvate kinase L/R (PKLR)",
            "Lactate dehydrogenase B (LDHB)",
            "Hexokinase 4 (HK4)",
            "Phosphofructokinase, muscle (PFKM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Phosphofructokinase 1 (PFK1)",
                "Aldolase A (ALDOA)",
                "Triose phosphate isomerase (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Enolase 1 (ENO1)",
                "Pyruvate kinase M1/2 (PKM)",
                "Lactate dehydrogenase A (LDHA)",
                "Hexokinase 3 (HK3)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Phosphofructokinase, platelet (PFKP)",
                "Aldolase B (ALDOB)",
                "Glyceraldehyde-3-phosphate dehydrogenase, testis-specific (GAPDS)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Enolase 2 (ENO2)",
                "Pyruvate kinase L/R (PKLR)",
                "Lactate dehydrogenase B (LDHB)",
                "Hexokinase 4 (HK4)",
                "Phosphofructokinase, muscle (PFKM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Glyceraldehyde-3-phosphate dehydrogenase, testis-specific (GAPDS)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Hexokinase 3 (HK3)",
                "Hexokinase 4 (HK4)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Phosphofructokinase 1 (PFK1)",
                "Phosphofructokinase, muscle (PFKM)",
                "Phosphofructokinase, platelet (PFKP)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate kinase L/R (PKLR)",
                "Pyruvate kinase M1/2 (PKM)",
                "Triose phosphate isomerase (TPI1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase (HK)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Phosphofructokinase (PFK)",
            "Aldolase (ALDO)",
            "Triosephosphate isomerase (TPI)",
            "Glyceraldehyde 3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase (PGK)",
            "Phosphoglycerate mutase (PGAM)",
            "Enolase (ENO)",
            "Pyruvate kinase (PK)",
            "Lactate dehydrogenase (LDH)",
            "Glucose transporter (GLUT)",
            "Pyruvate dehydrogenase (PDH)",
            "Citrate synthase (CS)",
            "Aconitase (ACO)",
            "Isocitrate dehydrogenase (IDH)",
            "Alpha-ketoglutarate dehydrogenase (KGDH)",
            "Succinyl-CoA synthetase (SCS)",
            "Succinate dehydrogenase (SDH)",
            "Fumarase (FH)",
            "Malate dehydrogenase (MDH)",
            "Pyruvate carboxylase (PC)",
            "Fructose-1,6-bisphosphatase (FBP)",
            "Glucose-6-phosphatase (G6PC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase (HK)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Phosphofructokinase (PFK)",
                "Aldolase (ALDO)",
                "Triosephosphate isomerase (TPI)",
                "Glyceraldehyde 3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase (PGK)",
                "Phosphoglycerate mutase (PGAM)",
                "Enolase (ENO)",
                "Pyruvate kinase (PK)",
                "Lactate dehydrogenase (LDH)",
                "Glucose transporter (GLUT)",
                "Pyruvate dehydrogenase (PDH)",
                "Citrate synthase (CS)",
                "Aconitase (ACO)",
                "Isocitrate dehydrogenase (IDH)",
                "Alpha-ketoglutarate dehydrogenase (KGDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Succinate dehydrogenase (SDH)",
                "Fumarase (FH)",
                "Malate dehydrogenase (MDH)",
                "Pyruvate carboxylase (PC)",
                "Fructose-1,6-bisphosphatase (FBP)",
                "Glucose-6-phosphatase (G6PC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aconitase (ACO)",
                "Aldolase (ALDO)",
                "Alpha-ketoglutarate dehydrogenase (KGDH)",
                "Citrate synthase (CS)",
                "Enolase (ENO)",
                "Fructose-1,6-bisphosphatase (FBP)",
                "Fumarase (FH)",
                "Glucose transporter (GLUT)",
                "Glucose-6-phosphatase (G6PC)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glyceraldehyde 3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase (HK)",
                "Isocitrate dehydrogenase (IDH)",
                "Lactate dehydrogenase (LDH)",
                "Malate dehydrogenase (MDH)",
                "Phosphofructokinase (PFK)",
                "Phosphoglycerate kinase (PGK)",
                "Phosphoglycerate mutase (PGAM)",
                "Pyruvate carboxylase (PC)",
                "Pyruvate dehydrogenase (PDH)",
                "Pyruvate kinase (PK)",
                "Succinate dehydrogenase (SDH)",
                "Succinyl-CoA synthetase (SCS)",
                "Triosephosphate isomerase (TPI)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "GAPDH (Glyceraldehyde 3-phosphate dehydrogenase) (GAPDH)",
            "PFK1 (Phosphofructokinase 1)",
            "PFKM (Phosphofructokinase M)",
            "ALDOA (Fructose-bisphosphate aldolase A)",
            "ALDOB (Fructose-bisphosphate aldolase B)",
            "TPI1 (Triosephosphate isomerase 1)",
            "PGK1 (Phosphoglycerate kinase 1)",
            "PGM1 (Phosphoglycerate mutase 1)",
            "ENO1 (Enolase 1)",
            "PKM2 (Pyruvate kinase isozyme M2)",
            "PKLR (Pyruvate kinase, liver)",
            "LDHA (Lactate dehydrogenase A)",
            "LDHB (Lactate dehydrogenase B)",
            "LDHC (Lactate dehydrogenase C)",
            "PGAM1 (Phosphoglycerate mutase 1)",
            "PYGL (Glycogen phosphorylase, liver)",
            "PYGM (Glycogen phosphorylase, muscle)",
            "GCK (Glucokinase)",
            "HK1 (Hexokinase 1)",
            "HK2 (Hexokinase 2)",
            "HK3 (Hexokinase 3)",
            "HK4 (Hexokinase 4)",
            "HKDC1 (Hexokinase domain-containing protein 1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "GAPDH (Glyceraldehyde 3-phosphate dehydrogenase) (GAPDH)",
                "PFK1 (Phosphofructokinase 1)",
                "PFKM (Phosphofructokinase M)",
                "ALDOA (Fructose-bisphosphate aldolase A)",
                "ALDOB (Fructose-bisphosphate aldolase B)",
                "TPI1 (Triosephosphate isomerase 1)",
                "PGK1 (Phosphoglycerate kinase 1)",
                "PGM1 (Phosphoglycerate mutase 1)",
                "ENO1 (Enolase 1)",
                "PKM2 (Pyruvate kinase isozyme M2)",
                "PKLR (Pyruvate kinase, liver)",
                "LDHA (Lactate dehydrogenase A)",
                "LDHB (Lactate dehydrogenase B)",
                "LDHC (Lactate dehydrogenase C)",
                "PGAM1 (Phosphoglycerate mutase 1)",
                "PYGL (Glycogen phosphorylase, liver)",
                "PYGM (Glycogen phosphorylase, muscle)",
                "GCK (Glucokinase)",
                "HK1 (Hexokinase 1)",
                "HK2 (Hexokinase 2)",
                "HK3 (Hexokinase 3)",
                "HK4 (Hexokinase 4)",
                "HKDC1 (Hexokinase domain-containing protein 1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ALDOA (Fructose-bisphosphate aldolase A)",
                "ALDOB (Fructose-bisphosphate aldolase B)",
                "ENO1 (Enolase 1)",
                "GAPDH (Glyceraldehyde 3-phosphate dehydrogenase) (GAPDH)",
                "GCK (Glucokinase)",
                "HK1 (Hexokinase 1)",
                "HK2 (Hexokinase 2)",
                "HK3 (Hexokinase 3)",
                "HK4 (Hexokinase 4)",
                "HKDC1 (Hexokinase domain-containing protein 1)",
                "LDHA (Lactate dehydrogenase A)",
                "LDHB (Lactate dehydrogenase B)",
                "LDHC (Lactate dehydrogenase C)",
                "PFK1 (Phosphofructokinase 1)",
                "PFKM (Phosphofructokinase M)",
                "PGAM1 (Phosphoglycerate mutase 1)",
                "PGK1 (Phosphoglycerate kinase 1)",
                "PGM1 (Phosphoglycerate mutase 1)",
                "PKLR (Pyruvate kinase, liver)",
                "PKM2 (Pyruvate kinase isozyme M2)",
                "PYGL (Glycogen phosphorylase, liver)",
                "PYGM (Glycogen phosphorylase, muscle)",
                "TPI1 (Triosephosphate isomerase 1)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            "Hexokinase 1 (HK1)",
            "Hexokinase 2 (HK2)",
            "Glucokinase (GCK)",
            "Glucose-6-phosphatase (G6PC)",
            "Fructose-1,6-bisphosphatase 1 (FBP1)",
            "Fructose-1,6-bisphosphatase 2 (FBP2)",
            "Aldolase A (ALDOA)",
            "Aldolase B (ALDOB)",
            "Aldolase C (ALDOC)",
            "Triosephosphate isomerase 1 (TPI1)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphoglycerate kinase 1 (PGK1)",
            "Phosphoglycerate kinase 2 (PGK2)",
            "Phosphoglycerate mutase 1 (PGAM1)",
            "Phosphoglycerate mutase 2 (PGAM2)",
            "Enolase 1 (ENO1)",
            "Enolase 2 (ENO2)",
            "Enolase 3 (ENO3)",
            "Pyruvate kinase M1 (PKM1)",
            "Pyruvate kinase M2 (PKM2)",
            "Pyruvate kinase L (PKL)",
            "Pyruvate kinase R (PKR)",
            "Lactate dehydrogenase A (LDHA)",
            "Lactate dehydrogenase B (LDHB)",
            "Lactate dehydrogenase C (LDHC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphatase (G6PC)",
                "Fructose-1,6-bisphosphatase 1 (FBP1)",
                "Fructose-1,6-bisphosphatase 2 (FBP2)",
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Triosephosphate isomerase 1 (TPI1)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Pyruvate kinase M1 (PKM1)",
                "Pyruvate kinase M2 (PKM2)",
                "Pyruvate kinase L (PKL)",
                "Pyruvate kinase R (PKR)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)"
            ],
            "mismatches": [
                "Lactate dehydrogenase C (LDHC)"
            ],
            "true_referents": [
                "Aldolase A (ALDOA)",
                "Aldolase B (ALDOB)",
                "Aldolase C (ALDOC)",
                "Enolase 1 (ENO1)",
                "Enolase 2 (ENO2)",
                "Enolase 3 (ENO3)",
                "Fructose-1,6-bisphosphatase 1 (FBP1)",
                "Fructose-1,6-bisphosphatase 2 (FBP2)",
                "Glucokinase (GCK)",
                "Glucose-6-phosphatase (G6PC)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Hexokinase 1 (HK1)",
                "Hexokinase 2 (HK2)",
                "Lactate dehydrogenase A (LDHA)",
                "Lactate dehydrogenase B (LDHB)",
                "Phosphoglycerate kinase 1 (PGK1)",
                "Phosphoglycerate kinase 2 (PGK2)",
                "Phosphoglycerate mutase 1 (PGAM1)",
                "Phosphoglycerate mutase 2 (PGAM2)",
                "Pyruvate kinase L (PKL)",
                "Pyruvate kinase M1 (PKM1)",
                "Pyruvate kinase M2 (PKM2)",
                "Pyruvate kinase R (PKR)",
                "Triosephosphate isomerase 1 (TPI1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "glycolysis pathway gene",
        "domain": "biology",
        "response": [
            {
                "Referent": "Hexokinase",
                "Canonical Name": "HK1"
            },
            {
                "Referent": "Glucokinase",
                "Canonical Name": "GCK"
            },
            {
                "Referent": "Phosphofructokinase",
                "Canonical Name": "PFK1"
            },
            {
                "Referent": "Pyruvate kinase",
                "Canonical Name": "PK"
            },
            {
                "Referent": "Enolase",
                "Canonical Name": "ENO1"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase",
                "Canonical Name": "PDK1"
            },
            {
                "Referent": "Phosphoglycerate mutase",
                "Canonical Name": "PGAM1"
            },
            {
                "Referent": "Enolase 2",
                "Canonical Name": "ENO2"
            },
            {
                "Referent": "Triosephosphate isomerase",
                "Canonical Name": "TPI1"
            },
            {
                "Referent": "Aldolase A",
                "Canonical Name": "ALDOA"
            },
            {
                "Referent": "Fructose bisphosphate aldolase",
                "Canonical Name": "ALDOC"
            },
            {
                "Referent": "Glyceraldehyde 3-phosphate dehydrogenase",
                "Canonical Name": "GAPDH"
            },
            {
                "Referent": "Phosphoglycerate kinase",
                "Canonical Name": "PGK1"
            },
            {
                "Referent": "Pyruvate kinase M2",
                "Canonical Name": "PKM2"
            },
            {
                "Referent": "L-lactate dehydrogenase",
                "Canonical Name": "LDH"
            },
            {
                "Referent": "Pyruvate dehydrogenase",
                "Canonical Name": "PDH"
            },
            {
                "Referent": "Phosphoglycerate mutase 2",
                "Canonical Name": "PGAM2"
            },
            {
                "Referent": "Phosphoglycerate mutase 1",
                "Canonical Name": "PGAM1"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 4",
                "Canonical Name": "PDK4"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 3",
                "Canonical Name": "PDK3"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 2",
                "Canonical Name": "PDK2"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 1",
                "Canonical Name": "PDK1"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 4",
                "Canonical Name": "PDK4"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 3",
                "Canonical Name": "PDK3"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 2",
                "Canonical Name": "PDK2"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 1",
                "Canonical Name": "PDK1"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 4",
                "Canonical Name": "PDK4"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 3",
                "Canonical Name": "PDK3"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 2",
                "Canonical Name": "PDK2"
            },
            {
                "Referent": "Pyruvate dehydrogenase kinase 1",
                "Canonical Name": "PDK1"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexokinase",
                "Glucokinase",
                "Phosphofructokinase",
                "Pyruvate kinase",
                "Enolase",
                "Pyruvate dehydrogenase kinase",
                "Phosphoglycerate mutase",
                "Enolase 2",
                "Triosephosphate isomerase",
                "Aldolase A",
                "Fructose bisphosphate aldolase",
                "Glyceraldehyde 3-phosphate dehydrogenase",
                "Phosphoglycerate kinase",
                "Pyruvate kinase M2",
                "L-lactate dehydrogenase",
                "Pyruvate dehydrogenase",
                "Phosphoglycerate mutase 2",
                "Phosphoglycerate mutase 1",
                "Pyruvate dehydrogenase kinase 4",
                "Pyruvate dehydrogenase kinase 3",
                "Pyruvate dehydrogenase kinase 2",
                "Pyruvate dehydrogenase kinase 1"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Aldolase A\", \"Canonical Name\": \"ALDOA\"}",
                "{\"Referent\": \"Enolase 2\", \"Canonical Name\": \"ENO2\"}",
                "{\"Referent\": \"Enolase\", \"Canonical Name\": \"ENO1\"}",
                "{\"Referent\": \"Fructose bisphosphate aldolase\", \"Canonical Name\": \"ALDOC\"}",
                "{\"Referent\": \"Glucokinase\", \"Canonical Name\": \"GCK\"}",
                "{\"Referent\": \"Glyceraldehyde 3-phosphate dehydrogenase\", \"Canonical Name\": \"GAPDH\"}",
                "{\"Referent\": \"Hexokinase\", \"Canonical Name\": \"HK1\"}",
                "{\"Referent\": \"L-lactate dehydrogenase\", \"Canonical Name\": \"LDH\"}",
                "{\"Referent\": \"Phosphofructokinase\", \"Canonical Name\": \"PFK1\"}",
                "{\"Referent\": \"Phosphoglycerate kinase\", \"Canonical Name\": \"PGK1\"}",
                "{\"Referent\": \"Phosphoglycerate mutase 1\", \"Canonical Name\": \"PGAM1\"}",
                "{\"Referent\": \"Phosphoglycerate mutase 2\", \"Canonical Name\": \"PGAM2\"}",
                "{\"Referent\": \"Phosphoglycerate mutase\", \"Canonical Name\": \"PGAM1\"}",
                "{\"Referent\": \"Pyruvate dehydrogenase kinase 1\", \"Canonical Name\": \"PDK1\"}",
                "{\"Referent\": \"Pyruvate dehydrogenase kinase 2\", \"Canonical Name\": \"PDK2\"}",
                "{\"Referent\": \"Pyruvate dehydrogenase kinase 3\", \"Canonical Name\": \"PDK3\"}",
                "{\"Referent\": \"Pyruvate dehydrogenase kinase 4\", \"Canonical Name\": \"PDK4\"}",
                "{\"Referent\": \"Pyruvate dehydrogenase kinase\", \"Canonical Name\": \"PDK1\"}",
                "{\"Referent\": \"Pyruvate dehydrogenase\", \"Canonical Name\": \"PDH\"}",
                "{\"Referent\": \"Pyruvate kinase M2\", \"Canonical Name\": \"PKM2\"}",
                "{\"Referent\": \"Pyruvate kinase\", \"Canonical Name\": \"PK\"}",
                "{\"Referent\": \"Triosephosphate isomerase\", \"Canonical Name\": \"TPI1\"}"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    }
]