[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Transketolase (TKT)",
            "Transaldolase (TALDO1)",
            "6-Phosphogluconate Dehydrogenase (PGD)",
            "Ribose-5-Phosphate Isomerase A (RPIA)",
            "Ribulose-5-Phosphate 3-Epimerase (RPE)",
            "Glucose-6-Phosphate Dehydrogenase (G6PD)",
            "Ribokinase (RHK)",
            "Xylulokinase (XYLK)",
            "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
            "Phosphoglucomutase 1 (PGM1)",
            "Ribose-5-Phosphate Isomerase B (RPIB)",
            "Phosphoribosyl Pyrophosphate Synthetase 1 (PRPS1)",
            "Phosphoribosyl Pyrophosphate Synthetase 2 (PRPS2)",
            "Phosphoribosyl Pyrophosphate Amidotransferase (PAICS)",
            "5-Aminolevulinate Synthase 2 (ALAS2)",
            "5-Aminolevulinate Synthase 1 (ALAS1)",
            "Phosphoribosylformylglycinamidine Synthase Small Subunit (PFAS)",
            "Phosphoribosylformylglycinamidine Synthase Large Subunit (PFARS)",
            "5-Aminolevulinate Dehydratase 1 (ALAD)",
            "Uroporphyrinogen III Synthase (UROS)",
            "Uroporphyrinogen Decarboxylase (UROD)",
            "Coproporphyrinogen III Oxidase (CPOX)",
            "Heme Synthase (HMBS)",
            "Heme Oxygenase 1 (HMOX1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Transketolase (TKT)",
                "Transaldolase (TALDO1)",
                "6-Phosphogluconate Dehydrogenase (PGD)",
                "Ribose-5-Phosphate Isomerase A (RPIA)",
                "Ribulose-5-Phosphate 3-Epimerase (RPE)",
                "Glucose-6-Phosphate Dehydrogenase (G6PD)",
                "Ribokinase (RHK)",
                "Xylulokinase (XYLK)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Phosphoglucomutase 1 (PGM1)",
                "Ribose-5-Phosphate Isomerase B (RPIB)",
                "Phosphoribosyl Pyrophosphate Synthetase 1 (PRPS1)",
                "Phosphoribosyl Pyrophosphate Synthetase 2 (PRPS2)",
                "Phosphoribosyl Pyrophosphate Amidotransferase (PAICS)",
                "5-Aminolevulinate Synthase 2 (ALAS2)",
                "5-Aminolevulinate Synthase 1 (ALAS1)",
                "Phosphoribosylformylglycinamidine Synthase Small Subunit (PFAS)",
                "Phosphoribosylformylglycinamidine Synthase Large Subunit (PFARS)",
                "5-Aminolevulinate Dehydratase 1 (ALAD)",
                "Uroporphyrinogen III Synthase (UROS)",
                "Uroporphyrinogen Decarboxylase (UROD)",
                "Coproporphyrinogen III Oxidase (CPOX)",
                "Heme Synthase (HMBS)",
                "Heme Oxygenase 1 (HMOX1)"
            ],
            "mismatches": [],
            "true_referents": [
                "5-Aminolevulinate Dehydratase 1 (ALAD)",
                "5-Aminolevulinate Synthase 1 (ALAS1)",
                "5-Aminolevulinate Synthase 2 (ALAS2)",
                "6-Phosphogluconate Dehydrogenase (PGD)",
                "Coproporphyrinogen III Oxidase (CPOX)",
                "Glucose-6-Phosphate Dehydrogenase (G6PD)",
                "Glyceraldehyde-3-Phosphate Dehydrogenase (GAPDH)",
                "Heme Oxygenase 1 (HMOX1)",
                "Heme Synthase (HMBS)",
                "Phosphoglucomutase 1 (PGM1)",
                "Phosphoribosyl Pyrophosphate Amidotransferase (PAICS)",
                "Phosphoribosyl Pyrophosphate Synthetase 1 (PRPS1)",
                "Phosphoribosyl Pyrophosphate Synthetase 2 (PRPS2)",
                "Phosphoribosylformylglycinamidine Synthase Large Subunit (PFARS)",
                "Phosphoribosylformylglycinamidine Synthase Small Subunit (PFAS)",
                "Ribokinase (RHK)",
                "Ribose-5-Phosphate Isomerase A (RPIA)",
                "Ribose-5-Phosphate Isomerase B (RPIB)",
                "Ribulose-5-Phosphate 3-Epimerase (RPE)",
                "Transaldolase (TALDO1)",
                "Transketolase (TKT)",
                "Uroporphyrinogen Decarboxylase (UROD)",
                "Uroporphyrinogen III Synthase (UROS)",
                "Xylulokinase (XYLK)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Transaldolase 1 (TALDO1)",
            "Transketolase (TKT)",
            "Ribose-5-phosphate isomerase A (RPIA)",
            "Ribulose-5-phosphate 3-epimerase (RPE)",
            "6-Phosphogluconate dehydrogenase (6PGD)",
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "Ribose-5-phosphate ketol-isomerase (RKI)",
            "Arabinose-5-phosphate isomerase (A5PI)",
            "Ribulose-phosphate 3-epimerase (RPE)",
            "Ribose-phosphate diphosphokinase (PRPS1)",
            "Ribose-5-phosphate isomerase B (RPIB)",
            "Transaldolase 2 (TALDO2)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Transketolase-like 1 (TKTL1)",
            "Transketolase-like 2 (TKTL2)",
            "Transketolase-like 3 (TKTL3)",
            "Transketolase-like 4 (TKTL4)",
            "Glucose-6-phosphate isomerase 2 (GPI2)",
            "Ribulose-5-phosphate 4-epimerase (RPE2)",
            "Ribose-5-phosphate isomerase C (RPI3)",
            "6-Phosphogluconolactonase (PGLS)",
            "6-Phosphogluconate dehydratase (6PGD)",
            "Ribose-5-phosphate isomerase D (RPI4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Transaldolase 1 (TALDO1)",
                "Transketolase (TKT)",
                "Ribose-5-phosphate isomerase A (RPIA)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "6-Phosphogluconate dehydrogenase (6PGD)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Ribose-5-phosphate ketol-isomerase (RKI)",
                "Arabinose-5-phosphate isomerase (A5PI)",
                "Ribose-phosphate diphosphokinase (PRPS1)",
                "Ribose-5-phosphate isomerase B (RPIB)",
                "Transaldolase 2 (TALDO2)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Transketolase-like 1 (TKTL1)",
                "Transketolase-like 2 (TKTL2)",
                "Transketolase-like 3 (TKTL3)",
                "Transketolase-like 4 (TKTL4)",
                "Glucose-6-phosphate isomerase 2 (GPI2)",
                "Ribulose-5-phosphate 4-epimerase (RPE2)",
                "Ribose-5-phosphate isomerase C (RPI3)",
                "6-Phosphogluconolactonase (PGLS)",
                "6-Phosphogluconate dehydratase (6PGD)",
                "Ribose-5-phosphate isomerase D (RPI4)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate dehydratase (6PGD)",
                "6-Phosphogluconate dehydrogenase (6PGD)",
                "6-Phosphogluconolactonase (PGLS)",
                "Arabinose-5-phosphate isomerase (A5PI)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Glucose-6-phosphate isomerase 2 (GPI2)",
                "Ribose-5-phosphate isomerase A (RPIA)",
                "Ribose-5-phosphate isomerase B (RPIB)",
                "Ribose-5-phosphate isomerase C (RPI3)",
                "Ribose-5-phosphate isomerase D (RPI4)",
                "Ribose-5-phosphate ketol-isomerase (RKI)",
                "Ribose-phosphate diphosphokinase (PRPS1)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Ribulose-5-phosphate 4-epimerase (RPE2)",
                "Ribulose-phosphate 3-epimerase (RPE)",
                "Transaldolase 1 (TALDO1)",
                "Transaldolase 2 (TALDO2)",
                "Transketolase (TKT)",
                "Transketolase-like 1 (TKTL1)",
                "Transketolase-like 2 (TKTL2)",
                "Transketolase-like 3 (TKTL3)",
                "Transketolase-like 4 (TKTL4)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-Phosphogluconolactonase (PGLS)",
            "6-Phosphogluconate dehydrogenase (PGD)",
            "Ribose-5-phosphate isomerase (RPI)",
            "Ribulose-phosphate 3-epimerase (RPE)",
            "Transketolase (TKT)",
            "Transaldolase (TALDO1)",
            "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
            "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
            "Phosphoribosyl pyrophosphate synthetase 3 (PRPS3)",
            "Transketolase-like protein 1 (TKTL1)",
            "Transketolase-like protein 2 (TKTL2)",
            "Transaldolase 2 (TALDO2)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
            "Ribose-5-phosphate isomerase B (RPIB)",
            "6-Phosphogluconolactonase-like protein 1 (PGLS2)",
            "6-Phosphogluconate dehydrogenase-like protein 1 (PGD2)",
            "Ribose-5-phosphate isomerase C (RPIC)",
            "Ribulose-phosphate 3-epimerase-like protein 1 (RPEL1)",
            "Transketolase-like protein 3 (TKTL3)",
            "Transaldolase-like protein 1 (TALDO1L1)",
            "Phosphoribosyl pyrophosphate synthetase 4 (PRPS4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-Phosphogluconolactonase (PGLS)",
                "6-Phosphogluconate dehydrogenase (PGD)",
                "Ribose-5-phosphate isomerase (RPI)",
                "Ribulose-phosphate 3-epimerase (RPE)",
                "Transketolase (TKT)",
                "Transaldolase (TALDO1)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase 3 (PRPS3)",
                "Transketolase-like protein 1 (TKTL1)",
                "Transketolase-like protein 2 (TKTL2)",
                "Transaldolase 2 (TALDO2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
                "Ribose-5-phosphate isomerase B (RPIB)",
                "6-Phosphogluconolactonase-like protein 1 (PGLS2)",
                "6-Phosphogluconate dehydrogenase-like protein 1 (PGD2)",
                "Ribose-5-phosphate isomerase C (RPIC)",
                "Ribulose-phosphate 3-epimerase-like protein 1 (RPEL1)",
                "Transketolase-like protein 3 (TKTL3)",
                "Transaldolase-like protein 1 (TALDO1L1)",
                "Phosphoribosyl pyrophosphate synthetase 4 (PRPS4)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate dehydrogenase (PGD)",
                "6-Phosphogluconate dehydrogenase-like protein 1 (PGD2)",
                "6-Phosphogluconolactonase (PGLS)",
                "6-Phosphogluconolactonase-like protein 1 (PGLS2)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase 3 (PRPS3)",
                "Phosphoribosyl pyrophosphate synthetase 4 (PRPS4)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
                "Ribose-5-phosphate isomerase (RPI)",
                "Ribose-5-phosphate isomerase B (RPIB)",
                "Ribose-5-phosphate isomerase C (RPIC)",
                "Ribulose-phosphate 3-epimerase (RPE)",
                "Ribulose-phosphate 3-epimerase-like protein 1 (RPEL1)",
                "Transaldolase (TALDO1)",
                "Transaldolase 2 (TALDO2)",
                "Transaldolase-like protein 1 (TALDO1L1)",
                "Transketolase (TKT)",
                "Transketolase-like protein 1 (TKTL1)",
                "Transketolase-like protein 2 (TKTL2)",
                "Transketolase-like protein 3 (TKTL3)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-Phosphogluconolactase (PGL)",
            "Phosphoglucomutase 1 (PGM1)",
            "Transketolase (TKT)",
            "Transaldolase (TAL)",
            "Ribose-5-phosphate isomerase (RPE)",
            "Ribulose-phosphate 3-epimerase (RPI)",
            "G6PD deficiency gene (G6PD)",
            "PGL gene (PGL)",
            "PGM1 gene (PGM1)",
            "TKT gene (TKT)",
            "TAL gene (TAL)",
            "RPE gene (RPE)",
            "RPI gene (RPI)",
            "Human G6PD gene (G6PD)",
            "Mouse Tkt gene (Tkt)",
            "Escherichia coli tal gene (tal)",
            "Saccharomyces cerevisiae ZWF1 (G6PD analog)",
            "Arabidopsis thaliana PGL gene (AtPGL)",
            "G6PD pseudogene (G6PD-ps)",
            "TKT regulatory region",
            "TAL promoter sequence",
            "RPI mRNA transcript",
            "Human PGM1 isoform 1 gene (PGM1-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-Phosphogluconolactase (PGL)",
                "Phosphoglucomutase 1 (PGM1)",
                "Transketolase (TKT)",
                "Transaldolase (TAL)",
                "Ribose-5-phosphate isomerase (RPE)",
                "Ribulose-phosphate 3-epimerase (RPI)",
                "G6PD deficiency gene (G6PD)",
                "PGL gene (PGL)",
                "PGM1 gene (PGM1)",
                "TKT gene (TKT)",
                "TAL gene (TAL)",
                "RPE gene (RPE)",
                "RPI gene (RPI)",
                "Human G6PD gene (G6PD)",
                "Mouse Tkt gene (Tkt)",
                "Escherichia coli tal gene (tal)",
                "Saccharomyces cerevisiae ZWF1 (G6PD analog)",
                "Arabidopsis thaliana PGL gene (AtPGL)",
                "G6PD pseudogene (G6PD-ps)",
                "TKT regulatory region",
                "TAL promoter sequence",
                "RPI mRNA transcript",
                "Human PGM1 isoform 1 gene (PGM1-1)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconolactase (PGL)",
                "Arabidopsis thaliana PGL gene (AtPGL)",
                "Escherichia coli tal gene (tal)",
                "G6PD deficiency gene (G6PD)",
                "G6PD pseudogene (G6PD-ps)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Human G6PD gene (G6PD)",
                "Human PGM1 isoform 1 gene (PGM1-1)",
                "Mouse Tkt gene (Tkt)",
                "PGL gene (PGL)",
                "PGM1 gene (PGM1)",
                "Phosphoglucomutase 1 (PGM1)",
                "RPE gene (RPE)",
                "RPI gene (RPI)",
                "RPI mRNA transcript",
                "Ribose-5-phosphate isomerase (RPE)",
                "Ribulose-phosphate 3-epimerase (RPI)",
                "Saccharomyces cerevisiae ZWF1 (G6PD analog)",
                "TAL gene (TAL)",
                "TAL promoter sequence",
                "TKT gene (TKT)",
                "TKT regulatory region",
                "Transaldolase (TAL)",
                "Transketolase (TKT)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconolactonase (PGLS)",
            "6-phosphogluconate dehydrogenase (PGD)",
            "Transketolase (TKT)",
            "Transaldolase (TALDO1)",
            "Ribose-5-phosphate isomerase (RPIA)",
            "Ribulose-5-phosphate epimerase (RPE)",
            "Xylulose-5-phosphate phosphatase (X5PP)",
            "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
            "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
            "Phosphoribosyl pyrophosphate synthetase 3 (PRPS3)",
            "Phosphogluconate dehydrogenase (PGDH)",
            "Pentose phosphate pathway regulator (PPP1R15A)",
            "Hexose-6-phosphate dehydrogenase (H6PD)",
            "Glucose-6-phosphate isomerase (GPI)",
            "Phosphomannose isomerase (MPI)",
            "Phosphoribosylformylglycinamidine synthase (PFAS)",
            "Phosphoribosylglycinamide formyltransferase (GART)",
            "Phosphoribosylglycinamide synthetase (GARS)",
            "Phosphoribosylglycinamide cyclo-ligase (PFGL)",
            "Phosphoribosylaminoimidazole carboxylase (PAICS)",
            "Phosphoribosylaminoimidazole-succinocarboxamide synthase (PAICS)",
            "Phosphoribosylaminoimidazole-succinocarboxamide lyase (PAICL)",
            "Phosphoribosylaminoimidazole carboxamide formyltransferase (AICARFT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconolactonase (PGLS)",
                "6-phosphogluconate dehydrogenase (PGD)",
                "Transketolase (TKT)",
                "Transaldolase (TALDO1)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate epimerase (RPE)",
                "Xylulose-5-phosphate phosphatase (X5PP)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase 3 (PRPS3)",
                "Pentose phosphate pathway regulator (PPP1R15A)",
                "Hexose-6-phosphate dehydrogenase (H6PD)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Phosphomannose isomerase (MPI)",
                "Phosphoribosylformylglycinamidine synthase (PFAS)",
                "Phosphoribosylglycinamide formyltransferase (GART)",
                "Phosphoribosylglycinamide synthetase (GARS)",
                "Phosphoribosylglycinamide cyclo-ligase (PFGL)",
                "Phosphoribosylaminoimidazole carboxylase (PAICS)",
                "Phosphoribosylaminoimidazole-succinocarboxamide synthase (PAICS)",
                "Phosphoribosylaminoimidazole-succinocarboxamide lyase (PAICL)",
                "Phosphoribosylaminoimidazole carboxamide formyltransferase (AICARFT)"
            ],
            "mismatches": [
                "Phosphogluconate dehydrogenase (PGDH)"
            ],
            "true_referents": [
                "6-phosphogluconate dehydrogenase (PGD)",
                "6-phosphogluconolactonase (PGLS)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Glucose-6-phosphate isomerase (GPI)",
                "Hexose-6-phosphate dehydrogenase (H6PD)",
                "Pentose phosphate pathway regulator (PPP1R15A)",
                "Phosphogluconate dehydrogenase (PGDH)",
                "Phosphomannose isomerase (MPI)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase 3 (PRPS3)",
                "Phosphoribosylaminoimidazole carboxamide formyltransferase (AICARFT)",
                "Phosphoribosylaminoimidazole carboxylase (PAICS)",
                "Phosphoribosylaminoimidazole-succinocarboxamide lyase (PAICL)",
                "Phosphoribosylaminoimidazole-succinocarboxamide synthase (PAICS)",
                "Phosphoribosylformylglycinamidine synthase (PFAS)",
                "Phosphoribosylglycinamide cyclo-ligase (PFGL)",
                "Phosphoribosylglycinamide formyltransferase (GART)",
                "Phosphoribosylglycinamide synthetase (GARS)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate epimerase (RPE)",
                "Transaldolase (TALDO1)",
                "Transketolase (TKT)",
                "Xylulose-5-phosphate phosphatase (X5PP)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-Phosphogluconolactonase (PGLS)",
            "6-Phosphogluconate dehydrogenase (PGD)",
            "Transaldolase (TALDO1)",
            "Transketolase (TKT)",
            "Phosphoribulose kinase (PRPS1)",
            "Ribulose-5-phosphate epimerase (RPE)",
            "Ribose-5-phosphate isomerase (RPIA)",
            "NADP+-dependent malate dehydrogenase (MDH1)",
            "NADP+-dependent isocitrate dehydrogenase (IDH1)",
            "NADP+-dependent glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Fructose-1,6-bisphosphatase (FBP1)",
            "Aldose reductase (AKR1B1)",
            "Aldose 1-epimerase (GALM)",
            "Mannose-6-phosphate isomerase (MPI)",
            "Phosphoglucomutase (PGM)",
            "Glucose-1-phosphate adenylyltransferase (ADP-Glc pyrophosphorylase)",
            "Phosphoenolpyruvate carboxykinase (PCK1)",
            "Pyruvate kinase (PKM)",
            "Phosphofructokinase (PFK)",
            "Hexokinase (HK)",
            "Glucose transporter type 1 (GLUT1)",
            "Glucose transporter type 2 (GLUT2)",
            "Sorbitol dehydrogenase (SORD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-Phosphogluconolactonase (PGLS)",
                "6-Phosphogluconate dehydrogenase (PGD)",
                "Transaldolase (TALDO1)",
                "Transketolase (TKT)",
                "Phosphoribulose kinase (PRPS1)",
                "Ribulose-5-phosphate epimerase (RPE)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "NADP+-dependent malate dehydrogenase (MDH1)",
                "NADP+-dependent isocitrate dehydrogenase (IDH1)",
                "NADP+-dependent glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Fructose-1,6-bisphosphatase (FBP1)",
                "Aldose reductase (AKR1B1)",
                "Aldose 1-epimerase (GALM)",
                "Mannose-6-phosphate isomerase (MPI)",
                "Phosphoglucomutase (PGM)",
                "Glucose-1-phosphate adenylyltransferase (ADP-Glc pyrophosphorylase)",
                "Phosphoenolpyruvate carboxykinase (PCK1)",
                "Pyruvate kinase (PKM)",
                "Phosphofructokinase (PFK)",
                "Hexokinase (HK)",
                "Glucose transporter type 1 (GLUT1)",
                "Glucose transporter type 2 (GLUT2)",
                "Sorbitol dehydrogenase (SORD)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate dehydrogenase (PGD)",
                "6-Phosphogluconolactonase (PGLS)",
                "Aldose 1-epimerase (GALM)",
                "Aldose reductase (AKR1B1)",
                "Fructose-1,6-bisphosphatase (FBP1)",
                "Glucose transporter type 1 (GLUT1)",
                "Glucose transporter type 2 (GLUT2)",
                "Glucose-1-phosphate adenylyltransferase (ADP-Glc pyrophosphorylase)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Hexokinase (HK)",
                "Mannose-6-phosphate isomerase (MPI)",
                "NADP+-dependent glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "NADP+-dependent isocitrate dehydrogenase (IDH1)",
                "NADP+-dependent malate dehydrogenase (MDH1)",
                "Phosphoenolpyruvate carboxykinase (PCK1)",
                "Phosphofructokinase (PFK)",
                "Phosphoglucomutase (PGM)",
                "Phosphoribulose kinase (PRPS1)",
                "Pyruvate kinase (PKM)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate epimerase (RPE)",
                "Sorbitol dehydrogenase (SORD)",
                "Transaldolase (TALDO1)",
                "Transketolase (TKT)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase gene (G6PD)",
            "6-phosphogluconolactonase gene (PGLS)",
            "6-phosphogluconate dehydrogenase gene (PGD)",
            "Ribose-5-phosphate isomerase gene (RPIA)",
            "Ribulose-5-phosphate-3-epimerase gene (RPE)",
            "Transketolase gene (TKT)",
            "Transaldolase gene (TALDO1)",
            "Phosphoglucomutase gene (PGM)",
            "Phosphopentomutase gene (PPM1)",
            "Ribokinase gene (RBKS)",
            "Ribose-phosphate pyrophosphokinase gene (PRPS1)",
            "Phosphoribosyl pyrophosphate synthetase gene (PRPS2)",
            "Phosphoribosyl pyrophosphate amidotransferase gene (PPAT)",
            "Nucleoside-diphosphate kinase gene (NME1)",
            "Nucleoside-diphosphate kinase gene (NME2)",
            "Adenylate kinase gene (AK1)",
            "Adenylate kinase gene (AK2)",
            "Adenylate kinase gene (AK3)",
            "Adenylate kinase gene (AK4)",
            "Adenylate kinase gene (AK5)",
            "Adenylate kinase gene (AK6)",
            "Adenylate kinase gene (AK7)",
            "Adenylate kinase gene (AK8)",
            "Adenylate kinase gene (AK9)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase gene (G6PD)",
                "6-phosphogluconolactonase gene (PGLS)",
                "6-phosphogluconate dehydrogenase gene (PGD)",
                "Ribose-5-phosphate isomerase gene (RPIA)",
                "Ribulose-5-phosphate-3-epimerase gene (RPE)",
                "Transketolase gene (TKT)",
                "Transaldolase gene (TALDO1)",
                "Phosphoglucomutase gene (PGM)",
                "Phosphopentomutase gene (PPM1)",
                "Ribokinase gene (RBKS)",
                "Ribose-phosphate pyrophosphokinase gene (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase gene (PRPS2)",
                "Phosphoribosyl pyrophosphate amidotransferase gene (PPAT)",
                "Nucleoside-diphosphate kinase gene (NME1)",
                "Nucleoside-diphosphate kinase gene (NME2)",
                "Adenylate kinase gene (AK1)",
                "Adenylate kinase gene (AK2)",
                "Adenylate kinase gene (AK3)",
                "Adenylate kinase gene (AK4)",
                "Adenylate kinase gene (AK5)",
                "Adenylate kinase gene (AK6)",
                "Adenylate kinase gene (AK7)",
                "Adenylate kinase gene (AK8)",
                "Adenylate kinase gene (AK9)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphogluconate dehydrogenase gene (PGD)",
                "6-phosphogluconolactonase gene (PGLS)",
                "Adenylate kinase gene (AK1)",
                "Adenylate kinase gene (AK2)",
                "Adenylate kinase gene (AK3)",
                "Adenylate kinase gene (AK4)",
                "Adenylate kinase gene (AK5)",
                "Adenylate kinase gene (AK6)",
                "Adenylate kinase gene (AK7)",
                "Adenylate kinase gene (AK8)",
                "Adenylate kinase gene (AK9)",
                "Glucose-6-phosphate dehydrogenase gene (G6PD)",
                "Nucleoside-diphosphate kinase gene (NME1)",
                "Nucleoside-diphosphate kinase gene (NME2)",
                "Phosphoglucomutase gene (PGM)",
                "Phosphopentomutase gene (PPM1)",
                "Phosphoribosyl pyrophosphate amidotransferase gene (PPAT)",
                "Phosphoribosyl pyrophosphate synthetase gene (PRPS2)",
                "Ribokinase gene (RBKS)",
                "Ribose-5-phosphate isomerase gene (RPIA)",
                "Ribose-phosphate pyrophosphokinase gene (PRPS1)",
                "Ribulose-5-phosphate-3-epimerase gene (RPE)",
                "Transaldolase gene (TALDO1)",
                "Transketolase gene (TKT)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconolactonase (6PGL)",
            "6-phosphogluconate dehydrogenase (6PGD)",
            "Transketolase (TKT)",
            "Transaldolase (TALDO)",
            "Ribose-5-phosphate isomerase (RPIA)",
            "Ribulose-5-phosphate 3-epimerase (RPE)",
            "Phosphogluconate dehydrogenase (PGD)",
            "Ribulose-phosphate 3-epimerase (RPE)",
            "Phosphopentose isomerase (PPI)",
            "Ribose-phosphate pyrophosphokinase (PRPS1)",
            "Ribose-phosphate diphosphokinase (PRPS1)",
            "Ribose-phosphate diphosphokinase (PRPS2)",
            "Ribose-phosphate diphosphokinase (PRPS1L1)",
            "Ribose-phosphate diphosphokinase (PRPS1L2)",
            "Ribose-phosphate diphosphokinase (PRPS1L3)",
            "Ribose-phosphate diphosphokinase (PRPS1L4)",
            "Ribose-phosphate diphosphokinase (PRPS1L5)",
            "Ribose-phosphate diphosphokinase (PRPS1L6)",
            "Ribose-phosphate diphosphokinase (PRPS1L7)",
            "Ribose-phosphate diphosphokinase (PRPS1L8)",
            "Ribose-phosphate diphosphokinase (PRPS1L9)",
            "Ribose-phosphate diphosphokinase (PRPS1L10)",
            "Ribose-phosphate diphosphokinase (PRPS1L11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconolactonase (6PGL)",
                "6-phosphogluconate dehydrogenase (6PGD)",
                "Transketolase (TKT)",
                "Transaldolase (TALDO)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Phosphogluconate dehydrogenase (PGD)",
                "Ribulose-phosphate 3-epimerase (RPE)",
                "Phosphopentose isomerase (PPI)",
                "Ribose-phosphate pyrophosphokinase (PRPS1)",
                "Ribose-phosphate diphosphokinase (PRPS2)",
                "Ribose-phosphate diphosphokinase (PRPS1L1)",
                "Ribose-phosphate diphosphokinase (PRPS1L2)",
                "Ribose-phosphate diphosphokinase (PRPS1L3)",
                "Ribose-phosphate diphosphokinase (PRPS1L4)",
                "Ribose-phosphate diphosphokinase (PRPS1L5)",
                "Ribose-phosphate diphosphokinase (PRPS1L6)",
                "Ribose-phosphate diphosphokinase (PRPS1L7)",
                "Ribose-phosphate diphosphokinase (PRPS1L8)",
                "Ribose-phosphate diphosphokinase (PRPS1L9)",
                "Ribose-phosphate diphosphokinase (PRPS1L10)",
                "Ribose-phosphate diphosphokinase (PRPS1L11)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphogluconate dehydrogenase (6PGD)",
                "6-phosphogluconolactonase (6PGL)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Phosphogluconate dehydrogenase (PGD)",
                "Phosphopentose isomerase (PPI)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribose-phosphate diphosphokinase (PRPS1)",
                "Ribose-phosphate diphosphokinase (PRPS1L1)",
                "Ribose-phosphate diphosphokinase (PRPS1L10)",
                "Ribose-phosphate diphosphokinase (PRPS1L11)",
                "Ribose-phosphate diphosphokinase (PRPS1L2)",
                "Ribose-phosphate diphosphokinase (PRPS1L3)",
                "Ribose-phosphate diphosphokinase (PRPS1L4)",
                "Ribose-phosphate diphosphokinase (PRPS1L5)",
                "Ribose-phosphate diphosphokinase (PRPS1L6)",
                "Ribose-phosphate diphosphokinase (PRPS1L7)",
                "Ribose-phosphate diphosphokinase (PRPS1L8)",
                "Ribose-phosphate diphosphokinase (PRPS1L9)",
                "Ribose-phosphate diphosphokinase (PRPS2)",
                "Ribose-phosphate pyrophosphokinase (PRPS1)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Ribulose-phosphate 3-epimerase (RPE)",
                "Transaldolase (TALDO)",
                "Transketolase (TKT)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-Phosphogluconolactonase (PGLS)",
            "6-Phosphogluconate dehydrogenase (PGD)",
            "Ribose-5-phosphate isomerase A (RPIA)",
            "Ribose-5-phosphate isomerase B (RPIB)",
            "Ribulose-5-phosphate 3-epimerase (RPE)",
            "Transketolase (TKT)",
            "Transketolase-like 1 (TKTL1)",
            "Transketolase-like 2 (TKTL2)",
            "Transaldolase 1 (TALDO1)",
            "Transaldolase 2 (TALDO2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-Phosphogluconolactonase (PGLS)",
                "6-Phosphogluconate dehydrogenase (PGD)",
                "Ribose-5-phosphate isomerase A (RPIA)",
                "Ribose-5-phosphate isomerase B (RPIB)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Transketolase (TKT)",
                "Transketolase-like 1 (TKTL1)",
                "Transketolase-like 2 (TKTL2)",
                "Transaldolase 1 (TALDO1)",
                "Transaldolase 2 (TALDO2)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate dehydrogenase (PGD)",
                "6-Phosphogluconolactonase (PGLS)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Ribose-5-phosphate isomerase A (RPIA)",
                "Ribose-5-phosphate isomerase B (RPIB)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Transaldolase 1 (TALDO1)",
                "Transaldolase 2 (TALDO2)",
                "Transketolase (TKT)",
                "Transketolase-like 1 (TKTL1)",
                "Transketolase-like 2 (TKTL2)"
            ],
            "TP": 11,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconate dehydrogenase (PGD)",
            "Transketolase (TKT)",
            "Transaldolase (TALDO1)",
            "Ribose-5-phosphate isomerase (RPIA)",
            "Ribulose-5-phosphate 3-epimerase (RPE)",
            "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
            "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
            "Hexose-6-phosphate dehydrogenase (H6PD)",
            "Glucose-6-phosphate dehydrogenase X-linked (G6PDX)",
            "Transketolase-like 1 (TKTL1)",
            "Transketolase-like 2 (TKTL2)",
            "Phosphoglucomutase 1 (PGM1)",
            "Phosphoglucomutase 2 (PGM2)",
            "Phosphoglucomutase 3 (PGM3)",
            "Glucose phosphate isomerase (GPI)",
            "Fructose-1,6-bisphosphatase 1 (FBP1)",
            "Fructose-1,6-bisphosphatase 2 (FBP2)",
            "Phosphofructokinase, liver type (PFKL)",
            "Phosphofructokinase, muscle type (PFKM)",
            "Phosphofructokinase, platelet type (PFKP)",
            "Aldolase A, fructose-bisphosphate (ALDOA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconate dehydrogenase (PGD)",
                "Transketolase (TKT)",
                "Transaldolase (TALDO1)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
                "Hexose-6-phosphate dehydrogenase (H6PD)",
                "Glucose-6-phosphate dehydrogenase X-linked (G6PDX)",
                "Transketolase-like 1 (TKTL1)",
                "Transketolase-like 2 (TKTL2)",
                "Phosphoglucomutase 1 (PGM1)",
                "Phosphoglucomutase 2 (PGM2)",
                "Phosphoglucomutase 3 (PGM3)",
                "Glucose phosphate isomerase (GPI)",
                "Fructose-1,6-bisphosphatase 1 (FBP1)",
                "Fructose-1,6-bisphosphatase 2 (FBP2)",
                "Phosphofructokinase, liver type (PFKL)",
                "Phosphofructokinase, muscle type (PFKM)",
                "Phosphofructokinase, platelet type (PFKP)",
                "Aldolase A, fructose-bisphosphate (ALDOA)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphogluconate dehydrogenase (PGD)",
                "Aldolase A, fructose-bisphosphate (ALDOA)",
                "Fructose-1,6-bisphosphatase 1 (FBP1)",
                "Fructose-1,6-bisphosphatase 2 (FBP2)",
                "Glucose phosphate isomerase (GPI)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Glucose-6-phosphate dehydrogenase X-linked (G6PDX)",
                "Hexose-6-phosphate dehydrogenase (H6PD)",
                "Phosphofructokinase, liver type (PFKL)",
                "Phosphofructokinase, muscle type (PFKM)",
                "Phosphofructokinase, platelet type (PFKP)",
                "Phosphoglucomutase 1 (PGM1)",
                "Phosphoglucomutase 2 (PGM2)",
                "Phosphoglucomutase 3 (PGM3)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate 3-epimerase (RPE)",
                "Transaldolase (TALDO1)",
                "Transketolase (TKT)",
                "Transketolase-like 1 (TKTL1)",
                "Transketolase-like 2 (TKTL2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconolactonase (PGLS)",
            "6-phosphogluconate dehydrogenase (PGD)",
            "ribulose-5-phosphate isomerase (RPIA)",
            "ribulose-5-phosphate 3-epimerase (RPE)",
            "transketolase (TKT)",
            "transaldolase 1 (TALDO1)",
            "phosphopentose epimerase (PPME)",
            "phosphopentose isomerase (PPI)",
            "fructose-bisphosphate aldolase (ALDOA)",
            "fructose-bisphosphatase 1 (FBP1)",
            "phosphofructokinase (PFK)",
            "glucose-6-phosphate isomerase (GPI)",
            "hexose-6-phosphate dehydrogenase (H6PD)",
            "ribose-5-phosphate isomerase A (RPIA)",
            "sedoheptulokinase (SHPK)",
            "glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "phosphoglycerate kinase (PGK)",
            "phosphoglycerate mutase (PGAM)",
            "enolase (ENO)",
            "pyruvate kinase (PKM)",
            "lactate dehydrogenase A (LDHA)",
            "triose phosphate isomerase (TPI)",
            "phosphoribosyl pyrophosphate synthetase (PRPS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconolactonase (PGLS)",
                "6-phosphogluconate dehydrogenase (PGD)",
                "ribulose-5-phosphate isomerase (RPIA)",
                "ribulose-5-phosphate 3-epimerase (RPE)",
                "transketolase (TKT)",
                "transaldolase 1 (TALDO1)",
                "phosphopentose epimerase (PPME)",
                "phosphopentose isomerase (PPI)",
                "fructose-bisphosphate aldolase (ALDOA)",
                "fructose-bisphosphatase 1 (FBP1)",
                "phosphofructokinase (PFK)",
                "glucose-6-phosphate isomerase (GPI)",
                "hexose-6-phosphate dehydrogenase (H6PD)",
                "sedoheptulokinase (SHPK)",
                "glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "phosphoglycerate kinase (PGK)",
                "phosphoglycerate mutase (PGAM)",
                "enolase (ENO)",
                "pyruvate kinase (PKM)",
                "lactate dehydrogenase A (LDHA)",
                "triose phosphate isomerase (TPI)",
                "phosphoribosyl pyrophosphate synthetase (PRPS)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphogluconate dehydrogenase (PGD)",
                "6-phosphogluconolactonase (PGLS)",
                "enolase (ENO)",
                "fructose-bisphosphatase 1 (FBP1)",
                "fructose-bisphosphate aldolase (ALDOA)",
                "glucose-6-phosphate dehydrogenase (G6PD)",
                "glucose-6-phosphate isomerase (GPI)",
                "glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "hexose-6-phosphate dehydrogenase (H6PD)",
                "lactate dehydrogenase A (LDHA)",
                "phosphofructokinase (PFK)",
                "phosphoglycerate kinase (PGK)",
                "phosphoglycerate mutase (PGAM)",
                "phosphopentose epimerase (PPME)",
                "phosphopentose isomerase (PPI)",
                "phosphoribosyl pyrophosphate synthetase (PRPS)",
                "pyruvate kinase (PKM)",
                "ribose-5-phosphate isomerase A (RPIA)",
                "ribulose-5-phosphate 3-epimerase (RPE)",
                "ribulose-5-phosphate isomerase (RPIA)",
                "sedoheptulokinase (SHPK)",
                "transaldolase 1 (TALDO1)",
                "transketolase (TKT)",
                "triose phosphate isomerase (TPI)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconolactonase (PGLS)",
            "Glucosamine-6-phosphate deaminase (GNPDA)",
            "6-phosphogluconate dehydrogenase (PGD)",
            "Ribose-5-phosphate isomerase (RPIA)",
            "Ribulose-5-phosphate epimerase (RPE)",
            "Transketolase (TKT)",
            "Transaldolase (TALDO1)",
            "Glucose-6-phosphate 1-dehydrogenase (G6PD2)",
            "6-phosphogluconolactonase 2 (PGLS2)",
            "Phosphogluconate dehydrogenase (PGD2)",
            "Ribose-5-phosphate isomerase B (RPIBB)",
            "Ribulose-5-phosphate-3-epimerase (RPE2)",
            "Transketolase-like protein 1 (TKTL1)",
            "Transaldolase 2 (TALDO2)",
            "Glucose-6-phosphate dehydrogenase X-linked (G6PDX)",
            "6-phosphogluconolactonase 3 (PGLS3)",
            "Phosphogluconate dehydrogenase 3 (PGD3)",
            "Ribose-5-phosphate isomerase A (RPIA2)",
            "Ribulose-5-phosphate-3-epimerase-like 1 (RPE3L1)",
            "Transketolase-like protein 2 (TKTL2)",
            "Transaldolase 3 (TALDO3)",
            "Glucose-6-phosphate dehydrogenase 2 (G6PD3)",
            "6-phosphogluconolactonase 4 (PGLS4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconolactonase (PGLS)",
                "Glucosamine-6-phosphate deaminase (GNPDA)",
                "6-phosphogluconate dehydrogenase (PGD)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate epimerase (RPE)",
                "Transketolase (TKT)",
                "Transaldolase (TALDO1)",
                "Glucose-6-phosphate 1-dehydrogenase (G6PD2)",
                "6-phosphogluconolactonase 2 (PGLS2)",
                "Phosphogluconate dehydrogenase (PGD2)",
                "Ribose-5-phosphate isomerase B (RPIBB)",
                "Ribulose-5-phosphate-3-epimerase (RPE2)",
                "Transketolase-like protein 1 (TKTL1)",
                "Transaldolase 2 (TALDO2)",
                "Glucose-6-phosphate dehydrogenase X-linked (G6PDX)",
                "6-phosphogluconolactonase 3 (PGLS3)",
                "Phosphogluconate dehydrogenase 3 (PGD3)",
                "Ribose-5-phosphate isomerase A (RPIA2)",
                "Ribulose-5-phosphate-3-epimerase-like 1 (RPE3L1)",
                "Transketolase-like protein 2 (TKTL2)",
                "Transaldolase 3 (TALDO3)",
                "Glucose-6-phosphate dehydrogenase 2 (G6PD3)",
                "6-phosphogluconolactonase 4 (PGLS4)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphogluconate dehydrogenase (PGD)",
                "6-phosphogluconolactonase (PGLS)",
                "6-phosphogluconolactonase 2 (PGLS2)",
                "6-phosphogluconolactonase 3 (PGLS3)",
                "6-phosphogluconolactonase 4 (PGLS4)",
                "Glucosamine-6-phosphate deaminase (GNPDA)",
                "Glucose-6-phosphate 1-dehydrogenase (G6PD2)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Glucose-6-phosphate dehydrogenase 2 (G6PD3)",
                "Glucose-6-phosphate dehydrogenase X-linked (G6PDX)",
                "Phosphogluconate dehydrogenase (PGD2)",
                "Phosphogluconate dehydrogenase 3 (PGD3)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribose-5-phosphate isomerase A (RPIA2)",
                "Ribose-5-phosphate isomerase B (RPIBB)",
                "Ribulose-5-phosphate epimerase (RPE)",
                "Ribulose-5-phosphate-3-epimerase (RPE2)",
                "Ribulose-5-phosphate-3-epimerase-like 1 (RPE3L1)",
                "Transaldolase (TALDO1)",
                "Transaldolase 2 (TALDO2)",
                "Transaldolase 3 (TALDO3)",
                "Transketolase (TKT)",
                "Transketolase-like protein 1 (TKTL1)",
                "Transketolase-like protein 2 (TKTL2)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate dehydrogenase (G6PD)",
            "6-phosphogluconate dehydrogenase (PGD)",
            "Transketolase (TKT)",
            "Transaldolase (TALDO1)",
            "Ribose-5-phosphate isomerase (RPIA)",
            "Ribulose-5-phosphate 3-epimerase (RPPE)",
            "Phosphogluconate dehydrogenase (PGD)",
            "Phosphoriboisomerase (PRPS1)",
            "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
            "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
            "Glucose-6-phosphate 1-dehydrogenase (G6PD)",
            "6-phosphogluconate dehydrogenase, decarboxylating (PGD)",
            "Ribose-5-phosphate isomerase A (RPIA)",
            "Ribulose-5-phosphate 3-epimerase (RPPE)",
            "Transketolase (TKT1)",
            "Transaldolase (TALDO)",
            "Phosphoribosyl pyrophosphate synthetase 1-like 1 (PRPS1L1)",
            "Phosphoribosyl pyrophosphate synthetase 1-like 3 (PRPS1L3)",
            "Phosphoribosyl pyrophosphate synthetase 1-like 2 (PRPS1L2)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 1-like (PRPSAP1L)",
            "Phosphoribosyl pyrophosphate synthetase-associated protein 2-like (PRPSAP2L)",
            "Glucose-6-phosphate 1-dehydrogenase-like (G6PD-like)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "6-phosphogluconate dehydrogenase (PGD)",
                "Transketolase (TKT)",
                "Transaldolase (TALDO1)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribulose-5-phosphate 3-epimerase (RPPE)",
                "Phosphoriboisomerase (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
                "Glucose-6-phosphate 1-dehydrogenase (G6PD)",
                "6-phosphogluconate dehydrogenase, decarboxylating (PGD)",
                "Ribose-5-phosphate isomerase A (RPIA)",
                "Transketolase (TKT1)",
                "Transaldolase (TALDO)",
                "Phosphoribosyl pyrophosphate synthetase 1-like 1 (PRPS1L1)",
                "Phosphoribosyl pyrophosphate synthetase 1-like 3 (PRPS1L3)",
                "Phosphoribosyl pyrophosphate synthetase 1-like 2 (PRPS1L2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1-like (PRPSAP1L)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2-like (PRPSAP2L)",
                "Glucose-6-phosphate 1-dehydrogenase-like (G6PD-like)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-phosphogluconate dehydrogenase (PGD)",
                "6-phosphogluconate dehydrogenase, decarboxylating (PGD)",
                "Glucose-6-phosphate 1-dehydrogenase (G6PD)",
                "Glucose-6-phosphate 1-dehydrogenase-like (G6PD-like)",
                "Glucose-6-phosphate dehydrogenase (G6PD)",
                "Phosphogluconate dehydrogenase (PGD)",
                "Phosphoriboisomerase (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 1 (PRPS1)",
                "Phosphoribosyl pyrophosphate synthetase 1-like 1 (PRPS1L1)",
                "Phosphoribosyl pyrophosphate synthetase 1-like 2 (PRPS1L2)",
                "Phosphoribosyl pyrophosphate synthetase 1-like 3 (PRPS1L3)",
                "Phosphoribosyl pyrophosphate synthetase 2 (PRPS2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1 (PRPSAP1)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 1-like (PRPSAP1L)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2 (PRPSAP2)",
                "Phosphoribosyl pyrophosphate synthetase-associated protein 2-like (PRPSAP2L)",
                "Ribose-5-phosphate isomerase (RPIA)",
                "Ribose-5-phosphate isomerase A (RPIA)",
                "Ribulose-5-phosphate 3-epimerase (RPPE)",
                "Transaldolase (TALDO)",
                "Transaldolase (TALDO1)",
                "Transketolase (TKT)",
                "Transketolase (TKT1)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "G6PD (Glucose-6-phosphate dehydrogenase) gene",
            "Zwf1 (Zwfi) gene",
            "Gnd1 (Glucose-6-phosphate dehydrogenase) gene",
            "Tps1 (Transaldolase) gene",
            "Tpi1 (Triosephosphate isomerase) gene",
            "Rpe1 (Ribose-5-phosphate epimerase) gene",
            "Rpe2 (Ribose-5-phosphate epimerase) gene",
            "Gnd2 (Glucose-6-phosphate dehydrogenase) gene",
            "Zwf2 (Zwfi) gene",
            "Tps2 (Transaldolase) gene",
            "Tpi2 (Triosephosphate isomerase) gene",
            "Rpe3 (Ribose-5-phosphate epimerase) gene",
            "Rpe4 (Ribose-5-phosphate epimerase) gene",
            "G6PDH (Glucose-6-phosphate dehydrogenase) gene",
            "Zwf3 (Zwfi) gene",
            "Tps3 (Transaldolase) gene",
            "Tpi3 (Triosephosphate isomerase) gene",
            "Rpe5 (Ribose-5-phosphate epimerase) gene",
            "Rpe6 (Ribose-5-phosphate epimerase) gene",
            "G6PDH1 (Glucose-6-phosphate dehydrogenase) gene",
            "Zwf4 (Zwfi) gene",
            "Tps4 (Transaldolase) gene",
            "Tpi4 (Triosephosphate isomerase) gene",
            "Rpe7 (Ribose-5-phosphate epimerase) gene",
            "Rpe8 (Ribose-5-phosphate epimerase) gene",
            "G6PDH2 (Glucose-6-phosphate dehydrogenase) gene",
            "Zwf5 (Zwfi) gene"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "G6PD (Glucose-6-phosphate dehydrogenase) gene",
                "Zwf1 (Zwfi) gene",
                "Gnd1 (Glucose-6-phosphate dehydrogenase) gene",
                "Tps1 (Transaldolase) gene",
                "Tpi1 (Triosephosphate isomerase) gene",
                "Rpe1 (Ribose-5-phosphate epimerase) gene",
                "Rpe2 (Ribose-5-phosphate epimerase) gene",
                "Gnd2 (Glucose-6-phosphate dehydrogenase) gene",
                "Zwf2 (Zwfi) gene",
                "Tps2 (Transaldolase) gene",
                "Tpi2 (Triosephosphate isomerase) gene",
                "Rpe3 (Ribose-5-phosphate epimerase) gene",
                "Rpe4 (Ribose-5-phosphate epimerase) gene",
                "G6PDH (Glucose-6-phosphate dehydrogenase) gene",
                "Zwf3 (Zwfi) gene",
                "Tps3 (Transaldolase) gene",
                "Tpi3 (Triosephosphate isomerase) gene",
                "Rpe5 (Ribose-5-phosphate epimerase) gene",
                "Rpe6 (Ribose-5-phosphate epimerase) gene",
                "G6PDH1 (Glucose-6-phosphate dehydrogenase) gene",
                "Zwf4 (Zwfi) gene",
                "Tps4 (Transaldolase) gene",
                "Tpi4 (Triosephosphate isomerase) gene",
                "Rpe7 (Ribose-5-phosphate epimerase) gene"
            ],
            "mismatches": [
                "Rpe8 (Ribose-5-phosphate epimerase) gene",
                "G6PDH2 (Glucose-6-phosphate dehydrogenase) gene",
                "Zwf5 (Zwfi) gene"
            ],
            "true_referents": [
                "G6PD (Glucose-6-phosphate dehydrogenase) gene",
                "G6PDH (Glucose-6-phosphate dehydrogenase) gene",
                "G6PDH1 (Glucose-6-phosphate dehydrogenase) gene",
                "Gnd1 (Glucose-6-phosphate dehydrogenase) gene",
                "Gnd2 (Glucose-6-phosphate dehydrogenase) gene",
                "Rpe1 (Ribose-5-phosphate epimerase) gene",
                "Rpe2 (Ribose-5-phosphate epimerase) gene",
                "Rpe3 (Ribose-5-phosphate epimerase) gene",
                "Rpe4 (Ribose-5-phosphate epimerase) gene",
                "Rpe5 (Ribose-5-phosphate epimerase) gene",
                "Rpe6 (Ribose-5-phosphate epimerase) gene",
                "Rpe7 (Ribose-5-phosphate epimerase) gene",
                "Tpi1 (Triosephosphate isomerase) gene",
                "Tpi2 (Triosephosphate isomerase) gene",
                "Tpi3 (Triosephosphate isomerase) gene",
                "Tpi4 (Triosephosphate isomerase) gene",
                "Tps1 (Transaldolase) gene",
                "Tps2 (Transaldolase) gene",
                "Tps3 (Transaldolase) gene",
                "Tps4 (Transaldolase) gene",
                "Zwf1 (Zwfi) gene",
                "Zwf2 (Zwfi) gene",
                "Zwf3 (Zwfi) gene",
                "Zwf4 (Zwfi) gene"
            ],
            "TP": 24,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": [
            "RPE (RPE)",
            "RPI (RPI)",
            "TKT (TKT)",
            "TKTL1 (TKTL1)",
            "TKTL2 (TKTL2)",
            "G6PD (G6PD)",
            "PGD (PGD)",
            "PGAM1 (PGAM1)",
            "PGAM2 (PGAM2)",
            "ENO1 (ENO1)",
            "ENO2 (ENO2)",
            "ENO3 (ENO3)",
            "ENO4 (ENO4)",
            "PKLR (PKLR)",
            "PKM (PKM)",
            "GLPK (GLPK)",
            "H6PD (H6PD)",
            "GNPDA1 (GNPDA1)",
            "GNPDA2 (GNPDA2)",
            "GNPDA3 (GNPDA3)",
            "FLloquent (FLO)",
            "TALDO1 (TALDO1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "RPE (RPE)",
                "RPI (RPI)",
                "TKT (TKT)",
                "TKTL1 (TKTL1)",
                "TKTL2 (TKTL2)",
                "G6PD (G6PD)",
                "PGD (PGD)",
                "PGAM1 (PGAM1)",
                "PGAM2 (PGAM2)",
                "ENO1 (ENO1)",
                "ENO2 (ENO2)",
                "ENO3 (ENO3)",
                "ENO4 (ENO4)",
                "PKLR (PKLR)",
                "PKM (PKM)",
                "GLPK (GLPK)",
                "H6PD (H6PD)",
                "GNPDA1 (GNPDA1)",
                "GNPDA2 (GNPDA2)",
                "GNPDA3 (GNPDA3)",
                "FLloquent (FLO)",
                "TALDO1 (TALDO1)"
            ],
            "mismatches": [],
            "true_referents": [
                "ENO1 (ENO1)",
                "ENO2 (ENO2)",
                "ENO3 (ENO3)",
                "ENO4 (ENO4)",
                "FLloquent (FLO)",
                "G6PD (G6PD)",
                "GLPK (GLPK)",
                "GNPDA1 (GNPDA1)",
                "GNPDA2 (GNPDA2)",
                "GNPDA3 (GNPDA3)",
                "H6PD (H6PD)",
                "PGAM1 (PGAM1)",
                "PGAM2 (PGAM2)",
                "PGD (PGD)",
                "PKLR (PKLR)",
                "PKM (PKM)",
                "RPE (RPE)",
                "RPI (RPI)",
                "TALDO1 (TALDO1)",
                "TKT (TKT)",
                "TKTL1 (TKTL1)",
                "TKTL2 (TKTL2)"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "pentose phosphate pathway enzyme gene",
        "domain": "biology",
        "response": "[\n        {\n            \"Referent\": \"G6PDH\" (EC 1.1.1.49)\n        },\n        {\n            \"Referent\": \"TPI\" (EC 2.7.4.1)\n        },\n        {\n            \"Referent\": \"PGK\" (EC 2.7.2.3)\n        },\n        {\n            \"Referent\": \"PGAM\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"ENO1\" (EC 1.1.1.1)\n        },\n        {\n            \"Referent\": \"PYK\" (EC 2.7.1.40)\n        },\n        {\n            \"Referent\": \"PGAM2\" (EC 2.7.2.5)\n        },\n        {\n            \"Referent\": \"PGK2\" (EC 2.7.2.3)\n        },\n        {\n            \"Referent\": \"PGM1\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM2\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM3\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM4\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM5\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM6\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM7\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM8\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM9\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGD\" (EC 2.7.2.6)\n        },\n        {\n            \"Referent\": \"PGL\" (EC 2.7.2.6)\n        },\n        {\n            \"Referent\": \"PGM10\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM11\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM12\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM13\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM14\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM15\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM16\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM17\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM18\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM19\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM20\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM21\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM22\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM23\" (EC 2.7.2.4)\n        },\n        {\n            \"Referent\": \"PGM24\" (EC 2.7.2.4)\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]