[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Ribose-5-phosphate (R5P)",
            "Xylulose-5-phosphate (X5P)",
            "Ribulose-5-phosphate (Ru5P)",
            "Glyceraldehyde-3-phosphate (GAP)",
            "Erythrose-4-phosphate (E4P)",
            "Sedoheptulose-7-phosphate (S7P)",
            "Dihydroxyacetone phosphate (DHAP)",
            "Phosphoribosyl pyrophosphate (PRPP)",
            "Phosphoribose-1-phosphate (PR1P)",
            "Phosphoribose-2-phosphate (PR2P)",
            "5-Phosphoribosylamine (PRA)",
            "5-Amino-1-\u03b2-D-ribofuranosyl-imidazole-4-carboxamide (AICAR)",
            "5-Phosphoribosyl-5-amino-1-\u03b2-D-ribofuranosyl-imidazole-4-carboxamide (PRAICAR)",
            "5-Amino-4-deoxyribonucleotide (ADNR)",
            "5-Phosphoribosyl-5-amino-4-deoxyribonucleotide (PRA-DNR)",
            "5-Aminoimidazole ribonucleotide (AIR)",
            "5-Amino-4-imidazolyl-1-\u03b2-D-ribofuranosyl-2-methylaminomethanol (AICAR)",
            "5-Aminoimidazole-4-carboxamide ribonucleotide (AICA-riboside)",
            "5-Aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRPP)",
            "5-Aminoimidazole-4-carboxamide ribonucleotide (AICAR)",
            "5-Aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRP)",
            "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide (PRAICAR)",
            "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (PRAICAR-PRP)",
            "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ribose-5-phosphate (R5P)",
                "Xylulose-5-phosphate (X5P)",
                "Ribulose-5-phosphate (Ru5P)",
                "Glyceraldehyde-3-phosphate (GAP)",
                "Erythrose-4-phosphate (E4P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Phosphoribosyl pyrophosphate (PRPP)",
                "Phosphoribose-1-phosphate (PR1P)",
                "Phosphoribose-2-phosphate (PR2P)",
                "5-Phosphoribosylamine (PRA)",
                "5-Amino-1-\u03b2-D-ribofuranosyl-imidazole-4-carboxamide (AICAR)",
                "5-Phosphoribosyl-5-amino-1-\u03b2-D-ribofuranosyl-imidazole-4-carboxamide (PRAICAR)",
                "5-Amino-4-deoxyribonucleotide (ADNR)",
                "5-Phosphoribosyl-5-amino-4-deoxyribonucleotide (PRA-DNR)",
                "5-Aminoimidazole ribonucleotide (AIR)",
                "5-Amino-4-imidazolyl-1-\u03b2-D-ribofuranosyl-2-methylaminomethanol (AICAR)",
                "5-Aminoimidazole-4-carboxamide ribonucleotide (AICA-riboside)",
                "5-Aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRPP)",
                "5-Aminoimidazole-4-carboxamide ribonucleotide (AICAR)",
                "5-Aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRP)",
                "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide (PRAICAR)",
                "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (PRAICAR-PRP)",
                "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRP)"
            ],
            "mismatches": [],
            "true_referents": [
                "5-Amino-1-\u03b2-D-ribofuranosyl-imidazole-4-carboxamide (AICAR)",
                "5-Amino-4-deoxyribonucleotide (ADNR)",
                "5-Amino-4-imidazolyl-1-\u03b2-D-ribofuranosyl-2-methylaminomethanol (AICAR)",
                "5-Aminoimidazole ribonucleotide (AIR)",
                "5-Aminoimidazole-4-carboxamide ribonucleotide (AICA-riboside)",
                "5-Aminoimidazole-4-carboxamide ribonucleotide (AICAR)",
                "5-Aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRP)",
                "5-Aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRPP)",
                "5-Phosphoribosyl-5-amino-1-\u03b2-D-ribofuranosyl-imidazole-4-carboxamide (PRAICAR)",
                "5-Phosphoribosyl-5-amino-4-deoxyribonucleotide (PRA-DNR)",
                "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide (PRAICAR)",
                "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (AICA-PRP)",
                "5-Phosphoribosyl-5-aminoimidazole-4-carboxamide-1-\u03b2-D-ribofuranosyl-5-phosphate (PRAICAR-PRP)",
                "5-Phosphoribosylamine (PRA)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose-4-phosphate (E4P)",
                "Glyceraldehyde-3-phosphate (GAP)",
                "Phosphoribose-1-phosphate (PR1P)",
                "Phosphoribose-2-phosphate (PR2P)",
                "Phosphoribosyl pyrophosphate (PRPP)",
                "Ribose-5-phosphate (R5P)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Xylulose-5-phosphate (X5P)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Ribose-5-phosphate (R5P)",
            "Ribulose-5-phosphate (Ru5P)",
            "Xylulose-5-phosphate (Xu5P)",
            "Sedoheptulose-7-phosphate (S7P)",
            "Glyceraldehyde-3-phosphate (G3P)",
            "Erythrose-4-phosphate (E4P)",
            "Fructose-6-phosphate (F6P)",
            "Glucose-6-phosphate (G6P)",
            "6-Phosphogluconolactone (6PGL)",
            "6-Phosphogluconate (6PG)",
            "Ribulose-1,5-bisphosphate (RuBP)",
            "Sedoheptulose-1,7-bisphosphate (S1,7BP)",
            "Fru-6-P (F6P)",
            "Gluconate-6-phosphate (G6P)",
            "Ribose-1-phosphate (R1P)",
            "Xylulose-1-phosphate (Xu1P)",
            "Ribose-1,5-bisphosphate (R1,5BP)",
            "Sedoheptulose-1,7-bisphosphate (S1,7BP)",
            "Fructose-1,6-bisphosphate (F1,6BP)",
            "Glyceraldehyde-1-phosphate (G1P)",
            "Erythrose-4-phosphate (E4P)",
            "Ribulose-1,5-bisphosphate (RuBP)",
            "Transketolase intermediate",
            "Transaldolase intermediate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ribose-5-phosphate (R5P)",
                "Ribulose-5-phosphate (Ru5P)",
                "Xylulose-5-phosphate (Xu5P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-6-phosphate (F6P)",
                "Glucose-6-phosphate (G6P)",
                "6-Phosphogluconolactone (6PGL)",
                "6-Phosphogluconate (6PG)",
                "Ribulose-1,5-bisphosphate (RuBP)",
                "Sedoheptulose-1,7-bisphosphate (S1,7BP)",
                "Fru-6-P (F6P)",
                "Ribose-1-phosphate (R1P)",
                "Xylulose-1-phosphate (Xu1P)",
                "Ribose-1,5-bisphosphate (R1,5BP)",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Glyceraldehyde-1-phosphate (G1P)",
                "Transketolase intermediate",
                "Transaldolase intermediate"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate (6PG)",
                "6-Phosphogluconolactone (6PGL)",
                "Erythrose-4-phosphate (E4P)",
                "Fru-6-P (F6P)",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Fructose-6-phosphate (F6P)",
                "Gluconate-6-phosphate (G6P)",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde-1-phosphate (G1P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Ribose-1,5-bisphosphate (R1,5BP)",
                "Ribose-1-phosphate (R1P)",
                "Ribose-5-phosphate (R5P)",
                "Ribulose-1,5-bisphosphate (RuBP)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sedoheptulose-1,7-bisphosphate (S1,7BP)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Transaldolase intermediate",
                "Transketolase intermediate",
                "Xylulose-1-phosphate (Xu1P)",
                "Xylulose-5-phosphate (Xu5P)"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose 6-phosphate (G6P)",
            "6-Phosphogluconolactone",
            "6-Phosphogluconate",
            "Ribulose 5-phosphate",
            "Ribose 5-phosphate (R5P)",
            "Xylulose 5-phosphate (Xu5P)",
            "Sedoheptulose 7-phosphate",
            "Sedoheptulose 1,7-bisphosphate",
            "Erythrose 4-phosphate",
            "Glyceraldehyde 3-phosphate (G3P)",
            "Fructose 6-phosphate (F6P)",
            "Fructose 1,6-bisphosphate (F1,6BP)",
            "Dihydroxyacetone phosphate (DHAP)",
            "NADPH",
            "NADP+",
            "Ribose 5-phosphate isomerase",
            "Ribulose 5-phosphate 3-epimerase",
            "Transketolase",
            "Transaldolase",
            "Glucose 6-phosphate dehydrogenase",
            "6-Phosphogluconate dehydrogenase",
            "Phosphopentose isomerase",
            "Phosphopentose epimerase",
            "Phosphoribulokinase"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose 6-phosphate (G6P)",
                "6-Phosphogluconolactone",
                "6-Phosphogluconate",
                "Ribulose 5-phosphate",
                "Ribose 5-phosphate (R5P)",
                "Xylulose 5-phosphate (Xu5P)",
                "Sedoheptulose 7-phosphate",
                "Sedoheptulose 1,7-bisphosphate",
                "Erythrose 4-phosphate",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Fructose 6-phosphate (F6P)",
                "Fructose 1,6-bisphosphate (F1,6BP)",
                "Dihydroxyacetone phosphate (DHAP)",
                "NADPH",
                "NADP+",
                "Ribose 5-phosphate isomerase",
                "Ribulose 5-phosphate 3-epimerase",
                "Transketolase",
                "Transaldolase",
                "Glucose 6-phosphate dehydrogenase",
                "6-Phosphogluconate dehydrogenase",
                "Phosphopentose isomerase",
                "Phosphopentose epimerase",
                "Phosphoribulokinase"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate",
                "6-Phosphogluconate dehydrogenase",
                "6-Phosphogluconolactone",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose 4-phosphate",
                "Fructose 1,6-bisphosphate (F1,6BP)",
                "Fructose 6-phosphate (F6P)",
                "Glucose 6-phosphate (G6P)",
                "Glucose 6-phosphate dehydrogenase",
                "Glyceraldehyde 3-phosphate (G3P)",
                "NADP+",
                "NADPH",
                "Phosphopentose epimerase",
                "Phosphopentose isomerase",
                "Phosphoribulokinase",
                "Ribose 5-phosphate (R5P)",
                "Ribose 5-phosphate isomerase",
                "Ribulose 5-phosphate",
                "Ribulose 5-phosphate 3-epimerase",
                "Sedoheptulose 1,7-bisphosphate",
                "Sedoheptulose 7-phosphate",
                "Transaldolase",
                "Transketolase",
                "Xylulose 5-phosphate (Xu5P)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate (G6P)",
            "6-Phosphoglucono-\u03b4-lactone (6-PGL)",
            "6-Phosphogluconate (6-PG)",
            "Ribulose-5-phosphate (Ru5P)",
            "Xylulose-5-phosphate (Xu5P)",
            "Ribose-5-phosphate (R5P)",
            "Fructose-6-phosphate (F6P)",
            "Glyceraldehyde-3-phosphate (G3P)",
            "Erythrose-4-phosphate (E4P)",
            "Sedoheptulose-1,7-bisphosphate (S7P)",
            "Glycerone phosphate (GlyP)",
            "Dihydroxyacetone phosphate (DHAP)",
            "Transketolase-bound hydroxymethylthiamine pyrophosphate (TK-HMPP)",
            "Phosphoribosyl pyrophosphate (PRPP)",
            "5-Phosphoribosyl-1-pyrophosphate (PRPP)",
            "NADP+ (oxidized nicotinamide adenine dinucleotide phosphate)",
            "NADPH (reduced nicotinamide adenine dinucleotide phosphate)",
            "Glucose-1-phosphate (G1P)",
            "Fructose-1,6-bisphosphate (F1,6BP)",
            "Mannose-6-phosphate (M6P)",
            "Sedoheptulose-1-phosphate (S1P)",
            "Ribulose-1,5-bisphosphate (Ru1,5BP)",
            "Xylitol-5-phosphate (X5P)",
            "2-Deoxyribose-5-phosphate (dRib5P)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate (G6P)",
                "6-Phosphoglucono-\u03b4-lactone (6-PGL)",
                "6-Phosphogluconate (6-PG)",
                "Ribulose-5-phosphate (Ru5P)",
                "Xylulose-5-phosphate (Xu5P)",
                "Ribose-5-phosphate (R5P)",
                "Fructose-6-phosphate (F6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Erythrose-4-phosphate (E4P)",
                "Sedoheptulose-1,7-bisphosphate (S7P)",
                "Glycerone phosphate (GlyP)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Transketolase-bound hydroxymethylthiamine pyrophosphate (TK-HMPP)",
                "Phosphoribosyl pyrophosphate (PRPP)",
                "5-Phosphoribosyl-1-pyrophosphate (PRPP)",
                "NADP+ (oxidized nicotinamide adenine dinucleotide phosphate)",
                "NADPH (reduced nicotinamide adenine dinucleotide phosphate)",
                "Glucose-1-phosphate (G1P)",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Mannose-6-phosphate (M6P)",
                "Sedoheptulose-1-phosphate (S1P)",
                "Ribulose-1,5-bisphosphate (Ru1,5BP)",
                "Xylitol-5-phosphate (X5P)",
                "2-Deoxyribose-5-phosphate (dRib5P)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Deoxyribose-5-phosphate (dRib5P)",
                "5-Phosphoribosyl-1-pyrophosphate (PRPP)",
                "6-Phosphogluconate (6-PG)",
                "6-Phosphoglucono-\u03b4-lactone (6-PGL)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Fructose-6-phosphate (F6P)",
                "Glucose-1-phosphate (G1P)",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Glycerone phosphate (GlyP)",
                "Mannose-6-phosphate (M6P)",
                "NADP+ (oxidized nicotinamide adenine dinucleotide phosphate)",
                "NADPH (reduced nicotinamide adenine dinucleotide phosphate)",
                "Phosphoribosyl pyrophosphate (PRPP)",
                "Ribose-5-phosphate (R5P)",
                "Ribulose-1,5-bisphosphate (Ru1,5BP)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sedoheptulose-1,7-bisphosphate (S7P)",
                "Sedoheptulose-1-phosphate (S1P)",
                "Transketolase-bound hydroxymethylthiamine pyrophosphate (TK-HMPP)",
                "Xylitol-5-phosphate (X5P)",
                "Xylulose-5-phosphate (Xu5P)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate (G6P)",
            "6-Phosphoglucono-\u03b4-lactone",
            "6-Phosphogluconate",
            "Ribulose-5-phosphate (Ru5P)",
            "Ribose-5-phosphate (R5P)",
            "Xylulose-5-phosphate (Xu5P)",
            "Sedoheptulose-7-phosphate (S7P)",
            "Erythrose-4-phosphate (E4P)",
            "Fructose-6-phosphate (F6P)",
            "Glyceraldehyde-3-phosphate (G3P)",
            "NADPH",
            "NADP+",
            "CO2",
            "Transketolase",
            "Transaldolase",
            "3-Phosphoglycerate (3PG)",
            "Fructose-1,6-bisphosphate (F1,6BP)",
            "Dihydroxyacetone phosphate (DHAP)",
            "1,3-Bisphosphoglycerate (1,3BPG)",
            "2-Phosphoglycerate (2PG)",
            "Phosphoenolpyruvate (PEP)",
            "Pyruvate",
            "Lactate",
            "Gluconolactone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate (G6P)",
                "6-Phosphoglucono-\u03b4-lactone",
                "6-Phosphogluconate",
                "Ribulose-5-phosphate (Ru5P)",
                "Ribose-5-phosphate (R5P)",
                "Xylulose-5-phosphate (Xu5P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-6-phosphate (F6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "NADPH",
                "NADP+",
                "CO2",
                "Transketolase",
                "Transaldolase",
                "3-Phosphoglycerate (3PG)",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Dihydroxyacetone phosphate (DHAP)",
                "1,3-Bisphosphoglycerate (1,3BPG)",
                "2-Phosphoglycerate (2PG)",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate",
                "Lactate"
            ],
            "mismatches": [
                "Gluconolactone"
            ],
            "true_referents": [
                "1,3-Bisphosphoglycerate (1,3BPG)",
                "2-Phosphoglycerate (2PG)",
                "3-Phosphoglycerate (3PG)",
                "6-Phosphogluconate",
                "6-Phosphoglucono-\u03b4-lactone",
                "CO2",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Fructose-6-phosphate (F6P)",
                "Gluconolactone",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Lactate",
                "NADP+",
                "NADPH",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate",
                "Ribose-5-phosphate (R5P)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Transaldolase",
                "Transketolase",
                "Xylulose-5-phosphate (Xu5P)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate (G6P)",
            "6-Phosphogluconate (6PG)",
            "Ribulose-5-phosphate (Ru5P)",
            "Ribose-5-phosphate (R5P)",
            "Xylulose-5-phosphate (Xu5P)",
            "Erythrose-4-phosphate (E4P)",
            "Sedulose-7-phosphate (S7P)",
            "Fructose-6-phosphate (F6P)",
            "Glyceraldehyde-3-phosphate (G3P)",
            "Dihydroxyacetone phosphate (DHAP)",
            "NADPH (NADPH)",
            "NADP+ (NADP)",
            "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
            "Transaldolase product (TAP)",
            "Transketolase product (TKP)",
            "3-Phosphoglycerate (3PG)",
            "Phosphoenolpyruvate (PEP)",
            "Adenosine triphosphate (ATP)",
            "Adenosine diphosphate (ADP)",
            "Nicotinamide adenine dinucleotide (NAD)",
            "Coenzyme A (CoA)",
            "Acetyl-CoA (AcCoA)",
            "Pyruvate (Pyr)",
            "Lactate (Lac)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate (G6P)",
                "6-Phosphogluconate (6PG)",
                "Ribulose-5-phosphate (Ru5P)",
                "Ribose-5-phosphate (R5P)",
                "Xylulose-5-phosphate (Xu5P)",
                "Erythrose-4-phosphate (E4P)",
                "Sedulose-7-phosphate (S7P)",
                "Fructose-6-phosphate (F6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Dihydroxyacetone phosphate (DHAP)",
                "NADPH (NADPH)",
                "NADP+ (NADP)",
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "Transaldolase product (TAP)",
                "Transketolase product (TKP)",
                "3-Phosphoglycerate (3PG)",
                "Phosphoenolpyruvate (PEP)",
                "Adenosine triphosphate (ATP)",
                "Adenosine diphosphate (ADP)",
                "Nicotinamide adenine dinucleotide (NAD)",
                "Coenzyme A (CoA)",
                "Acetyl-CoA (AcCoA)",
                "Pyruvate (Pyr)",
                "Lactate (Lac)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "3-Phosphoglycerate (3PG)",
                "6-Phosphogluconate (6PG)",
                "Acetyl-CoA (AcCoA)",
                "Adenosine diphosphate (ADP)",
                "Adenosine triphosphate (ATP)",
                "Coenzyme A (CoA)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-6-phosphate (F6P)",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Lactate (Lac)",
                "NADP+ (NADP)",
                "NADPH (NADPH)",
                "Nicotinamide adenine dinucleotide (NAD)",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate (Pyr)",
                "Ribose-5-phosphate (R5P)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sedulose-7-phosphate (S7P)",
                "Transaldolase product (TAP)",
                "Transketolase product (TKP)",
                "Xylulose-5-phosphate (Xu5P)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate (G6P)",
            "6-Phosphoglucono-\u03b4-lactone (6PGL)",
            "6-Phosphogluconate (6PG)",
            "Ribulose 5-phosphate (Ru5P)",
            "Xylulose 5-phosphate (Xu5P)",
            "Sedoheptulose 7-phosphate (S7P)",
            "Erythrose 4-phosphate (E4P)",
            "Glyceraldehyde 3-phosphate (G3P)",
            "Fructose 6-phosphate (F6P)",
            "Ribose 5-phosphate (R5P)",
            "Dihydroxyacetone phosphate (DHAP)",
            "Glucono-1,5-lactone 6-phosphate",
            "3-Keto-6-phosphogluconate",
            "2-Keto-3-deoxy-6-phosphogluconate",
            "1,3-Bisphosphoglycerate (1,3BPG)",
            "3-Phosphoglycerate (3PG)",
            "2-Phosphoglycerate (2PG)",
            "Phosphoenolpyruvate (PEP)",
            "Pyruvate",
            "Acetyl-CoA",
            "Citrate",
            "Isocitrate",
            "\u03b1-Ketoglutarate (\u03b1KG)",
            "Succinyl-CoA"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate (G6P)",
                "6-Phosphoglucono-\u03b4-lactone (6PGL)",
                "6-Phosphogluconate (6PG)",
                "Ribulose 5-phosphate (Ru5P)",
                "Xylulose 5-phosphate (Xu5P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Erythrose 4-phosphate (E4P)",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Fructose 6-phosphate (F6P)",
                "Ribose 5-phosphate (R5P)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Glucono-1,5-lactone 6-phosphate",
                "3-Keto-6-phosphogluconate",
                "2-Keto-3-deoxy-6-phosphogluconate",
                "1,3-Bisphosphoglycerate (1,3BPG)",
                "3-Phosphoglycerate (3PG)",
                "2-Phosphoglycerate (2PG)",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate",
                "Acetyl-CoA",
                "Citrate",
                "Isocitrate",
                "\u03b1-Ketoglutarate (\u03b1KG)",
                "Succinyl-CoA"
            ],
            "mismatches": [],
            "true_referents": [
                "1,3-Bisphosphoglycerate (1,3BPG)",
                "2-Keto-3-deoxy-6-phosphogluconate",
                "2-Phosphoglycerate (2PG)",
                "3-Keto-6-phosphogluconate",
                "3-Phosphoglycerate (3PG)",
                "6-Phosphogluconate (6PG)",
                "6-Phosphoglucono-\u03b4-lactone (6PGL)",
                "Acetyl-CoA",
                "Citrate",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose 4-phosphate (E4P)",
                "Fructose 6-phosphate (F6P)",
                "Glucono-1,5-lactone 6-phosphate",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Isocitrate",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate",
                "Ribose 5-phosphate (R5P)",
                "Ribulose 5-phosphate (Ru5P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Succinyl-CoA",
                "Xylulose 5-phosphate (Xu5P)",
                "\u03b1-Ketoglutarate (\u03b1KG)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate (G6P)",
            "6-Phosphogluconolactone (6PGL)",
            "6-Phosphogluconate (6PG)",
            "Ribulose-5-phosphate (Ru5P)",
            "Ribose-5-phosphate (R5P)",
            "Xylulose-5-phosphate (Xu5P)",
            "Sedoheptulose-7-phosphate (S7P)",
            "Erythrose-4-phosphate (E4P)",
            "Fructose-6-phosphate (F6P)",
            "Glyceraldehyde-3-phosphate (G3P)",
            "Dihydroxyacetone phosphate (DHAP)",
            "Sedoheptulose-1,7-bisphosphate (S17BP)",
            "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
            "Phosphogluconate dehydrogenase (PGD)",
            "Transketolase (TKT)",
            "Transaldolase (TAL)",
            "Ribose-phosphate pyrophosphokinase (PRPS)",
            "Phosphoribosyl pyrophosphate (PRPP)",
            "NADPH",
            "NADP+",
            "Glucose-1-phosphate (G1P)",
            "Fructose-1,6-bisphosphate (F16BP)",
            "Phosphogluconolactonase (PGLS)",
            "Ribose-1-phosphate (R1P)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate (G6P)",
                "6-Phosphogluconolactone (6PGL)",
                "6-Phosphogluconate (6PG)",
                "Ribulose-5-phosphate (Ru5P)",
                "Ribose-5-phosphate (R5P)",
                "Xylulose-5-phosphate (Xu5P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-6-phosphate (F6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Sedoheptulose-1,7-bisphosphate (S17BP)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "Phosphogluconate dehydrogenase (PGD)",
                "Transketolase (TKT)",
                "Transaldolase (TAL)",
                "Ribose-phosphate pyrophosphokinase (PRPS)",
                "Phosphoribosyl pyrophosphate (PRPP)",
                "NADPH",
                "NADP+",
                "Glucose-1-phosphate (G1P)",
                "Fructose-1,6-bisphosphate (F16BP)",
                "Phosphogluconolactonase (PGLS)",
                "Ribose-1-phosphate (R1P)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phosphogluconate (6PG)",
                "6-Phosphogluconolactone (6PGL)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose-4-phosphate (E4P)",
                "Fructose-1,6-bisphosphate (F16BP)",
                "Fructose-6-phosphate (F6P)",
                "Glucose-1-phosphate (G1P)",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Glyceraldehyde-3-phosphate dehydrogenase (GAPDH)",
                "NADP+",
                "NADPH",
                "Phosphogluconate dehydrogenase (PGD)",
                "Phosphogluconolactonase (PGLS)",
                "Phosphoribosyl pyrophosphate (PRPP)",
                "Ribose-1-phosphate (R1P)",
                "Ribose-5-phosphate (R5P)",
                "Ribose-phosphate pyrophosphokinase (PRPS)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sedoheptulose-1,7-bisphosphate (S17BP)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Transaldolase (TAL)",
                "Transketolase (TKT)",
                "Xylulose-5-phosphate (Xu5P)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose-6-phosphate (G6P)",
            "6-Phosphogluconolactone (6PGL)",
            "6-Phosphogluconate (6PG)",
            "Ribulose-5-phosphate (Ru5P)",
            "Ribose-5-phosphate (R5P)",
            "Xylulose-5-phosphate (Xu5P)",
            "Erythrose-4-phosphate (E4P)",
            "Sedoheptulose-7-phosphate (S7P)",
            "Fructose-6-phosphate (F6P)",
            "Glyceraldehyde-3-phosphate (G3P)",
            "Dihydroxyacetone phosphate (DHAP)",
            "Sedoheptulose-1,7-bisphosphate",
            "Erythrulose-4-phosphate",
            "Tagatose-6-phosphate",
            "Fructose-1,6-bisphosphate (F1,6BP)",
            "Sediroheptulose-7-phosphate",
            "Ribose-1,5-bisphosphate",
            "D-Xylulose-5-phosphate",
            "L-Xylulose-5-phosphate",
            "Sedoheptulose-1,7-bisphosphate",
            "Allulose-6-phosphate",
            "Mannoheptulose-7-phosphate",
            "Psychosose-6-phosphate",
            "Neohorsefuranose-5-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose-6-phosphate (G6P)",
                "6-Phosphogluconolactone (6PGL)",
                "6-Phosphogluconate (6PG)",
                "Ribulose-5-phosphate (Ru5P)",
                "Ribose-5-phosphate (R5P)",
                "Xylulose-5-phosphate (Xu5P)",
                "Erythrose-4-phosphate (E4P)",
                "Sedoheptulose-7-phosphate (S7P)",
                "Fructose-6-phosphate (F6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Sedoheptulose-1,7-bisphosphate",
                "Erythrulose-4-phosphate",
                "Tagatose-6-phosphate",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Ribose-1,5-bisphosphate",
                "D-Xylulose-5-phosphate",
                "L-Xylulose-5-phosphate",
                "Allulose-6-phosphate",
                "Mannoheptulose-7-phosphate",
                "Psychosose-6-phosphate",
                "Neohorsefuranose-5-phosphate"
            ],
            "mismatches": [
                "Sediroheptulose-7-phosphate"
            ],
            "true_referents": [
                "6-Phosphogluconate (6PG)",
                "6-Phosphogluconolactone (6PGL)",
                "Allulose-6-phosphate",
                "D-Xylulose-5-phosphate",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose-4-phosphate (E4P)",
                "Erythrulose-4-phosphate",
                "Fructose-1,6-bisphosphate (F1,6BP)",
                "Fructose-6-phosphate (F6P)",
                "Glucose-6-phosphate (G6P)",
                "Glyceraldehyde-3-phosphate (G3P)",
                "L-Xylulose-5-phosphate",
                "Mannoheptulose-7-phosphate",
                "Neohorsefuranose-5-phosphate",
                "Psychosose-6-phosphate",
                "Ribose-1,5-bisphosphate",
                "Ribose-5-phosphate (R5P)",
                "Ribulose-5-phosphate (Ru5P)",
                "Sediroheptulose-7-phosphate",
                "Sedoheptulose-1,7-bisphosphate",
                "Sedoheptulose-7-phosphate (S7P)",
                "Tagatose-6-phosphate",
                "Xylulose-5-phosphate (Xu5P)"
            ],
            "TP": 22,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Glucose 6-phosphate (G6P)",
            "6-Phosphogluconolactone",
            "6-Phosphogluconate",
            "Ribulose 5-phosphate (Ru5P)",
            "Ribose 5-phosphate (R5P)",
            "Xylulose 5-phosphate (X5P)",
            "Sedoheptulose 7-phosphate (S7P)",
            "Erythrose 4-phosphate (E4P)",
            "Glyceraldehyde 3-phosphate (GAP)",
            "Fructose 6-phosphate (F6P)",
            "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
            "Glucono-1,5-lactone 6-phosphate",
            "Gluconate 6-phosphate",
            "Ribulose 1,5-bisphosphate",
            "Arabinose 5-phosphate",
            "Octulose 8-phosphate",
            "Nonulose 9-phosphate",
            "Glucosamine 6-phosphate",
            "N-Acetylglucosamine 6-phosphate",
            "Mannose 6-phosphate",
            "Fructose 1,6-bisphosphate",
            "Dihydroxyacetone phosphate (DHAP)",
            "2-Deoxy-D-ribose 5-phosphate",
            "Deoxyribose 5-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glucose 6-phosphate (G6P)",
                "6-Phosphogluconolactone",
                "6-Phosphogluconate",
                "Ribulose 5-phosphate (Ru5P)",
                "Ribose 5-phosphate (R5P)",
                "Xylulose 5-phosphate (X5P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Erythrose 4-phosphate (E4P)",
                "Glyceraldehyde 3-phosphate (GAP)",
                "Fructose 6-phosphate (F6P)",
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "Glucono-1,5-lactone 6-phosphate",
                "Gluconate 6-phosphate",
                "Ribulose 1,5-bisphosphate",
                "Arabinose 5-phosphate",
                "Octulose 8-phosphate",
                "Nonulose 9-phosphate",
                "Glucosamine 6-phosphate",
                "N-Acetylglucosamine 6-phosphate",
                "Mannose 6-phosphate",
                "Fructose 1,6-bisphosphate",
                "Dihydroxyacetone phosphate (DHAP)",
                "2-Deoxy-D-ribose 5-phosphate",
                "Deoxyribose 5-phosphate"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Deoxy-D-ribose 5-phosphate",
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "6-Phosphogluconate",
                "6-Phosphogluconolactone",
                "Arabinose 5-phosphate",
                "Deoxyribose 5-phosphate",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrose 4-phosphate (E4P)",
                "Fructose 1,6-bisphosphate",
                "Fructose 6-phosphate (F6P)",
                "Gluconate 6-phosphate",
                "Glucono-1,5-lactone 6-phosphate",
                "Glucosamine 6-phosphate",
                "Glucose 6-phosphate (G6P)",
                "Glyceraldehyde 3-phosphate (GAP)",
                "Mannose 6-phosphate",
                "N-Acetylglucosamine 6-phosphate",
                "Nonulose 9-phosphate",
                "Octulose 8-phosphate",
                "Ribose 5-phosphate (R5P)",
                "Ribulose 1,5-bisphosphate",
                "Ribulose 5-phosphate (Ru5P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Xylulose 5-phosphate (X5P)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "D-Glucose 6-phosphate (G6P)",
            "D-Fructose 6-phosphate (F6P)",
            "D-Glucono-1,5-lactone 6-phosphate",
            "6-Phospho-D-gluconate (6PG)",
            "D-Ribulose 5-phosphate (Ru5P)",
            "D-Ribose 5-phosphate (R5P)",
            "D-Xylulose 5-phosphate (Xu5P)",
            "D-Sedoheptulose 7-phosphate (S7P)",
            "D-Erythrose 4-phosphate (E4P)",
            "D-Glyceraldehyde 3-phosphate (GAP)",
            "\u03b2-D-Fructose 1,6-bisphosphate (FBP)",
            "Dihydroxyacetone phosphate (DHAP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-Glucose 6-phosphate (G6P)",
                "D-Fructose 6-phosphate (F6P)",
                "D-Glucono-1,5-lactone 6-phosphate",
                "6-Phospho-D-gluconate (6PG)",
                "D-Ribulose 5-phosphate (Ru5P)",
                "D-Ribose 5-phosphate (R5P)",
                "D-Xylulose 5-phosphate (Xu5P)",
                "D-Sedoheptulose 7-phosphate (S7P)",
                "D-Erythrose 4-phosphate (E4P)",
                "D-Glyceraldehyde 3-phosphate (GAP)",
                "\u03b2-D-Fructose 1,6-bisphosphate (FBP)",
                "Dihydroxyacetone phosphate (DHAP)"
            ],
            "mismatches": [],
            "true_referents": [
                "6-Phospho-D-gluconate (6PG)",
                "D-Erythrose 4-phosphate (E4P)",
                "D-Fructose 6-phosphate (F6P)",
                "D-Glucono-1,5-lactone 6-phosphate",
                "D-Glucose 6-phosphate (G6P)",
                "D-Glyceraldehyde 3-phosphate (GAP)",
                "D-Ribose 5-phosphate (R5P)",
                "D-Ribulose 5-phosphate (Ru5P)",
                "D-Sedoheptulose 7-phosphate (S7P)",
                "D-Xylulose 5-phosphate (Xu5P)",
                "Dihydroxyacetone phosphate (DHAP)",
                "\u03b2-D-Fructose 1,6-bisphosphate (FBP)"
            ],
            "TP": 12,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "D-Ribulose 5-phosphate (Ru5P)",
            "D-Ribose 5-phosphate (R5P)",
            "D-Xylulose 5-phosphate (Xu5P)",
            "Sedoheptulose 7-phosphate (S7P)",
            "Erythrose 4-phosphate (E4P)",
            "Glyceraldehyde 3-phosphate (G3P)",
            "Fructose 6-phosphate (F6P)",
            "Glucose 6-phosphate (G6P)",
            "6-Phosphogluconolactone (6PGL)",
            "6-Phosphogluconate (6PG)",
            "Ribulose 1,5-bisphosphate (RuBP)",
            "3-Phosphoglycerate (3PG)",
            "2-Phosphoglycolate (2PG)",
            "Phosphoenolpyruvate (PEP)",
            "Acetyl-CoA",
            "Pyruvate",
            "Oxaloacetate",
            "\u03b1-Ketoglutarate",
            "Succinyl-CoA",
            "Fumarate",
            "Malate",
            "Isocitrate",
            "Citrate",
            "cis-Aconitate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-Ribulose 5-phosphate (Ru5P)",
                "D-Ribose 5-phosphate (R5P)",
                "D-Xylulose 5-phosphate (Xu5P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Erythrose 4-phosphate (E4P)",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Fructose 6-phosphate (F6P)",
                "Glucose 6-phosphate (G6P)",
                "6-Phosphogluconolactone (6PGL)",
                "6-Phosphogluconate (6PG)",
                "Ribulose 1,5-bisphosphate (RuBP)",
                "3-Phosphoglycerate (3PG)",
                "2-Phosphoglycolate (2PG)",
                "Phosphoenolpyruvate (PEP)",
                "Acetyl-CoA",
                "Pyruvate",
                "Oxaloacetate",
                "\u03b1-Ketoglutarate",
                "Succinyl-CoA",
                "Fumarate",
                "Malate",
                "Isocitrate",
                "Citrate",
                "cis-Aconitate"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Phosphoglycolate (2PG)",
                "3-Phosphoglycerate (3PG)",
                "6-Phosphogluconate (6PG)",
                "6-Phosphogluconolactone (6PGL)",
                "Acetyl-CoA",
                "Citrate",
                "D-Ribose 5-phosphate (R5P)",
                "D-Ribulose 5-phosphate (Ru5P)",
                "D-Xylulose 5-phosphate (Xu5P)",
                "Erythrose 4-phosphate (E4P)",
                "Fructose 6-phosphate (F6P)",
                "Fumarate",
                "Glucose 6-phosphate (G6P)",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Isocitrate",
                "Malate",
                "Oxaloacetate",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate",
                "Ribulose 1,5-bisphosphate (RuBP)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Succinyl-CoA",
                "cis-Aconitate",
                "\u03b1-Ketoglutarate"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "Ribose 5-phosphate (R5P)",
            "Ribulose 5-phosphate (Ru5P)",
            "Xylulose 5-phosphate (X5P)",
            "Erythrulose 4-phosphate (E4P)",
            "Sedoheptulose 7-phosphate (S7P)",
            "Glyceraldehyde 3-phosphate (G3P)",
            "Fructose 6-phosphate (F6P)",
            "6-Phosphogluconate (6PG)",
            "6-Phosphogluconolactone (6PGL)",
            "Glucose 6-phosphate (G6P)",
            "Glucono-1,5-lactone 6-phosphate (GL6P)",
            "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
            "2-Dehydro-3-deoxy-6-phosphogluconate (DDPG)",
            "Dihydroxyacetone phosphate (DHAP)",
            "Phosphoenolpyruvate (PEP)",
            "Pyruvate (Pyr)",
            "Acetyl-CoA (AcCoA)",
            "Oxaloacetate (OAA)",
            "Citrate (Cit)",
            "Isocitrate (ICit)",
            "\u03b1-Ketoglutarate (\u03b1-KG)",
            "Succinyl-CoA (SucCoA)",
            "Succinate (Suc)",
            "Fumarate (Fum)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ribose 5-phosphate (R5P)",
                "Ribulose 5-phosphate (Ru5P)",
                "Xylulose 5-phosphate (X5P)",
                "Erythrulose 4-phosphate (E4P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Fructose 6-phosphate (F6P)",
                "6-Phosphogluconate (6PG)",
                "6-Phosphogluconolactone (6PGL)",
                "Glucose 6-phosphate (G6P)",
                "Glucono-1,5-lactone 6-phosphate (GL6P)",
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "2-Dehydro-3-deoxy-6-phosphogluconate (DDPG)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate (Pyr)",
                "Acetyl-CoA (AcCoA)",
                "Oxaloacetate (OAA)",
                "Citrate (Cit)",
                "Isocitrate (ICit)",
                "\u03b1-Ketoglutarate (\u03b1-KG)",
                "Succinyl-CoA (SucCoA)",
                "Succinate (Suc)",
                "Fumarate (Fum)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Dehydro-3-deoxy-6-phosphogluconate (DDPG)",
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "6-Phosphogluconate (6PG)",
                "6-Phosphogluconolactone (6PGL)",
                "Acetyl-CoA (AcCoA)",
                "Citrate (Cit)",
                "Dihydroxyacetone phosphate (DHAP)",
                "Erythrulose 4-phosphate (E4P)",
                "Fructose 6-phosphate (F6P)",
                "Fumarate (Fum)",
                "Glucono-1,5-lactone 6-phosphate (GL6P)",
                "Glucose 6-phosphate (G6P)",
                "Glyceraldehyde 3-phosphate (G3P)",
                "Isocitrate (ICit)",
                "Oxaloacetate (OAA)",
                "Phosphoenolpyruvate (PEP)",
                "Pyruvate (Pyr)",
                "Ribose 5-phosphate (R5P)",
                "Ribulose 5-phosphate (Ru5P)",
                "Sedoheptulose 7-phosphate (S7P)",
                "Succinate (Suc)",
                "Succinyl-CoA (SucCoA)",
                "Xylulose 5-phosphate (X5P)",
                "\u03b1-Ketoglutarate (\u03b1-KG)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "R5P (Ribose-5-phosphate)",
            "Ribu5P (Ribulose-5-phosphate)",
            "Xu5P (Xylulose-5-phosphate)",
            "G3P (Glyceraldehyde-3-phosphate)",
            "6-PG (6-Phosphogluconate)",
            "CO2 (Carbon dioxide)",
            "NADPH (Nicotinamide adenine dinucleotide phosphate)",
            "ATP (Adenosine triphosphate)",
            "G6P (Glucose-6-phosphate)",
            " Sedoheptulose-7-phosphate",
            "Erythrose-4-phosphate",
            "Fructose-6-phosphate",
            "Glyceraldehyde-1,3-bisphosphate",
            "Dihydroxyacetone phosphate",
            "Erythrose-4-phosphate",
            "Fructose-1,6-bisphosphate",
            "Glyceraldehyde-3-phosphate",
            "Glycerol-3-phosphate",
            "Ribose-5-phosphate isomerase",
            "Ribulose-5-phosphate isomerase",
            "Xylulose-5-phosphate isomerase",
            "Glyceraldehyde-3-phosphate dehydrogenase",
            "6-Phosphogluconate dehydrogenase",
            "NADPH oxidase",
            "ATP synthase"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "R5P (Ribose-5-phosphate)",
                "Ribu5P (Ribulose-5-phosphate)",
                "Xu5P (Xylulose-5-phosphate)",
                "G3P (Glyceraldehyde-3-phosphate)",
                "6-PG (6-Phosphogluconate)",
                "CO2 (Carbon dioxide)",
                "NADPH (Nicotinamide adenine dinucleotide phosphate)",
                "ATP (Adenosine triphosphate)",
                "G6P (Glucose-6-phosphate)",
                " Sedoheptulose-7-phosphate",
                "Erythrose-4-phosphate",
                "Fructose-6-phosphate",
                "Dihydroxyacetone phosphate",
                "Fructose-1,6-bisphosphate",
                "Glyceraldehyde-3-phosphate",
                "Glycerol-3-phosphate",
                "Ribose-5-phosphate isomerase",
                "Ribulose-5-phosphate isomerase",
                "Xylulose-5-phosphate isomerase",
                "Glyceraldehyde-3-phosphate dehydrogenase",
                "6-Phosphogluconate dehydrogenase",
                "NADPH oxidase"
            ],
            "mismatches": [
                "Glyceraldehyde-1,3-bisphosphate",
                "ATP synthase"
            ],
            "true_referents": [
                " Sedoheptulose-7-phosphate",
                "6-PG (6-Phosphogluconate)",
                "6-Phosphogluconate dehydrogenase",
                "ATP (Adenosine triphosphate)",
                "CO2 (Carbon dioxide)",
                "Dihydroxyacetone phosphate",
                "Erythrose-4-phosphate",
                "Fructose-1,6-bisphosphate",
                "Fructose-6-phosphate",
                "G3P (Glyceraldehyde-3-phosphate)",
                "G6P (Glucose-6-phosphate)",
                "Glyceraldehyde-1,3-bisphosphate",
                "Glyceraldehyde-3-phosphate",
                "Glyceraldehyde-3-phosphate dehydrogenase",
                "Glycerol-3-phosphate",
                "NADPH (Nicotinamide adenine dinucleotide phosphate)",
                "NADPH oxidase",
                "R5P (Ribose-5-phosphate)",
                "Ribose-5-phosphate isomerase",
                "Ribu5P (Ribulose-5-phosphate)",
                "Ribulose-5-phosphate isomerase",
                "Xu5P (Xylulose-5-phosphate)",
                "Xylulose-5-phosphate isomerase"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            "D-Ribose-5-phosphate (R5P)",
            "D-Ribulose-5-phosphate (RUL5P)",
            "D-Xylulose-5-phosphate (XUL5P)",
            "D-Arabinose-5-phosphate (A5P)",
            "D-Ribose (RIB)",
            "D-Ribulose (RUL)",
            "D-Xylulose (XUL)",
            "D-Arabinose (A)",
            "6-Phospho-D-glucono-1,5-lactone (6PGL)",
            "D-Glucono-1,5-lactone-6-phosphate (GLC1L6P)",
            "6-Phospho-D-gluconate (6PG)",
            "D-Gluconate-6-phosphate (GLC6P)",
            "D-Gluconic acid (GLC)",
            "6-Phosphoglucono-\u03b4-lactone (6PGL)",
            "D-Glucono-\u03b4-lactone-6-phosphate (GLC\u03b4L6P)",
            "D-Glucono-\u03b4-lactone (GLC\u03b4L)",
            "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
            "D-Gluconate-6-phosphate (GLC6P)",
            "D-Gluconic acid (GLC)",
            "3-Deoxy-D-glycero-D-galacto-heptose-7-phosphate (DG7P)",
            "D-Sedoheptulose-7-phosphate (S7P)",
            "D-Sedoheptulose (S7)",
            "D-Glycero-D-manno-heptose-7-phosphate (GM7P)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-Ribose-5-phosphate (R5P)",
                "D-Ribulose-5-phosphate (RUL5P)",
                "D-Xylulose-5-phosphate (XUL5P)",
                "D-Arabinose-5-phosphate (A5P)",
                "D-Ribose (RIB)",
                "D-Ribulose (RUL)",
                "D-Xylulose (XUL)",
                "D-Arabinose (A)",
                "6-Phospho-D-glucono-1,5-lactone (6PGL)",
                "D-Glucono-1,5-lactone-6-phosphate (GLC1L6P)",
                "6-Phospho-D-gluconate (6PG)",
                "D-Gluconate-6-phosphate (GLC6P)",
                "D-Gluconic acid (GLC)",
                "6-Phosphoglucono-\u03b4-lactone (6PGL)",
                "D-Glucono-\u03b4-lactone-6-phosphate (GLC\u03b4L6P)",
                "D-Glucono-\u03b4-lactone (GLC\u03b4L)",
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "3-Deoxy-D-glycero-D-galacto-heptose-7-phosphate (DG7P)",
                "D-Sedoheptulose-7-phosphate (S7P)",
                "D-Sedoheptulose (S7)",
                "D-Glycero-D-manno-heptose-7-phosphate (GM7P)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Keto-3-deoxy-6-phosphogluconate (KDPG)",
                "3-Deoxy-D-glycero-D-galacto-heptose-7-phosphate (DG7P)",
                "6-Phospho-D-gluconate (6PG)",
                "6-Phospho-D-glucono-1,5-lactone (6PGL)",
                "6-Phosphoglucono-\u03b4-lactone (6PGL)",
                "D-Arabinose (A)",
                "D-Arabinose-5-phosphate (A5P)",
                "D-Gluconate-6-phosphate (GLC6P)",
                "D-Gluconic acid (GLC)",
                "D-Glucono-1,5-lactone-6-phosphate (GLC1L6P)",
                "D-Glucono-\u03b4-lactone (GLC\u03b4L)",
                "D-Glucono-\u03b4-lactone-6-phosphate (GLC\u03b4L6P)",
                "D-Glycero-D-manno-heptose-7-phosphate (GM7P)",
                "D-Ribose (RIB)",
                "D-Ribose-5-phosphate (R5P)",
                "D-Ribulose (RUL)",
                "D-Ribulose-5-phosphate (RUL5P)",
                "D-Sedoheptulose (S7)",
                "D-Sedoheptulose-7-phosphate (S7P)",
                "D-Xylulose (XUL)",
                "D-Xylulose-5-phosphate (XUL5P)"
            ],
            "TP": 21,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "pentose phosphate pathway organic intermediate",
        "domain": "biology",
        "response": [
            {
                "Referent": "D-ribose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            },
            {
                "Referent": "D-ribulose-5-phosphate (R5P)",
                "Canonical Name": "D-Ribulose-5-phosphate"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "{\"Referent\": \"D-ribose-5-phosphate (R5P)\", \"Canonical Name\": \"D-Ribulose-5-phosphate\"}",
                "{\"Referent\": \"D-ribulose-5-phosphate (R5P)\", \"Canonical Name\": \"D-Ribulose-5-phosphate\"}"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"D-ribose-5-phosphate (R5P)\", \"Canonical Name\": \"D-Ribulose-5-phosphate\"}",
                "{\"Referent\": \"D-ribulose-5-phosphate (R5P)\", \"Canonical Name\": \"D-Ribulose-5-phosphate\"}"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    }
]