[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "fructose (Fru)",
            "tagatose",
            "psicose",
            "sorbose",
            "ribose-5-phosphate",
            "xylofuranose",
            "lyxofuranose",
            "ribulose",
            "xylulose",
            "lyxulose",
            "sedoheptulose",
            "fructofuranose",
            "galactofuranose",
            "glucosulose",
            "mannofuranose",
            "altrufuranose",
            "ribulose-5-phosphate",
            "xylulose-5-phosphate",
            "ribulose bisphosphate",
            "sedoheptulose-7-phosphate",
            "ribulose-1,5-bisphosphate",
            "xylulose-1,5-bisphosphate",
            "sedoheptulose-1,7-bisphosphate",
            "fructose-1,6-bisphosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "fructose (Fru)",
                "tagatose",
                "psicose",
                "sorbose",
                "fructofuranose"
            ],
            "mismatches": [
                "ribose-5-phosphate",
                "xylofuranose",
                "lyxofuranose",
                "ribulose",
                "xylulose",
                "lyxulose",
                "sedoheptulose",
                "galactofuranose",
                "glucosulose",
                "mannofuranose",
                "altrufuranose",
                "ribulose-5-phosphate",
                "xylulose-5-phosphate",
                "ribulose bisphosphate",
                "sedoheptulose-7-phosphate",
                "ribulose-1,5-bisphosphate",
                "xylulose-1,5-bisphosphate",
                "sedoheptulose-1,7-bisphosphate",
                "fructose-1,6-bisphosphate"
            ],
            "true_referents": [
                "D-fructofuranose 1,6-bisphosphate",
                "D-fructose",
                "D-fructose 1-phosphate",
                "D-fructose 6-phosphate",
                "D-psicose",
                "D-sorbose",
                "D-sorbose 1,6-bisphosphate",
                "D-tagatose",
                "L-fructofuranose",
                "L-fructopyranose",
                "L-fructose",
                "L-psicose",
                "L-rhamnulose",
                "L-sorbofuranose",
                "L-sorbose",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "alpha-L-sorbofuranose",
                "beta-D-fructofuranose 1,6-bisphosphate",
                "beta-D-fructopyranose 1-phosphate",
                "fructofuranose",
                "fructopyranose",
                "fructose",
                "keto-D-fructose 1,6-bisphosphate",
                "keto-D-fructose 1-phosphate",
                "keto-D-tagatose",
                "keto-L-tagatose",
                "keto-L-tagatose 6-phosphate",
                "psicose",
                "sorbofuranose",
                "sorbose",
                "sorbose 1-phosphate",
                "tagatose"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "Fructofuranose",
            "Fructopyranose",
            "Sorbose (Sor)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructofuranose",
                "Fructopyranose",
                "Sorbose (Sor)"
            ],
            "mismatches": [
                "Fructose (Fru)"
            ],
            "true_referents": [
                "D-fructose",
                "D-sorbose",
                "L-fructofuranose",
                "L-fructopyranose",
                "L-fructose",
                "L-sorbose",
                "fructofuranose",
                "fructopyranose",
                "fructose",
                "sorbose"
            ],
            "TP": 3,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "Tagatose",
            "Sorbose",
            "Psicose",
            "Allulose",
            "D-Fructofuranose",
            "L-Fructofuranose",
            "D-Fructopyranose",
            "L-Fructopyranose",
            "D-Psicose",
            "L-Psicose",
            "D-Tagatose",
            "L-Tagatose",
            "D-Sorbose",
            "L-Sorbose",
            "D-Xylulose",
            "L-Xylulose",
            "D-Altroheptulose",
            "L-Altroheptulose",
            "D-Mannoheptulose",
            "L-Mannoheptulose",
            "D-Sedoheptulose",
            "L-Sedoheptulose",
            "D-Taloheptulose",
            "L-Taloheptulose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (Fru)",
                "Tagatose",
                "Sorbose",
                "Psicose",
                "D-Fructofuranose",
                "L-Fructofuranose",
                "D-Fructopyranose",
                "L-Fructopyranose",
                "D-Psicose",
                "L-Psicose",
                "D-Tagatose",
                "L-Tagatose",
                "D-Sorbose",
                "L-Sorbose"
            ],
            "mismatches": [
                "Allulose",
                "D-Xylulose",
                "L-Xylulose",
                "D-Altroheptulose",
                "L-Altroheptulose",
                "D-Mannoheptulose",
                "L-Mannoheptulose",
                "D-Sedoheptulose",
                "L-Sedoheptulose",
                "D-Taloheptulose",
                "L-Taloheptulose"
            ],
            "true_referents": [
                "D-fructofuranose",
                "D-fructopyranose",
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "D-tagatofuranose",
                "D-tagatose",
                "L-fructofuranose",
                "L-fructopyranose",
                "L-fructose",
                "L-fuculose",
                "L-psicose",
                "L-sorbose",
                "L-sorbose 1-phosphate",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "beta-D-fructofuranose",
                "beta-D-fructopyranose",
                "beta-L-fructopyranose",
                "fructofuranose",
                "fructopyranose",
                "fructose",
                "keto-D-sorbose",
                "keto-D-tagatose",
                "keto-L-tagatose",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 14,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "D-Fructose",
            "L-Fructose",
            "Fructose-6-phosphate (F6P)",
            "D-Fructose-6-phosphate",
            "L-Fructose-6-phosphate",
            "Fructose-1,6-bisphosphate (FBP)",
            "D-Fructose-1,6-bisphosphate",
            "L-Fructose-1,6-bisphosphate",
            "Sedoheptulose (S7U)",
            "D-Sedoheptulose",
            "L-Sedoheptulose",
            "Sedoheptulose-1,7-bisphosphate (S1,7BP)",
            "D-Sedoheptulose-1,7-bisphosphate",
            "L-Sedoheptulose-1,7-bisphosphate",
            "D-Psicose",
            "L-Psicose",
            "D-Sorbose",
            "L-Sorbose",
            "D-Tagatose",
            "L-Tagatose",
            "D-Mannose (as an intermediate in fructose metabolism)",
            "L-Mannose (as an intermediate in fructose metabolism)",
            "Ribulose (Ru)",
            "D-Ribulose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-Fructose",
                "L-Fructose",
                "D-Fructose-6-phosphate",
                "D-Fructose-1,6-bisphosphate",
                "D-Psicose",
                "L-Psicose",
                "D-Sorbose",
                "L-Sorbose",
                "D-Tagatose",
                "L-Tagatose",
                "Fructose"
            ],
            "mismatches": [
                "Fructose-6-phosphate (F6P)",
                "L-Fructose-6-phosphate",
                "Fructose-1,6-bisphosphate (FBP)",
                "L-Fructose-1,6-bisphosphate",
                "Sedoheptulose (S7U)",
                "D-Sedoheptulose",
                "L-Sedoheptulose",
                "Sedoheptulose-1,7-bisphosphate (S1,7BP)",
                "D-Sedoheptulose-1,7-bisphosphate",
                "L-Sedoheptulose-1,7-bisphosphate",
                "D-Mannose (as an intermediate in fructose metabolism)",
                "L-Mannose (as an intermediate in fructose metabolism)",
                "Ribulose (Ru)",
                "D-Ribulose"
            ],
            "true_referents": [
                "5-dehydro-D-fructose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructofuranose 1,6-bisphosphate",
                "D-fructopyranose",
                "D-fructose",
                "D-fructose 1-phosphate",
                "D-fructose 6-phosphate",
                "D-psicose",
                "D-sorbose",
                "D-sorbose 1,6-bisphosphate",
                "D-tagatose",
                "L-fructopyranose",
                "L-fructose",
                "L-fuculose",
                "L-psicose",
                "L-rhamnulose",
                "L-sorbose",
                "L-sorbose 1-phosphate",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "alpha-D-tagatofuranose",
                "beta-D-fructofuranose 1,6-bisphosphate",
                "fructose",
                "fructoselysine 6-phosphate",
                "keto-D-fructose 1,6-bisphosphate",
                "keto-D-fructose 6-phosphate",
                "keto-D-sorbose",
                "keto-D-tagatose",
                "keto-L-fructose",
                "keto-L-tagatose",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 11,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (C6H12O6)",
            "Sorbose (C6H12O6)",
            "Tagatose (C6H12O6)",
            "Psicose (C6H12O6)",
            "Allulose (C6H12O6)",
            "Dihydroxyacetone dimer (C6H12O6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (C6H12O6)",
                "Sorbose (C6H12O6)",
                "Tagatose (C6H12O6)",
                "Psicose (C6H12O6)"
            ],
            "mismatches": [
                "Allulose (C6H12O6)",
                "Dihydroxyacetone dimer (C6H12O6)"
            ],
            "true_referents": [
                "3-deoxy-keto-D-fructose",
                "5-dehydro-D-fructose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "L-fructose",
                "L-psicose",
                "L-sorbose",
                "L-xylo-3-hexulose",
                "fructose",
                "keto-D-sorbose",
                "keto-L-tagatose",
                "psicose",
                "sorbose",
                "tagatose derivative"
            ],
            "TP": 4,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "fructose (Fru)",
            "sorbose (Sor)",
            "psicose (Psi)",
            "tagatose (Tag)",
            "allulose (All)",
            "dihydroxyacetone (DHA)",
            "sorbose (Sor)",
            "2-keto-D-glucose (2KDG)",
            "2-keto-D-mannose (2KDM)",
            "2-keto-D-galactose (2KDGal)",
            "2-keto-D-lyxose (2KDLy)",
            "2-keto-D-ribose (2KDR)",
            "2-keto-D-arabinose (2KDA)",
            "2-keto-D-xylulose (2KDX)",
            "2-keto-D-xylose (2KDXy)",
            "2-keto-D-rhamnose (2KDRh)",
            "2-keto-D-fucose (2KDFu)",
            "2-keto-D-mannose (2KDM)",
            "2-keto-D-idohexose (2KDI)",
            "2-keto-D-gulose (2KDGul)",
            "2-keto-D-talose (2KDTal)",
            "2-keto-D-galactose (2KDGal)",
            "2-keto-D-allose (2KDA)",
            "2-keto-D-mannose (2KDM)",
            "2-keto-D-lyxose (2KDLy)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "fructose (Fru)",
                "sorbose (Sor)",
                "psicose (Psi)",
                "tagatose (Tag)"
            ],
            "mismatches": [
                "allulose (All)",
                "dihydroxyacetone (DHA)",
                "2-keto-D-glucose (2KDG)",
                "2-keto-D-mannose (2KDM)",
                "2-keto-D-galactose (2KDGal)",
                "2-keto-D-lyxose (2KDLy)",
                "2-keto-D-ribose (2KDR)",
                "2-keto-D-arabinose (2KDA)",
                "2-keto-D-xylulose (2KDX)",
                "2-keto-D-xylose (2KDXy)",
                "2-keto-D-rhamnose (2KDRh)",
                "2-keto-D-fucose (2KDFu)",
                "2-keto-D-idohexose (2KDI)",
                "2-keto-D-gulose (2KDGul)",
                "2-keto-D-talose (2KDTal)",
                "2-keto-D-allose (2KDA)"
            ],
            "true_referents": [
                "3-deoxy-keto-D-fructose",
                "3-keto-beta-D-galactose",
                "5-dehydro-D-fructose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "D-tagatose",
                "L-fructose",
                "L-psicose",
                "L-sorbose",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "fructose",
                "keto-D-fructose",
                "keto-D-fructose 1-phosphate",
                "keto-D-fructose 6-phosphate",
                "keto-D-sorbose",
                "keto-D-tagatose",
                "keto-L-sorbose",
                "keto-L-tagatose",
                "ketohexose derivative",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 4,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (C6H12O6)",
            "Psicose (C6H12O6)",
            "Sorbose (C6H12O6)",
            "Tagatose (C6H12O6)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (C6H12O6)",
                "Psicose (C6H12O6)",
                "Sorbose (C6H12O6)"
            ],
            "mismatches": [
                "Tagatose (C6H12O6)"
            ],
            "true_referents": [
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "L-fructose",
                "L-psicose",
                "L-sorbose",
                "fructose",
                "keto-L-tagatose",
                "psicose",
                "sorbose",
                "tagatose derivative"
            ],
            "TP": 3,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "Sorbose (Sor)",
            "Tagatose (Tag)",
            "Psicose (Psi)",
            "Allose (All)",
            "Altrose (Alt)",
            "Glucose (Glc)",
            "Mannose (Man)",
            "Gulose (Gul)",
            "Idose (Ido)",
            "Talose (Tal)",
            "Xylulose (Xyl)",
            "Lyxose (Lyx)",
            "Ribose (Rib)",
            "Arabinose (Ara)",
            "Deoxyribose (dRib)",
            "Erythrulose (Ery)",
            "Threose (Thr)",
            "Erythrose (Ert)",
            "Xylose (Xyl)",
            "Lyxose (Lyx)",
            "Rhamnose (Rha)",
            "Fucose (Fuc)",
            "Ketohexose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (Fru)",
                "Sorbose (Sor)",
                "Tagatose (Tag)",
                "Psicose (Psi)",
                "Ketohexose"
            ],
            "mismatches": [
                "Allose (All)",
                "Altrose (Alt)",
                "Glucose (Glc)",
                "Mannose (Man)",
                "Gulose (Gul)",
                "Idose (Ido)",
                "Talose (Tal)",
                "Xylulose (Xyl)",
                "Lyxose (Lyx)",
                "Ribose (Rib)",
                "Arabinose (Ara)",
                "Deoxyribose (dRib)",
                "Erythrulose (Ery)",
                "Threose (Thr)",
                "Erythrose (Ert)",
                "Xylose (Xyl)",
                "Lyxose (Lyx)",
                "Rhamnose (Rha)",
                "Fucose (Fuc)"
            ],
            "true_referents": [
                "1,5-anhydro-D-erythro-hex-1-en-3-ulose",
                "3-dehydro-D-guloside",
                "3-deoxy-3-methyl-beta-D-fructofuranose",
                "3-deoxyglucosone",
                "5-dehydro-D-fructose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "D-tagatose",
                "L-fructopyranose",
                "L-fructose",
                "L-fuculose",
                "L-fuculose 1-phosphate",
                "L-psicose",
                "L-rhamnulose",
                "L-rhamnulose 1-phosphate",
                "L-sorbose",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "alpha-D-fructopyranose",
                "alpha-chrysopine",
                "beta-D-fructopyranose",
                "beta-chrysopine",
                "deoxyketohexose",
                "deoxyketohexose phosphate",
                "fructopyranose",
                "fructose",
                "keto-D-sorbose",
                "keto-D-tagatose",
                "keto-L-tagatose",
                "ketohexose derivative",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 5,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "D-Fructose",
            "L-Fructose",
            "Psicose (Psi)",
            "D-Psicose",
            "L-Psicose",
            "Sorbose (Sor)",
            "D-Sorbose",
            "L-Sorbose",
            "Tagatose (Tag)",
            "D-Tagatose",
            "L-Tagatose",
            "Allofructose",
            "D-Allofructose",
            "L-Allofructose",
            "Neofructose",
            "D-Neofructose",
            "L-Neofructose",
            "Idose",
            "D-Idose",
            "L-Idose",
            "Cidarose",
            "D-Cidarose",
            "L-Cidarose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-Fructose",
                "L-Fructose",
                "D-Psicose",
                "L-Psicose",
                "D-Sorbose",
                "L-Sorbose",
                "D-Tagatose",
                "L-Tagatose"
            ],
            "mismatches": [
                "Fructose (Fru)",
                "Psicose (Psi)",
                "Sorbose (Sor)",
                "Tagatose (Tag)",
                "Allofructose",
                "D-Allofructose",
                "L-Allofructose",
                "Neofructose",
                "D-Neofructose",
                "L-Neofructose",
                "Idose",
                "D-Idose",
                "L-Idose",
                "Cidarose",
                "D-Cidarose",
                "L-Cidarose"
            ],
            "true_referents": [
                "3-deoxyglucosone",
                "5-dehydro-D-fructose",
                "D-fructofuranose",
                "D-fructopyranose",
                "D-fructose",
                "D-psicose",
                "D-sorbopyranose",
                "D-sorbose",
                "D-tagatose",
                "L-fructopyranose",
                "L-fructose",
                "L-psicose",
                "L-sorbofuranose",
                "L-sorbopyranose",
                "L-sorbose",
                "L-sorbose 1-phosphate",
                "L-tagatose",
                "beta-D-sorbopyranose",
                "fructopyranose",
                "fructose",
                "keto-D-fructose",
                "keto-D-sorbose",
                "keto-D-tagatose",
                "keto-L-fructose",
                "keto-L-tagatose",
                "psicose",
                "sorbofuranose",
                "sorbose",
                "tagatose"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (D-fructose)",
            "Psicose (D-psicose)",
            "Tagatose (D-tagatose)",
            "Sorbose (L-sorbose)",
            "Allulose (D-allulose)",
            "Ribulose (D-ribulose)",
            "Xylulose (D-xylulose)",
            "Hamamelose",
            "Glucosone",
            "Acarbose",
            "Fructose-6-phosphate",
            "Tagatose-6-phosphate",
            "Psicose-6-phosphate",
            "Sorbose-1-phosphate",
            "Fructose-1-phosphate",
            "Fructose-1,6-bisphosphate",
            "Sedoheptulose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-fructose",
                "D-psicose",
                "D-tagatose",
                "L-sorbose",
                "D-fructose 6-phosphate",
                "D-tagatose 6-phosphate",
                "D-psicose 6-phosphate",
                "L-sorbose 1-phosphate",
                "D-fructose 1-phosphate",
                "beta-D-fructofuranose 1,6-bisphosphate"
            ],
            "mismatches": [
                "Allulose (D-allulose)",
                "Ribulose (D-ribulose)",
                "Xylulose (D-xylulose)",
                "Hamamelose",
                "Glucosone",
                "Acarbose",
                "Sedoheptulose"
            ],
            "true_referents": [
                "3-dehydro-D-glucoside",
                "5-dehydro-D-fructose",
                "D-fructopyranose",
                "D-fructose",
                "D-fructose 1-phosphate",
                "D-fructose 6-phosphate",
                "D-psicose",
                "D-psicose 6-phosphate",
                "D-psicose 6-phosphate(2-)",
                "D-sorbose",
                "D-tagatose",
                "D-tagatose 6-phosphate",
                "L-fructose",
                "L-fuculose",
                "L-psicose",
                "L-rhamnulose",
                "L-sorbose",
                "L-sorbose 1-phosphate",
                "L-tagatose",
                "L-tagatose 6-phosphate",
                "L-xylo-3-hexulose",
                "beta-D-fructofuranose 1,6-bisphosphate",
                "beta-D-sorbopyranose",
                "keto-D-fructose 1,6-bisphosphate",
                "keto-D-fructose 1-phosphate",
                "keto-D-fructose 6-phosphate",
                "keto-D-tagatose",
                "keto-L-tagatose",
                "keto-L-tagatose 6-phosphate",
                "levoglucosenone",
                "psicose",
                "sorbopyranose",
                "sorbose",
                "sorbose 1-phosphate",
                "tagatose"
            ],
            "TP": 10,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "D-fructose",
            "L-fructose",
            "D-psicose",
            "L-psicose",
            "D-sorbose",
            "L-sorbose",
            "D-tagatose",
            "L-tagatose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "D-fructose",
                "L-fructose",
                "D-psicose",
                "L-psicose",
                "D-sorbose",
                "L-sorbose",
                "D-tagatose",
                "L-tagatose"
            ],
            "mismatches": [],
            "true_referents": [
                "5-dehydro-D-fructose",
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "D-tagatose",
                "L-fructose",
                "L-psicose",
                "L-sorbose",
                "L-sorbose 1-phosphate",
                "L-tagatose",
                "keto-D-sorbose",
                "keto-D-tagatose",
                "keto-L-fructose",
                "keto-L-tagatose",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 8,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (C6H12O6)",
            "Sorbose (C6H12O6)",
            "Psicose (C6H12O6)",
            "Tagatose (C6H12O6)",
            "Galactose (C6H12O6)",
            "Talose (C6H12O6)",
            "Gulose (C6H12O6)",
            "Idose (C6H12O6)",
            "Allose (C6H12O6)",
            "Altrose (C6H12O6)",
            "Mannose (C6H12O6)",
            "Glucose (C6H12O6)",
            "Allohexose (C6H12O6)",
            "Allohexulose (C6H12O6)",
            "Allohexulopyranose (C6H12O6)",
            "Allohexulofuranose (C6H12O6)",
            "Hexodialdose (C6H12O6)",
            "Hexodiulose (C6H12O6)",
            "Hexosedialdose (C6H12O6)",
            "Hexosediulose (C6H12O6)",
            "Hexuronic acid (C6H10O7)",
            "Deoxyhexose (C6H12O5)",
            "Deoxyhexodialdose (C6H12O5)",
            "Deoxyhexosedialdose (C6H12O5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (C6H12O6)",
                "Sorbose (C6H12O6)",
                "Psicose (C6H12O6)"
            ],
            "mismatches": [
                "Tagatose (C6H12O6)",
                "Galactose (C6H12O6)",
                "Talose (C6H12O6)",
                "Gulose (C6H12O6)",
                "Idose (C6H12O6)",
                "Allose (C6H12O6)",
                "Altrose (C6H12O6)",
                "Mannose (C6H12O6)",
                "Glucose (C6H12O6)",
                "Allohexose (C6H12O6)",
                "Allohexulose (C6H12O6)",
                "Allohexulopyranose (C6H12O6)",
                "Allohexulofuranose (C6H12O6)",
                "Hexodialdose (C6H12O6)",
                "Hexodiulose (C6H12O6)",
                "Hexosedialdose (C6H12O6)",
                "Hexosediulose (C6H12O6)",
                "Hexuronic acid (C6H10O7)",
                "Deoxyhexose (C6H12O5)",
                "Deoxyhexodialdose (C6H12O5)",
                "Deoxyhexosedialdose (C6H12O5)"
            ],
            "true_referents": [
                "1,5-anhydro-D-erythro-hex-1-en-3-ulose",
                "3-dehydro-D-guloside",
                "3-deoxy-3-methyl-beta-D-fructofuranose",
                "3-keto-beta-D-galactose",
                "5-dehydro-D-fructose",
                "6-deoxy-6-sulfo-D-fructofuranose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructose",
                "D-fructose 6-phosphate",
                "D-psicose",
                "D-psicose 6-phosphate",
                "D-psicose 6-phosphate(2-)",
                "D-sorbose",
                "L-fructofuranose",
                "L-fructose",
                "L-psicose",
                "L-sorbopyranose",
                "L-sorbose",
                "L-xylo-3-hexulose",
                "alpha-chrysopine",
                "bis-beta-D-fructofuranose 1,2':2,3'-dianhydride",
                "deoxyketohexose",
                "deoxyketohexose derivative",
                "deoxyketohexose phosphate",
                "fructopyranose",
                "fructose",
                "keto-L-tagatose",
                "psicose",
                "sorbopyranose",
                "sorbose",
                "tagatose derivative"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Glucose (Glc)",
            "Fructose (Fru)",
            "Ribulose (Rbu)",
            "Xylulose (Xul)",
            "Sedoheptulose (Sed)",
            "Erythrulose (Ery)",
            "Psicose (Psi)",
            "Sorbose (Sor)",
            "Tagatose (Tag)",
            "Dextrose (Dex)",
            "Levulose (Lev)",
            "Sucrose (Suc)",
            "Maltose (Mal)",
            "Lactose (Lac)",
            "Cellobiose (Cel)",
            "Trehalose (Tre)",
            "Melibiose (Mel)",
            "Palatinose (Pal)",
            "Turanose (Tur)",
            "Gentiobiose (Gen)",
            "Isomaltose (Iso)",
            "Kojibiose (Koj)",
            "Nigerose (Nig)",
            "Laminaribiose (Lam)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (Fru)",
                "Psicose (Psi)",
                "Sorbose (Sor)",
                "Tagatose (Tag)"
            ],
            "mismatches": [
                "Glucose (Glc)",
                "Ribulose (Rbu)",
                "Xylulose (Xul)",
                "Sedoheptulose (Sed)",
                "Erythrulose (Ery)",
                "Dextrose (Dex)",
                "Levulose (Lev)",
                "Sucrose (Suc)",
                "Maltose (Mal)",
                "Lactose (Lac)",
                "Cellobiose (Cel)",
                "Trehalose (Tre)",
                "Melibiose (Mel)",
                "Palatinose (Pal)",
                "Turanose (Tur)",
                "Gentiobiose (Gen)",
                "Isomaltose (Iso)",
                "Kojibiose (Koj)",
                "Nigerose (Nig)",
                "Laminaribiose (Lam)"
            ],
            "true_referents": [
                "1,5-anhydro-D-erythro-hex-1-en-3-ulose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "D-tagatopyranose",
                "D-tagatose",
                "L-fructofuranose",
                "L-fructose",
                "L-psicose",
                "L-rhamnulose",
                "L-sorbose",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "N-(1-deoxy-1-fructosyl)phenylalanine",
                "alpha-D-tagatopyranose",
                "beta-D-fructofuranose",
                "beta-D-fructofuranose 1,6-bisphosphate",
                "beta-D-fructopyranose",
                "beta-D-tagatofuranose",
                "beta-D-tagatopyranose",
                "beta-L-fructofuranose",
                "beta-chrysopine",
                "fructopyranose",
                "fructose",
                "keto-D-tagatose",
                "keto-L-tagatose",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 4,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Glucose (Glc)",
            "Fructose (Fru)",
            "Galactose (Gal)",
            "Mannose (Man)",
            "Idose",
            "Altrose",
            "Talose",
            "Psicose",
            "Tagatose",
            "Ribulose",
            "Xylulose",
            "Ribose",
            "Arabinose",
            "Lyxose",
            "Xylose",
            "Rhamnose",
            "Fucose",
            "Aldose",
            "Ketose",
            "Erythrose",
            "Threose",
            "Ribose-5-phosphate",
            "Xylulose-5-phosphate"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (Fru)",
                "Psicose",
                "Tagatose"
            ],
            "mismatches": [
                "Glucose (Glc)",
                "Galactose (Gal)",
                "Mannose (Man)",
                "Idose",
                "Altrose",
                "Talose",
                "Ribulose",
                "Xylulose",
                "Ribose",
                "Arabinose",
                "Lyxose",
                "Xylose",
                "Rhamnose",
                "Fucose",
                "Aldose",
                "Ketose",
                "Erythrose",
                "Threose",
                "Ribose-5-phosphate",
                "Xylulose-5-phosphate"
            ],
            "true_referents": [
                "1,5-anhydro-D-erythro-hex-1-en-3-ulose",
                "3-deoxy-3-methyl-beta-D-fructofuranose",
                "3-deoxyglucosone",
                "3-keto-beta-D-galactose",
                "6-deoxy-beta-L-fructofuranose",
                "D-fructose",
                "D-fructose 1-phosphate",
                "D-fructose 6-phosphate",
                "D-psicose",
                "D-tagatose",
                "L-fructopyranose",
                "L-fructose",
                "L-fuculose",
                "L-psicose",
                "L-rhamnulose",
                "L-rhamnulose 1-phosphate",
                "L-tagatose",
                "L-xylo-3-hexulose",
                "alpha-chrysopine",
                "beta-D-fructopyranose 1-phosphate",
                "beta-chrysopine",
                "deoxyketohexose",
                "fructopyranose",
                "fructose",
                "keto-D-fructose",
                "keto-D-sorbose",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 3,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "Sorbose (Sor)",
            "Tagatose (Tag)",
            "Psicose (Psi)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fructose (Fru)",
                "Sorbose (Sor)",
                "Tagatose (Tag)",
                "Psicose (Psi)"
            ],
            "mismatches": [],
            "true_referents": [
                "D-fructose",
                "D-psicose",
                "D-sorbose",
                "D-tagatose",
                "L-fructose",
                "L-psicose",
                "L-sorbose",
                "L-tagatose",
                "fructose",
                "psicose",
                "sorbose",
                "tagatose"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "ketohexose",
        "domain": "chemistry",
        "response": [
            {
                "referent": "glucose",
                "canonical name": "Glucose"
            },
            {
                "referent": "fructose",
                "canonical name": "Fructose"
            },
            {
                "referent": "ribose",
                "canonical name": "Ribose"
            },
            {
                "referent": "deoxyribose",
                "canonical name": "Deoxyribose"
            },
            {
                "referent": "galactose",
                "canonical name": "Galactose"
            },
            {
                "referent": "xylose",
                "canonical name": "Xylose"
            },
            {
                "referent": "erythrose",
                "canonical name": "Erythrose"
            },
            {
                "referent": "lyxose",
                "canonical name": "Lyxose"
            },
            {
                "referent": "arabinose",
                "canonical name": "Arabinose"
            },
            {
                "referent": "altrose",
                "canonical name": "Altrose"
            },
            {
                "referent": "glucuronic acid",
                "canonical name": "Glucuronic acid"
            },
            {
                "referent": "galacturonic acid",
                "canonical name": "Galacturonic acid"
            },
            {
                "referent": "iduronic acid",
                "canonical name": "Iduonic acid"
            },
            {
                "referent": "glucuronamide",
                "canonical name": "Glucuronamide"
            },
            {
                "referent": "galacturonamide",
                "canonical name": "Galacturonamide"
            },
            {
                "referent": "iduronamide",
                "canonical name": "Iduronamide"
            },
            {
                "referent": "glucose-6-phosphate",
                "canonical name": "Glucose-6-phosphate"
            },
            {
                "referent": "glucose-1-phosphate",
                "canonical name": "Glucose-1-phosphate"
            },
            {
                "referent": "glucose-2-phosphate",
                "canonical name": "Glucose-2-phosphate"
            },
            {
                "referent": "glucose-3-phosphate",
                "canonical name": "Glucose-3-phosphate"
            },
            {
                "referent": "glucose-4-phosphate",
                "canonical name": "Glucose-4-phosphate"
            },
            {
                "referent": "glucose-5-phosphate",
                "canonical name": "Glucose-5-phosphate"
            },
            {
                "referent": "glucose-6-phosphate",
                "canonical name": "Glucose-6-phosphate"
            },
            {
                "referent": "glucose-1-phosphate",
                "canonical name": "Glucose-1-phosphate"
            },
            {
                "referent": "glucose-2-phosphate",
                "canonical name": "Glucose-2-phosphate"
            },
            {
                "referent": "glucose-3-phosphate",
                "canonical name": "Glucose-3-phosphate"
            },
            {
                "referent": "glucose-4-phosphate",
                "canonical name": "Glucose-4-phosphate"
            },
            {
                "referent": "glucose-5-phosphate",
                "canonical name": "Glucose-5-phosphate"
            },
            {
                "referent": "glucose-6-phosphate",
                "canonical name": "Glucose-6-phosphate"
            },
            {
                "referent": "glucose-1-phosphate",
                "canonical name": "Glucose-1-phosphate"
            },
            {
                "referent": "glucose-2-phosphate",
                "canonical name": "Glucose-2-phosphate"
            },
            {
                "referent": "glucose-3-phosphate",
                "canonical name": "Glucose-3-phosphate"
            },
            {
                "referent": "glucose-4-phosphate",
                "canonical name": "Glucose-4-phosphate"
            },
            {
                "referent": "glucose-5-phosphate",
                "canonical name": "Glucose-5-phosphate"
            },
            {
                "referent": "glucose-6-phosphate",
                "canonical name": "Glucose-6-phosphate"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "fructose"
            ],
            "mismatches": [
                "glucose",
                "ribose",
                "deoxyribose",
                "galactose",
                "xylose",
                "erythrose",
                "lyxose",
                "arabinose",
                "altrose",
                "glucuronic acid",
                "galacturonic acid",
                "iduronic acid",
                "glucuronamide",
                "galacturonamide",
                "iduronamide",
                "glucose-6-phosphate",
                "glucose-1-phosphate",
                "glucose-2-phosphate",
                "glucose-3-phosphate",
                "glucose-4-phosphate",
                "glucose-5-phosphate"
            ],
            "true_referents": [
                "3-deoxyglucosone",
                "3-keto-beta-D-galactose",
                "D-fructofuranuronic acid",
                "D-fructose",
                "D-fructose 1-phosphate",
                "D-fructose 6-phosphate",
                "D-psicose",
                "D-psicose 6-phosphate(2-)",
                "L-fructose",
                "L-psicose",
                "L-xylo-3-hexulose",
                "alpha-chrysopine",
                "beta-D-fructopyranose",
                "bis-beta-D-fructofuranose 1,2':2,3'-dianhydride",
                "chrysopine",
                "deoxyketohexose",
                "deoxyketohexose phosphate",
                "fructopyranose",
                "fructose"
            ],
            "TP": 1,
            "FP": 21,
            "FN": 0
        }
    }
]