[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "sucrose (C12H22O11)",
            "lactose (C12H22O11)",
            "maltose (C12H22O11)",
            "trehalose (C12H24O11)",
            "cellobiose (C12H22O11)",
            "gentiobiose (C12H22O11)",
            "isomaltose (C12H22O11)",
            "panose (C18H32O16)",
            "dulcitol (C6H14O6)",
            "kojibiose (C12H22O11)",
            "melibiose (C18H32O16)",
            "sorbitol (C6H14O6)",
            "toluose (C18H32O16)",
            "verbascose (C30H58O27)",
            "xylobiose (C6H12O6)",
            "rhamnose (C6H12O5)",
            "melibiose (C18H32O16)",
            "gentiobiose (C12H22O11)",
            "isomaltose (C12H22O11)",
            "panose (C18H32O16)",
            "kojibiose (C12H22O11)",
            "melibiulose (C18H32O16)",
            "rhamnose (C6H12O5)",
            "cellobiose (C12H22O11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sucrose (C12H22O11)",
                "lactose (C12H22O11)",
                "maltose (C12H22O11)",
                "trehalose (C12H24O11)",
                "cellobiose (C12H22O11)",
                "gentiobiose (C12H22O11)",
                "isomaltose (C12H22O11)",
                "kojibiose (C12H22O11)",
                "melibiose (C18H32O16)",
                "verbascose (C30H58O27)",
                "xylobiose (C6H12O6)"
            ],
            "mismatches": [
                "panose (C18H32O16)",
                "dulcitol (C6H14O6)",
                "sorbitol (C6H14O6)",
                "toluose (C18H32O16)",
                "rhamnose (C6H12O5)",
                "melibiulose (C18H32O16)"
            ],
            "true_referents": [
                "1-O-(4-O-alpha-D-glucoopyranosyl-beta-D-galactopyranosyl)-glycerol",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-acetyl-alpha-maltose",
                "1-O-acetyl-beta-maltose",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "6-O-(beta-D-xylopyranosyl)-beta-D-glucopyranoside",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "7-O-methylvitexin 2''-O-beta-L-rhamnoside",
                "D-glucopyranosyl-(1->4)-aldehydo-D-mannose",
                "alpha,beta-trehalose",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-L-rhamnosyl-(1->4)-D-glucuronate",
                "alpha-cellobiose",
                "alpha-lactose",
                "beta-D-Gal-(1->4)-beta-D-Xyl-OBn",
                "beta-D-galactosyl-(1->4)-L-rhamnose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "bis-D-fructose 2',1:2,1'-dianhydride",
                "bis-beta-D-fructofuranose 1,2':2,3'-dianhydride",
                "cellobiose",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "gentiobiose octaacetate",
                "irilone-4'-O-[beta-D-glucopyranosyl-(1->6)-beta-D-glucopyranoside]",
                "isomaltose",
                "kojibiose",
                "lactose phosphate",
                "maltose",
                "maltulose",
                "melibiose",
                "nigerose",
                "sambubiose",
                "sesaminol 2-O-beta-D-gentiobioside",
                "sucrose",
                "trehalose",
                "trehalose 6,6'-dimycolate",
                "verbascose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 11,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Lactose (Lac)",
            "Maltose (Mal)",
            "Cellobiose (Cel)",
            "Trehalose (Tre)",
            "Chitin (Chi)",
            "N-Acetylglucosamine (GlcNAc)",
            "N-Acetylgalactosamine (GalNAc)",
            "Sucrose (Suc)",
            "Raffinose (Raf)",
            "Stachyose (Sta)",
            "Verbascose (Ver)",
            "Melibiose (Mel)",
            "Turanose (Tur)",
            "Isomaltose (Iso)",
            "Kojibiose (Koj)",
            "Nigerose (Nig)",
            "Laminaribiose (Lam)",
            "Lactulose (Lacul)",
            "Maltulose (Maltul)",
            "Sialyllactose (SialLLac)",
            "Gentiobiose (Gen)",
            "Turanose (Tur)",
            "Lacto-N-tetraose (LNT)",
            "Lacto-N-neotetraose (LNnT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lactose (Lac)",
                "Maltose (Mal)",
                "Cellobiose (Cel)",
                "Trehalose (Tre)",
                "Sucrose (Suc)",
                "Stachyose (Sta)",
                "Verbascose (Ver)",
                "Melibiose (Mel)",
                "Turanose (Tur)",
                "Isomaltose (Iso)",
                "Kojibiose (Koj)",
                "Nigerose (Nig)",
                "Laminaribiose (Lam)",
                "Lactulose (Lacul)",
                "Maltulose (Maltul)",
                "Gentiobiose (Gen)"
            ],
            "mismatches": [
                "Chitin (Chi)",
                "N-Acetylglucosamine (GlcNAc)",
                "N-Acetylgalactosamine (GalNAc)",
                "Raffinose (Raf)",
                "Sialyllactose (SialLLac)",
                "Lacto-N-tetraose (LNT)",
                "Lacto-N-neotetraose (LNnT)"
            ],
            "true_referents": [
                "(2S)-poncirin",
                "1,6-kestotetraose",
                "1-O-acetyl-beta-maltose",
                "2'-fucosyllactose",
                "3'-ketolactose",
                "4-nitrophenyl beta-lactoside",
                "6'-sialyl LacNAc-C12L",
                "6,6-kestotetraose",
                "6-kestotriose",
                "N-acetyl-alpha-D-galactosaminyl-(1->3)-[alpha-L-fucosyl-(1->2)]-beta-D-galactose derivative",
                "N-acetyl-beta-D-glucosaminyl-(1->4)-D-glucosamine",
                "N-acetyl-beta-D-glucosaminyl-(1->4)-alpha-D-glucosamine",
                "N-acetyllactosamine",
                "alpha,beta-trehalose",
                "alpha-D-galactosyl-N-acetyllactosamine",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "alpha-lactose",
                "beta-D-Gal-(1->3)-alpha-D-GalNAc",
                "beta-D-Galf-(1->5)-D-Galf",
                "beta-D-Galp-(1->3)-L-Araf",
                "beta-L-arabinofuranosyl-(1->2)-beta-L-arabinofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "chitobioses",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "decyl beta-D-maltopyranoside",
                "galactobiose",
                "gentiobiose",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactose phosphate",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltose phosphate",
                "maltulose",
                "melibionic acid",
                "melibiose",
                "nigerose",
                "rutinose",
                "sambubiose",
                "stachyose",
                "streptobiosamine",
                "sucrose",
                "sucrose 6(G)-phosphate",
                "trehalose",
                "trehalose phosphate",
                "turanose",
                "verbascose",
                "vicianose"
            ],
            "TP": 16,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (table sugar)",
            "Lactose (milk sugar)",
            "Maltose (malt sugar)",
            "Cellobiose",
            "Trehalose",
            "Kojibiose",
            "Nigerose",
            "Sophorose",
            "Laminaribiose",
            "Gentiobiose",
            "Turanose",
            "Melibiose",
            "Raffinose",
            "Stachyose",
            "Verbascose",
            "Isomaltose",
            "Palatinose",
            "Leucrose",
            "Maltulose",
            "Lactulose",
            "Lactosucrose",
            "Palatinose",
            "Turanose",
            "Maltobionose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (table sugar)",
                "Lactose (milk sugar)",
                "Maltose (malt sugar)",
                "Cellobiose",
                "Trehalose",
                "Kojibiose",
                "Nigerose",
                "Sophorose",
                "Laminaribiose",
                "Gentiobiose",
                "Turanose",
                "Melibiose",
                "Stachyose",
                "Verbascose",
                "Isomaltose",
                "Leucrose",
                "Maltulose",
                "Lactulose"
            ],
            "mismatches": [
                "Raffinose",
                "Palatinose",
                "Lactosucrose",
                "Maltobionose"
            ],
            "true_referents": [
                "(2S)-poncirin",
                "3-ketosucrose",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "6-kestotriose",
                "D-maltobiono-1,5-lactone",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "beta-L-arabinofuranosyl-(1->2)-beta-L-arabinofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "galactobiose",
                "gentiobiose",
                "glycosylxylose",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactulose",
                "laminarabiose",
                "leucrose",
                "maltose",
                "maltulose",
                "melibiose",
                "nigerose",
                "primeverose",
                "rutinose",
                "sambubiose",
                "sophorose",
                "sophoroside",
                "stachyose",
                "sucrose",
                "trehalose",
                "trehalose phosphate",
                "trehalulose",
                "turanose",
                "verbascose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 18,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (Suc)",
            "Lactose (Lac)",
            "Maltose (Mal)",
            "Cellobiose (Cel)",
            "Trehalose (Tre)",
            "Melibiose (Mel)",
            "Gentianose (Gen)",
            "Laminaribiose (Lam)",
            "Maltotriose (Mal3)",
            "Panose (Pan)",
            "Rutinoside (Rut)",
            "Verbascose (Ver)",
            "Stachyose (Sta)",
            "Raffinose (Raf)",
            "Melezitose (Melz)",
            "Turranose (Tur)",
            "Sophorose (Sop)",
            "Kojibiose (Koj)",
            "Nigerose (Nig)",
            "Isomaltose (IsoMal)",
            "Maltulose (Malulose)",
            "Thelobiose (The)",
            "Rosebiose (Ros)",
            "Phlorizin (Phl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lactose (Lac)",
                "Maltose (Mal)",
                "Cellobiose (Cel)",
                "Trehalose (Tre)",
                "Melibiose (Mel)",
                "Laminaribiose (Lam)",
                "Verbascose (Ver)",
                "Stachyose (Sta)",
                "Sophorose (Sop)",
                "Kojibiose (Koj)",
                "Nigerose (Nig)",
                "Isomaltose (IsoMal)",
                "Maltulose (Malulose)"
            ],
            "mismatches": [
                "Sucrose (Suc)",
                "Gentianose (Gen)",
                "Maltotriose (Mal3)",
                "Panose (Pan)",
                "Rutinoside (Rut)",
                "Raffinose (Raf)",
                "Melezitose (Melz)",
                "Turranose (Tur)",
                "Thelobiose (The)",
                "Rosebiose (Ros)",
                "Phlorizin (Phl)"
            ],
            "true_referents": [
                "(2S)-poncirin",
                "3-hydroxyphloretin 2'-O-xylosylglucoside",
                "6-kestotriose",
                "alpha,beta-trehalose",
                "alpha-cellobiose",
                "alpha-lactose",
                "beta-D-Galf-(1->5)-D-Galf",
                "beta-D-Galp-(1->3)-L-Araf",
                "beta-L-arabinofuranosyl-(1->2)-beta-L-arabinofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "formononetin 7-O-rutinoside",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "inulobiose",
                "isomaltose",
                "isorhamnetin-3-O-rutinoside",
                "kojibiose",
                "lactose",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltose phosphate",
                "maltulose",
                "melibionic acid",
                "melibiose",
                "nigerose",
                "phleomycin D1",
                "pinen-10-yl vicianoside",
                "primeverose",
                "rutinose",
                "sambubiose",
                "sesaminol 2-O-beta-D-gentiobioside",
                "sophorose",
                "sophoroside",
                "stachyose",
                "streptobiosamine",
                "sucrose",
                "sucrose 6(G)-phosphate",
                "trehalose",
                "trehalose phosphate",
                "turanose",
                "tylosin",
                "verbascose",
                "vicianose"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (C12H22O11)",
            "Lactose (C12H22O11)",
            "Maltose (C12H22O11)",
            "Trehalose (C12H22O11)",
            "Cellobiose (C12H22O11)",
            "Isomaltose (C12H22O11)",
            "Gentiobiose (C12H22O11)",
            "Melibiose (C12H22O11)",
            "Xylobiose (C12H22O11)",
            "Sophorose (C12H22O11)",
            "Laminaribiose (C12H22O11)",
            "Mannobiose (C12H22O11)",
            "Neotrehalose (C12H22O11)",
            "Palatinose (C12H22O11)",
            "Turanose (C12H22O11)",
            "Koijibiose (C12H22O11)",
            "Leucrose (C12H22O11)",
            "Maltulose (C12H22O11)",
            "Nigerose (C12H22O11)",
            "Melezitose (C18H32O16)",
            "Raffinose (C18H32O16)",
            "Stachyose (C24H42O21)",
            "Verbascose (C30H52O26)",
            "Ajugose (C36H62O31)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (C12H22O11)",
                "Maltose (C12H22O11)",
                "Trehalose (C12H22O11)",
                "Cellobiose (C12H22O11)",
                "Isomaltose (C12H22O11)",
                "Gentiobiose (C12H22O11)",
                "Melibiose (C12H22O11)",
                "Xylobiose (C12H22O11)",
                "Sophorose (C12H22O11)",
                "Laminaribiose (C12H22O11)",
                "Mannobiose (C12H22O11)",
                "Turanose (C12H22O11)",
                "Leucrose (C12H22O11)",
                "Maltulose (C12H22O11)",
                "Nigerose (C12H22O11)",
                "Stachyose (C24H42O21)",
                "Verbascose (C30H52O26)",
                "Ajugose (C36H62O31)"
            ],
            "mismatches": [
                "Lactose (C12H22O11)",
                "Neotrehalose (C12H22O11)",
                "Palatinose (C12H22O11)",
                "Koijibiose (C12H22O11)",
                "Melezitose (C18H32O16)",
                "Raffinose (C18H32O16)"
            ],
            "true_referents": [
                "1,3,3'-tri-O-methyl-4alpha-mannobiose",
                "1-O-acetyl-alpha-maltose",
                "1-O-acetyl-beta-maltose",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "2-O-palmitoyl-alpha,alpha-trehalose",
                "2-phenylethyl beta-primeveroside",
                "3,3'-neotrehalosadiamine",
                "3,6-di-O-methyl-beta-D-glucopyranosyl-(1->4)-alpha-L-rhamnopyranose",
                "3-ketosucrose",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "D-glucopyranosyl-(1->4)-aldehydo-D-mannose",
                "D-maltobiono-1,5-lactone",
                "D-xylobiono-1,5-lactone",
                "ajugose",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "alpha-lactose",
                "alpha-mannobiose",
                "beta-D-Gal-(1->4)-beta-D-Xyl-OBn",
                "beta-D-apiofuranosyl-(1->6)-D-glucopyranose",
                "beta-D-fructofuranosyl 6-O-octanoyl-alpha-D-glucopyranoside",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "gentiobiose octaacetate",
                "irilone-4'-O-[beta-D-glucopyranosyl-(1->6)-beta-D-glucopyranoside]",
                "isomaltose",
                "kojibiose",
                "lactose phosphate",
                "lactulose",
                "laminarabiose",
                "leucrose",
                "maltose",
                "maltulose",
                "mannobiose",
                "melibiose",
                "nigerose",
                "sambubiose",
                "sesaminol 2-O-beta-D-gentiobioside",
                "sophorose",
                "sophoroside",
                "stachyose",
                "sucrose",
                "trehalose",
                "turanose",
                "verbascose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (C12H22O11)",
            "Lactose (C12H22O11)",
            "Maltose (C12H22O11)",
            "Cellobiose (C12H22O11)",
            "Trehalose (C12H22O11)",
            "Raffinose (C18H32O16)",
            "Melezitose (C18H32O16)",
            "Maltotriose (C18H36O18)",
            "Melezitose (C18H32O16)",
            "Maltotetraose (C24H46O23)",
            "Maltopentaose (C30H54O27)",
            "Maltotriose (C18H36O18)",
            "Mannobiose (C12H22O11)",
            "Lactulose (C12H22O11)",
            "Manninotriose (C18H36O18)",
            "Galactosylsucrose (C18H32O16)",
            "Nigerose (C12H22O11)",
            "Melezitose (C18H32O16)",
            "Oligofructose (C6H10O5)n",
            "Isomaltose (C12H22O11)",
            "Raffinose (C18H32O16)",
            "Maltodextrin (C6H10O5)n",
            "Kestose (C18H32O16)",
            "Maltotetraose (C24H46O23)",
            "Gentiobiose (C12H22O11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (C12H22O11)",
                "Lactose (C12H22O11)",
                "Maltose (C12H22O11)",
                "Cellobiose (C12H22O11)",
                "Trehalose (C12H22O11)",
                "Mannobiose (C12H22O11)",
                "Lactulose (C12H22O11)",
                "Nigerose (C12H22O11)",
                "Isomaltose (C12H22O11)"
            ],
            "mismatches": [
                "Raffinose (C18H32O16)",
                "Melezitose (C18H32O16)",
                "Maltotriose (C18H36O18)",
                "Maltotetraose (C24H46O23)",
                "Maltopentaose (C30H54O27)",
                "Manninotriose (C18H36O18)",
                "Galactosylsucrose (C18H32O16)",
                "Oligofructose (C6H10O5)n",
                "Maltodextrin (C6H10O5)n",
                "Kestose (C18H32O16)",
                "Gentiobiose (C12H22O11)"
            ],
            "true_referents": [
                "1,3,3'-tri-O-methyl-4alpha-mannobiose",
                "1,6-kestotetraose",
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-acetyl-alpha-maltose",
                "1-O-acetyl-beta-maltose",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "6,6-kestotetraose",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "6-kestotriose",
                "D-galactosyl-(1->4)-beta-D-glucose",
                "D-glucopyranosyl-(1->3)-D-mannopyranose",
                "D-glucopyranosyl-(1->4)-aldehydo-D-mannose",
                "D-maltobiono-1,5-lactone",
                "alpha-cellobiose",
                "alpha-lactose",
                "alpha-mannobiose",
                "beta-D-apiofuranosyl-(1->6)-D-glucopyranose",
                "beta-D-fructofuranosyl 6-O-octanoyl-alpha-D-glucopyranoside",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "bis-D-fructose 2',1:2,1'-dianhydride",
                "bis-beta-D-fructofuranose 1,2':2,3'-dianhydride",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "glycosylfructose",
                "isomaltose",
                "lactose phosphate",
                "lactulose",
                "maltose",
                "maltose 1-phosphate",
                "maltose phosphate",
                "maltulose",
                "mannobiose",
                "nigerose",
                "sucrose",
                "trehalose"
            ],
            "TP": 9,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (C12H22O11)",
            "Lactose (C12H22O11)",
            "Maltose (C12H22O11)",
            "Cellobiose (C12H22O11)",
            "Trehalose (C12H22O11)",
            "Gentiobiose (C12H22O11)",
            "Melibiose (C12H22O11)",
            "Isomaltose (C12H22O11)",
            "Laminaribiose (C12H22O11)",
            "Turanose (C12H22O11)",
            "Nigerose (C12H22O11)",
            "Kojibiose (C12H22O11)",
            "Sophorose (C12H22O11)",
            "Globotriose (C12H22O11)",
            "Gentianose (C18H32O16)",
            "Raffinose (C18H32O16)",
            "Stachyose (C24H42O21)",
            "Vernonioside B1 (C30H48O15)",
            "Vernonioside B2 (C30H48O15)",
            "Vernonioside B3 (C30H48O15)",
            "Vernonioside B4 (C30H48O15)",
            "Vernonioside B5 (C30H48O15)",
            "Vernonioside B6 (C30H48O15)",
            "Vernonioside B7 (C30H48O15)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (C12H22O11)",
                "Lactose (C12H22O11)",
                "Maltose (C12H22O11)",
                "Cellobiose (C12H22O11)",
                "Trehalose (C12H22O11)",
                "Gentiobiose (C12H22O11)",
                "Melibiose (C12H22O11)",
                "Isomaltose (C12H22O11)",
                "Laminaribiose (C12H22O11)",
                "Turanose (C12H22O11)",
                "Nigerose (C12H22O11)",
                "Kojibiose (C12H22O11)",
                "Sophorose (C12H22O11)",
                "Stachyose (C24H42O21)"
            ],
            "mismatches": [
                "Globotriose (C12H22O11)",
                "Gentianose (C18H32O16)",
                "Raffinose (C18H32O16)",
                "Vernonioside B1 (C30H48O15)",
                "Vernonioside B2 (C30H48O15)",
                "Vernonioside B3 (C30H48O15)",
                "Vernonioside B4 (C30H48O15)",
                "Vernonioside B5 (C30H48O15)",
                "Vernonioside B6 (C30H48O15)",
                "Vernonioside B7 (C30H48O15)"
            ],
            "true_referents": [
                "1-O-acetyl-alpha-maltose",
                "1-O-acetyl-beta-maltose",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "3,6-di-O-methyl-beta-D-glucopyranosyl-(1->4)-alpha-L-rhamnopyranose",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "7-O-methylvitexin 2''-O-alpha-L-rhamnoside",
                "7-O-methylvitexin 2''-O-beta-L-rhamnoside",
                "Mogroside II-A2",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "alpha-lactose",
                "beta-D-GlcpA-(1->4)-beta-D-GlcpOCH2CH2NH2",
                "beta-D-apiofuranosyl-(1->6)-D-glucopyranose",
                "beta-D-fructofuranosyl 6-O-octanoyl-alpha-D-glucopyranoside",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "chrysoeriol 7-O-gentiobioside",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "gentiobiose octaacetate",
                "inulobiose",
                "irilone-4'-O-[beta-D-glucopyranosyl-(1->6)-beta-D-glucopyranoside]",
                "isomaltose",
                "isovitexin 2''-O-beta-D-glucoside",
                "kojibiose",
                "lactose phosphate",
                "laminarabiose",
                "lyciumoside IV",
                "maltose",
                "melibiose",
                "nicotianoside I",
                "nigerose",
                "quercetin 3-beta-gentiobioside",
                "sambubiose",
                "sesaminol 2-O-beta-D-gentiobioside",
                "sophorose",
                "sophoroside",
                "stachyose",
                "sucrose",
                "trehalose",
                "turanose",
                "vitexin 2''-O-beta-D-glucoside"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose",
            "Lactose",
            "Maltose",
            "Trehalose",
            "Isomaltose",
            "Cellobiose",
            "Lactulose",
            "Melibiose",
            "Gentianose",
            "Sophorose",
            "Nigerose",
            "Raffinose",
            "Stachyose",
            "Verbascose",
            "Mannobiose",
            "Glucobiose",
            "Galactobiose",
            "Xylobiose",
            "Arabinobiose",
            "Fucobiose",
            "Rhamnobiose",
            "Lyxobiose",
            "Ribobiose",
            "Xylulose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose",
                "Lactose",
                "Maltose",
                "Trehalose",
                "Isomaltose",
                "Cellobiose",
                "Lactulose",
                "Melibiose",
                "Sophorose",
                "Nigerose",
                "Stachyose",
                "Verbascose",
                "Mannobiose",
                "Galactobiose",
                "Xylobiose"
            ],
            "mismatches": [
                "Gentianose",
                "Raffinose",
                "Glucobiose",
                "Arabinobiose",
                "Fucobiose",
                "Rhamnobiose",
                "Lyxobiose",
                "Ribobiose",
                "Xylulose"
            ],
            "true_referents": [
                "(2S)-poncirin",
                "alpha-cellobiose",
                "alpha-mannobiose",
                "beta-(1->6)-galactobiose",
                "beta-L-arabinofuranosyl-(1->2)-beta-L-arabinofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-mannobiose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "galactobiose",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "glycosylarabinose",
                "glycosylxylose",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltulose",
                "mannobiose",
                "melibiose",
                "nigerose",
                "robinobiose",
                "rutinose",
                "sesaminol 2-O-beta-D-gentiobioside",
                "sophorose",
                "sophoroside",
                "stachyose",
                "sucrose",
                "trehalose",
                "trehalose phosphate",
                "trehalulose",
                "turanose",
                "verbascose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (Suc)",
            "Lactose",
            "Maltose",
            "Cellobiose",
            "Trehalose",
            "Isomaltose",
            "Melibiose",
            "Gentiobiose",
            "Lactulose",
            "Allolactose",
            "Turanose",
            "Kojibiose",
            "Neomaltose",
            "Trehalulose",
            "Xylobiose",
            "Arabinobiose",
            "Rhamnobiose",
            "Upiose",
            "Vicianose",
            "Guloside",
            "Tagatose",
            "Fucosyl Disaccharide",
            "Laminaribiose",
            "Pentosyl Disaccharide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lactose",
                "Maltose",
                "Cellobiose",
                "Trehalose",
                "Isomaltose",
                "Melibiose",
                "Gentiobiose",
                "Lactulose",
                "Allolactose",
                "Turanose",
                "Kojibiose",
                "Trehalulose",
                "Xylobiose",
                "Vicianose",
                "Laminaribiose"
            ],
            "mismatches": [
                "Sucrose (Suc)",
                "Neomaltose",
                "Arabinobiose",
                "Rhamnobiose",
                "Upiose",
                "Guloside",
                "Tagatose",
                "Fucosyl Disaccharide",
                "Pentosyl Disaccharide"
            ],
            "true_referents": [
                "(R)-vicianin",
                "1,6-kestotetraose",
                "2,2'-difucosyllactose",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "ajugose",
                "allolactose",
                "alpha-L-fucosyl-(1->2)-beta-D-galactoside",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-allolactose",
                "alpha-cellobiose",
                "beta-allolactose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "galactobiose",
                "gentiobiose",
                "glycosylfucose",
                "glycosylpentose",
                "glycosylpentose derivative",
                "glycosylxylose",
                "gypenoside LXXV",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltulose",
                "melibiose",
                "pinen-10-yl vicianoside",
                "robinobiose",
                "rutinose",
                "sambubiose",
                "sophorose",
                "sophoroside",
                "sucrose",
                "sucrose 6(G)-phosphate",
                "trehalosamine",
                "trehalose",
                "trehalose phosphate",
                "trehalulose",
                "turanose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (table sugar)",
            "Lactose (milk sugar)",
            "Maltose (malt sugar)",
            "Trehalose",
            "Cellobiose",
            "Gentiobiose",
            "Isomaltose",
            "Kojibiose",
            "Nigerose",
            "Sophorose",
            "Laminaribiose",
            "Melibiose",
            "Xylobiose",
            "Mannobiose",
            "Chitobiose",
            "Rutinose",
            "Primeverose",
            "Vicianose",
            "Sambubiose",
            "Rutinulose",
            "Turanose",
            "Maltulose",
            "Lactulose",
            "Palatinose (isomaltulose)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (table sugar)",
                "Lactose (milk sugar)",
                "Maltose (malt sugar)",
                "Trehalose",
                "Cellobiose",
                "Gentiobiose",
                "Isomaltose",
                "Kojibiose",
                "Nigerose",
                "Sophorose",
                "Melibiose",
                "Xylobiose",
                "Mannobiose",
                "Chitobiose",
                "Rutinose",
                "Primeverose",
                "Vicianose",
                "Sambubiose",
                "Turanose",
                "Maltulose",
                "Lactulose"
            ],
            "mismatches": [
                "Laminaribiose",
                "Rutinulose",
                "Palatinose (isomaltulose)"
            ],
            "true_referents": [
                "(R)-vicianin",
                "2-phenylethyl beta-primeveroside",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "alpha-mannobiose",
                "benzyl beta-primeveroside",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-mannobiose",
                "beta-melibiose",
                "cellobiose",
                "chitobioses",
                "cyanidin 3-O-rutinoside",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "formononetin 7-O-rutinoside",
                "galactobiose",
                "gentiobiose",
                "glycosylxylose",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltulose",
                "mannobiose",
                "melibiose",
                "nigerose",
                "pinen-10-yl vicianoside",
                "primeverose",
                "rutin",
                "rutinose",
                "sambubiose",
                "sophorose",
                "sophoroside",
                "sucrose",
                "trehalose",
                "trehalose phosphate",
                "trehalulose",
                "turanose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (table sugar)",
            "Lactose (milk sugar)",
            "Maltose (malt sugar)",
            "Trehalose",
            "Cellobiose",
            "Gentiobiose",
            "Kojibiose",
            "Laminaribiose",
            "Maltulose",
            "Mannobiose",
            "Melibiose",
            "Nigerose",
            "Palatinose (isomaltulose)",
            "Primeverose",
            "Rutinose",
            "Sacarose",
            "Sophorose",
            "Turanose",
            "Vicianose",
            "Xylobiose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (table sugar)",
                "Lactose (milk sugar)",
                "Maltose (malt sugar)",
                "Trehalose",
                "Cellobiose",
                "Gentiobiose",
                "Kojibiose",
                "Maltulose",
                "Mannobiose",
                "Melibiose",
                "Nigerose",
                "Primeverose",
                "Rutinose",
                "Sophorose",
                "Turanose",
                "Vicianose",
                "Xylobiose"
            ],
            "mismatches": [
                "Laminaribiose",
                "Palatinose (isomaltulose)",
                "Sacarose"
            ],
            "true_referents": [
                "(R)-vicianin",
                "2-phenylethyl beta-primeveroside",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "alpha-mannobiose",
                "benzyl beta-primeveroside",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-mannobiose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "formononetin 7-O-rutinoside",
                "galactobiose",
                "gentiobiose",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltulose",
                "mannobiose",
                "melibiose",
                "nigerose",
                "pinen-10-yl vicianoside",
                "primeverose",
                "rutinose",
                "sambubiose",
                "sophorose",
                "sophoroside",
                "sucrose",
                "trehalose",
                "trehalose phosphate",
                "trehalulose",
                "turanose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 17,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (C12H22O11)",
            "Lactose (C12H22O11)",
            "Maltose (C12H22O11)",
            "Cellobiose (C12H22O11)",
            "Trehalose (C12H22O11)",
            "Gentiobiose (C12H22O11)",
            "Isomaltose (C12H22O11)",
            "Melibiose (C12H22O11)",
            "Rutinose (C12H22O11)",
            "Palatinose (C12H22O11)",
            "Turanose (C12H22O11)",
            "Maltulose (C12H22O11)",
            "Isomaltulose (C12H22O11)",
            "Kojibiose (C12H22O11)",
            "Nigerose (C12H22O11)",
            "Laminaribiose (C12H22O11)",
            "Sophorose (C12H22O11)",
            "Vicianose (C12H22O11)",
            "Allolactose (C12H22O11)",
            "Mannobiose (C12H22O11)",
            "Isotrehalose (C12H22O11)",
            "Sambubiose (C12H22O11)",
            "Primeverose (C12H22O11)",
            "Secaloindolinose (C12H22O11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (C12H22O11)",
                "Lactose (C12H22O11)",
                "Maltose (C12H22O11)",
                "Cellobiose (C12H22O11)",
                "Trehalose (C12H22O11)",
                "Gentiobiose (C12H22O11)",
                "Isomaltose (C12H22O11)",
                "Melibiose (C12H22O11)",
                "Rutinose (C12H22O11)",
                "Turanose (C12H22O11)",
                "Maltulose (C12H22O11)",
                "Kojibiose (C12H22O11)",
                "Nigerose (C12H22O11)",
                "Laminaribiose (C12H22O11)",
                "Sophorose (C12H22O11)",
                "Vicianose (C12H22O11)",
                "Allolactose (C12H22O11)",
                "Mannobiose (C12H22O11)",
                "Sambubiose (C12H22O11)",
                "Primeverose (C12H22O11)"
            ],
            "mismatches": [
                "Palatinose (C12H22O11)",
                "Isomaltulose (C12H22O11)",
                "Isotrehalose (C12H22O11)",
                "Secaloindolinose (C12H22O11)"
            ],
            "true_referents": [
                "1,3,3'-tri-O-methyl-4alpha-mannobiose",
                "1-O-acetyl-alpha-maltose",
                "1-O-acetyl-beta-maltose",
                "2''-O-(6-sinapoylglucosyl)isovitexin",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "2-O-palmitoyl-alpha,alpha-trehalose",
                "2-phenylethyl beta-primeveroside",
                "3,6-di-O-methyl-beta-D-glucopyranosyl-(1->4)-alpha-L-rhamnopyranose",
                "3-O-alpha-rhamnopyranosyl-(1->4)-beta-glucopyranosyl-17-hydroxygeranyllinalool",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "7-O-[alpha-L-rhamnosyl-(1->2)-beta-D-glucosyl]isoorientin",
                "7-O-methylvitexin 2''-O-alpha-L-rhamnoside",
                "7-O-methylvitexin 2''-O-beta-L-rhamnoside",
                "D-glucopyranosyl-(1->4)-aldehydo-D-mannose",
                "allolactose",
                "alpha,beta-trehalose",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-allolactose",
                "alpha-cellobiose",
                "alpha-lactose",
                "alpha-mannobiose",
                "benzyl beta-primeveroside",
                "beta-allolactose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "formononetin 7-O-rutinoside",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "gentiobiose octaacetate",
                "inulobiose",
                "irilone-4'-O-[beta-D-glucopyranosyl-(1->6)-beta-D-glucopyranoside]",
                "isomaltose",
                "kojibiose",
                "lactose phosphate",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltulose",
                "mannobiose",
                "melibiose",
                "nigerose",
                "primeverose",
                "rutinose",
                "sambubiose",
                "sesaminol 2-O-beta-D-gentiobioside",
                "sinapoyl-isovitexin 2''-O-arabinoside",
                "sophorose",
                "sophoroside",
                "sucrose",
                "trehalose",
                "turanose",
                "vicianose"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (Suc)",
            "Lactose (Lac)",
            "Maltose (Mal)",
            "Trehalose (Tre)",
            "Cellobiose (Cel)",
            "Gentiobiose (Gen)",
            "Melibiose (Mel)",
            "Turanose (Tur)",
            "Palatinose (Pal)",
            "Nigerose (Nig)",
            "Kojibiose (Koj)",
            "Laminaribiose (Lam)",
            "Sophorose (Sop)",
            "Primeverose (Pri)",
            "Xylobiose (Xyl)",
            "Isomaltose (Iso)",
            "Laminaritriose (Lat)",
            "Cellotriose (Cet)",
            "Mannotriose (Mat)",
            "Panose (Pan)",
            "Isomaltotriose (Imt)",
            "Maltotriose (Mat)",
            "Melezitose (Mez)",
            "Raffinose (Raf)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose (Suc)",
                "Lactose (Lac)",
                "Maltose (Mal)",
                "Trehalose (Tre)",
                "Cellobiose (Cel)",
                "Gentiobiose (Gen)",
                "Melibiose (Mel)",
                "Turanose (Tur)",
                "Nigerose (Nig)",
                "Kojibiose (Koj)",
                "Laminaribiose (Lam)",
                "Sophorose (Sop)",
                "Primeverose (Pri)",
                "Xylobiose (Xyl)",
                "Isomaltose (Iso)"
            ],
            "mismatches": [
                "Palatinose (Pal)",
                "Laminaritriose (Lat)",
                "Cellotriose (Cet)",
                "Mannotriose (Mat)",
                "Panose (Pan)",
                "Isomaltotriose (Imt)",
                "Maltotriose (Mat)",
                "Melezitose (Mez)",
                "Raffinose (Raf)"
            ],
            "true_referents": [
                "1-O-acetyl-beta-maltose",
                "2-phenylethyl beta-primeveroside",
                "6-hydroxyluteolin 7-O-laminaribioside",
                "alpha,beta-trehalose",
                "alpha-L-rhamnopyranosyl-(1->2)-beta-D-glucopyranose",
                "alpha-cellobiose",
                "alpha-lactose",
                "alpha-maltose",
                "alpha-mannobiose",
                "benzyl beta-primeveroside",
                "beta-D-Gal-(1->4)-beta-D-Xyl-OBn",
                "beta-D-Galf-(1->5)-D-Galf",
                "beta-D-Galp-(1->3)-L-Araf",
                "beta-L-arabinofuranosyl-(1->2)-beta-L-arabinofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-mannobiose",
                "beta-melibiose",
                "cellobiose",
                "cyclobis-(1->6)-alpha-nigerosyl",
                "galactobiose",
                "gentiobiose",
                "inulobiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactose 6'-phosphate",
                "lactulose",
                "laminarabiose",
                "maltose",
                "maltose phosphate",
                "maltulose",
                "mannobiose",
                "melibionic acid",
                "melibiose",
                "nigerose",
                "pinen-10-yl vicianoside",
                "primeverose",
                "rutinose",
                "sambubiose",
                "sophorose",
                "sophoroside",
                "sucrose",
                "sucrose 6(G)-phosphate",
                "trehalose",
                "trehalose phosphate",
                "turanose",
                "xylobiose"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Fructose (Fru)",
            "Galactose (Gal)",
            "Lactose",
            "Maltose",
            "Isomaltose",
            "Trehalose",
            "Cellobiose",
            "Isomaltulose",
            "Sucrose (Suc)",
            "Lactulose",
            "Melibiose",
            "Raffinose",
            "Stachyose",
            "Verbascose",
            "Isomaltotriose",
            "Isomaltohexose",
            "Isomaltoheptose",
            "Isomaltooctose",
            "Isomaltononose",
            "Isomaltohexaose",
            "Isomaltoylohexose",
            "Isomaltoyloheptose"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lactose",
                "Maltose",
                "Isomaltose",
                "Trehalose",
                "Cellobiose",
                "Lactulose",
                "Melibiose",
                "Stachyose",
                "Verbascose"
            ],
            "mismatches": [
                "Fructose (Fru)",
                "Galactose (Gal)",
                "Isomaltulose",
                "Sucrose (Suc)",
                "Raffinose",
                "Isomaltotriose",
                "Isomaltohexose",
                "Isomaltoheptose",
                "Isomaltooctose",
                "Isomaltononose",
                "Isomaltohexaose",
                "Isomaltoylohexose",
                "Isomaltoyloheptose"
            ],
            "true_referents": [
                "(2S)-poncirin",
                "1,6-kestotetraose",
                "3'-dehydromaltose",
                "6,6-kestotetraose",
                "D-galactosyl-(1->4)-beta-D-glucose",
                "D-maltobiono-1,5-lactone",
                "alpha-D-galactosyl-(1->2)-beta-D-galactose",
                "alpha-D-galactosyl-(1->3)-D-galactose",
                "alpha-cellobiose",
                "beta-D-Manp-(1->2)-alpha-D-ManpO[CH2]5NH2",
                "beta-L-arabinofuranosyl-(1->2)-beta-L-arabinofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "bis-D-fructose 2',1:2,1'-dianhydride",
                "cellobiose",
                "glycosylxylose",
                "isobemisiose",
                "isomaltose",
                "kojibiose",
                "lactose",
                "lactulose",
                "maltose",
                "maltulose",
                "melibiose",
                "rutinose",
                "sophorose",
                "stachyose",
                "sucrose",
                "sucrose 6(G)-phosphate",
                "trehalose",
                "trehalose phosphate",
                "trehalulose",
                "turanose",
                "verbascose",
                "vicianose",
                "xylobiose"
            ],
            "TP": 9,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            "Sucrose (C12H22O11)",
            "Lactose (C12H22O11)",
            "Maltose (C12H22O11)",
            "Trehalose (C12H22O11)",
            "Isomaltose (C12H22O11)",
            "Gentiobiose (C14H26O11)",
            "Cellobiose (C12H22O11)",
            "Melibiose (C12H22O11)",
            "Sophorose (C14H26O11)",
            "Raffinose (C18H32O16)",
            "Stachyose (C20H36O17)",
            "Verbascose (C22H40O18)",
            "JuglansRegiose (C20H36O17)",
            "Planteose (C20H36O17)",
            "Fucosyllactose (C18H32O16)",
            "Lacto-N-fucopentaose I (C25H44O22)",
            "Lacto-N-difucohexaose I (C28H50O25)",
            "Neolactotriaoside (C18H32O16)",
            "Trifucosyllactose (C21H38O19)",
            "Penta-4G-fucosyllactose (C24H44O22)",
            "Hexa-2-fucosyllactose (C26H48O24)",
            "Hepta-3,6-fucosyllactose (C28H52O26)",
            "Octa-4,6-fucosyllactose (C30H56O28)",
            "Nona-3,6-fucosyllactose (C32H60O30)",
            "Deca-4,6-fucosyllactose (C34H64O32)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sucrose",
                "Lactose",
                "Maltose",
                "Trehalose",
                "Isomaltose",
                "Gentiobiose",
                "Cellobiose",
                "Melibiose",
                "Sophorose",
                "Stachyose",
                "Verbascose"
            ],
            "mismatches": [
                "Raffinose",
                "JuglansRegiose",
                "Planteose",
                "Fucosyllactose",
                "Lacto-N-fucopentaose I",
                "Lacto-N-difucohexaose I",
                "Neolactotriaoside",
                "Trifucosyllactose",
                "Penta-4G-fucosyllactose",
                "Hexa-2-fucosyllactose",
                "Hepta-3,6-fucosyllactose",
                "Octa-4,6-fucosyllactose",
                "Nona-3,6-fucosyllactose",
                "Deca-4,6-fucosyllactose"
            ],
            "true_referents": [
                "1-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "1-O-acetyl-alpha-maltose",
                "1-O-acetyl-beta-maltose",
                "2''-O-(beta-D-glucosyl)isovitexin",
                "2'-fucosyllactose",
                "2,2'-difucosyllactose",
                "2-O-(4-O-beta-D-galactopyranosyl-beta-D-glucopyranosyl)-glycerol",
                "2-O-(N-acetyl-alpha-D-galactosaminyl)-L-fucitol",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "3'-dehydromaltose",
                "3-O-alpha-rhamnopyranosyl-(1->4)-beta-glucopyranosyl-17-hydroxygeranyllinalool",
                "3-fucosyllactose",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "7-O-[alpha-L-rhamnosyl-(1->2)-beta-D-glucosyl]chrysoeriol",
                "7-O-methylvitexin 2''-O-alpha-L-rhamnoside",
                "7-O-methylvitexin 2''-O-beta-L-rhamnoside",
                "N-acetyl-alpha-D-galactosaminyl-(1->3)-[alpha-L-fucosyl-(1->2)]-beta-D-galactose derivative",
                "acacetin-8-C-neohesperidoside",
                "alpha-cellobiose",
                "alpha-lactose",
                "beta-D-apiofuranosyl-(1->6)-D-glucopyranose",
                "beta-D-fructofuranosyl 6-O-octanoyl-alpha-D-glucopyranoside",
                "beta-D-fructofuranosyl-(2,1)-beta-D-fructofuranose",
                "beta-cellobiose",
                "beta-lactose",
                "beta-maltose",
                "beta-melibiose",
                "cellobiose",
                "genistin 7-O-gentiobioside",
                "gentiobiose",
                "gentiobiose octaacetate",
                "gypenoside XVII",
                "irilone-4'-O-[beta-D-glucopyranosyl-(1->6)-beta-D-glucopyranoside]",
                "isomaltose",
                "lactose phosphate",
                "maltose",
                "melibiose",
                "methyl 2-O-alpha-L-fucopyranosyl-beta-D-galactoside",
                "rubiarbonol A 3-O-beta-D-glucopyranosyl-(1->2)-beta-D-glucopyranoside",
                "sophorose",
                "sophoroside",
                "stachyose",
                "sucrose",
                "sucrose 6(G)-phosphate",
                "trehalose",
                "verbascose"
            ],
            "TP": 11,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "disaccharide",
        "domain": "chemistry",
        "response": [
            {
                "referent": "glucose",
                "identifier": "C6H12O6"
            },
            {
                "referent": "fructose",
                "identifier": "C6H12O6"
            },
            {
                "referent": "sucrose",
                "identifier": "C12H22O11"
            },
            {
                "referent": "lactose",
                "identifier": "C12H22O11"
            },
            {
                "referent": "maltose",
                "identifier": "C12H22O11"
            },
            {
                "referent": "trehalose",
                "identifier": "C12H22O11"
            },
            {
                "referent": "cellobiose",
                "identifier": "C12H22O11"
            },
            {
                "referent": "glycogen",
                "identifier": "C12H22O11"
            },
            {
                "referent": "amylopectin",
                "identifier": "C12H22O11"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "cellulose",
                "identifier": "C6H10O5"
            },
            {
                "referent": "chitin",
                "identifier": "C8H13O5N"
            },
            {
                "referent": "chitosan",
                "identifier": "C8H13O5N"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sucrose",
                "lactose",
                "maltose",
                "trehalose",
                "cellobiose"
            ],
            "mismatches": [
                "glucose",
                "fructose",
                "glycogen",
                "amylopectin",
                "chitin",
                "chitosan",
                "cellulose"
            ],
            "true_referents": [
                "1-O-acetyl-beta-maltose",
                "2-O-(long-chain fatty acyl)-alpha,alpha-trehalose",
                "3-(4-deoxy-beta-D-gluc-4-enosyluronic acid)-N-acetyl-D-glucosamine",
                "3-O-beta-D-glucosyl-D-glucuronic acid",
                "4-\\{[4-(dimethylamino)phenyl]diazenyl\\}phenyl-beta-lactoside",
                "6-O-alpha-D-glucopyranosyl-D-fructofuranose",
                "6-O-alpha-D-glucopyranosyl-beta-D-fructofuranose",
                "D-galactosyl-(1->4)-beta-D-glucose",
                "N-acetyl-beta-D-galactosaminyl-(1->4)-N-acetyl-beta-D-glucosaminide",
                "N-acetyl-beta-D-glucosaminyl-(1->4)-D-glucosamine",
                "alpha-cellobiose",
                "beta-cellobiose",
                "bis-D-fructose 2',1:2,1'-dianhydride",
                "bis-beta-D-fructofuranose 1,2':2,3'-dianhydride",
                "cellobiose",
                "glycosylxylose",
                "lactose phosphate",
                "maltose",
                "sucrose",
                "trehalose"
            ],
            "TP": 5,
            "FP": 7,
            "FN": 0
        }
    }
]