[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "chlorophyll a (Chl a)",
            "chlorophyll b (Chl b)",
            "chlorophyll c",
            "chlorophyll d",
            "chlorophyll e",
            "bacteriochlorophyll a",
            "bacteriochlorophyll b",
            "bacteriochlorophyll c",
            "bacteriochlorophyll d",
            "bacteriochlorophyll e",
            "bacteriochlorophyll g",
            "bacteriochlorophyll h",
            "bacteriochlorophyll i",
            "bacteriochlorophyll j",
            "pseudobacteriochlorophyll a",
            "pseudobacteriochlorophyll b",
            "phycocyanobilin",
            "phycoerythrobilin",
            "phycocyanin",
            "phycoerythrin",
            "fucoxanthin",
            "astaxanthin",
            "lycopene",
            "zeaxanthin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "chlorophyll a (Chl a)",
                "chlorophyll b (Chl b)",
                "chlorophyll c",
                "chlorophyll d",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "phycocyanobilin",
                "phycoerythrobilin"
            ],
            "mismatches": [
                "chlorophyll e",
                "bacteriochlorophyll d",
                "bacteriochlorophyll g",
                "bacteriochlorophyll h",
                "bacteriochlorophyll i",
                "bacteriochlorophyll j",
                "pseudobacteriochlorophyll a",
                "pseudobacteriochlorophyll b",
                "phycocyanin",
                "phycoerythrin",
                "fucoxanthin",
                "astaxanthin",
                "lycopene",
                "zeaxanthin"
            ],
            "true_referents": [
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "Chlorophyll c",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "bacteriochlorophyllide g",
                "chlorophyll",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll d",
                "phycocyanobilin",
                "phycoerythrobilin"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Hemoglobin (Hb)",
            "Myoglobin (Mb)",
            "Cytochrome c",
            "Cytochrome b",
            "Cytochrome P450",
            "Cytochrome c oxidase",
            "Cytochrome a",
            "Cytochrome a3",
            "Biliverdin",
            "Bilirubin",
            "Protoporphyrin IX",
            "Coproporphyrinogen III",
            "Uroporphyrinogen III",
            "Chlorophyll a",
            "Chlorophyll b",
            "Chlorophyll c1",
            "Chlorophyll c2",
            "Chlorophyll d",
            "Chlorophyll f",
            "Phycocyanobilin",
            "Phytochromobilin",
            "Vitamin B12 (Cobalamin)",
            "Heme",
            "Erythrocuprein",
            "Leghemoglobin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Biliverdin",
                "Coproporphyrinogen III",
                "Uroporphyrinogen III",
                "Chlorophyll a",
                "Chlorophyll b",
                "Chlorophyll c1",
                "Chlorophyll c2",
                "Chlorophyll d",
                "Chlorophyll f",
                "Phycocyanobilin",
                "Phytochromobilin",
                "Heme"
            ],
            "mismatches": [
                "Hemoglobin (Hb)",
                "Myoglobin (Mb)",
                "Cytochrome c",
                "Cytochrome b",
                "Cytochrome P450",
                "Cytochrome c oxidase",
                "Cytochrome a",
                "Cytochrome a3",
                "Bilirubin",
                "Protoporphyrin IX",
                "Vitamin B12 (Cobalamin)",
                "Erythrocuprein",
                "Leghemoglobin"
            ],
            "true_referents": [
                "(-)-stercobilin",
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(3E)-phytochromobilin",
                "(3Z)-phytochromobilin",
                "(E,E)-bilirubin",
                "13(2)-carboxypyropheophorbide a",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "Deuteroporphyrin IX",
                "bacteriochlorophyll c",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll c2",
                "chlorophyll d",
                "chlorophyll f",
                "cobalamin",
                "coproporphyrin III",
                "coproporphyrinogen",
                "coproporphyrinogen III",
                "cytoporphyrin",
                "heme",
                "heme a",
                "heme b",
                "heme-cysteine",
                "mesoporphyrin IX",
                "metalloporphyrin",
                "methylcobalamin",
                "phenylporphyrin",
                "phycocyanobilin",
                "phytochromobilin",
                "porphyrin",
                "protoporphyrin",
                "uroporphyrin III",
                "uroporphyrinogen",
                "uroporphyrinogen III"
            ],
            "TP": 12,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Heme (Fe-protoporphyrin IX)",
            "Chlorophyll a",
            "Chlorophyll b",
            "Chlorophyll c",
            "Chlorophyll d",
            "Chlorophyll f",
            "Bacteriochlorophyll a",
            "Bacteriochlorophyll b",
            "Bacteriochlorophyll c",
            "Bacteriochlorophyll d",
            "Bacteriochlorophyll e",
            "Bacteriochlorophyll g",
            "Biliverdin",
            "Bilirubin",
            "Phycocyanobilin",
            "Phytochromobilin",
            "Urobilin",
            "Stercobilin",
            "Phycocyanin",
            "Phycoerythrin",
            "Phycocyanobilin",
            "Phytochromobilin",
            "Protoporphyrin IX",
            "Coproporphyrin",
            "Uroporphyrin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chlorophyll a",
                "Chlorophyll b",
                "Chlorophyll c",
                "Chlorophyll d",
                "Chlorophyll f",
                "Bacteriochlorophyll a",
                "Bacteriochlorophyll b",
                "Bacteriochlorophyll c",
                "Bacteriochlorophyll e",
                "Biliverdin",
                "Phycocyanobilin",
                "Phytochromobilin",
                "Urobilin",
                "Stercobilin",
                "Coproporphyrin"
            ],
            "mismatches": [
                "Heme (Fe-protoporphyrin IX)",
                "Bacteriochlorophyll d",
                "Bacteriochlorophyll g",
                "Bilirubin",
                "Phycocyanin",
                "Phycoerythrin",
                "Protoporphyrin IX",
                "Uroporphyrin"
            ],
            "true_referents": [
                "(-)-stercobilin",
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(3E)-phytochromobilin",
                "(3Z)-phytochromobilin",
                "(E,E)-bilirubin",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "D-Urobilin",
                "Deuteroporphyrin IX",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "bacteriochlorophyllide g",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll d",
                "chlorophyll f",
                "coproporphyrin",
                "coproporphyrin III",
                "coproporphyrinogen",
                "heme",
                "mesoporphyrin IX",
                "phycocyanobilin",
                "phycoerythrobilin",
                "phytochromobilin",
                "protoporphyrin",
                "stercobilin",
                "stercobilinogen",
                "urobilin",
                "urobilinogen"
            ],
            "TP": 15,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Heme B (HB)",
            "Heme A (HA)",
            "Protoporphyrin IX (PPIX)",
            "Protoporphyrin VII (PPII)",
            "Protoporphyrin III (PPIII)",
            "Uroporphyrin I (UPI)",
            "Uroporphyrin III (UPIII)",
            "Coproporphyrin I (CPI)",
            "Coproporphyrin III (CPIII)",
            "Mesoporphyrin IX (MPIX)",
            "Deuteroporphyrin IX (DPIX)",
            "Vinylheme (VH)",
            "Ethylheme (EH)",
            "Methylheme (MH)",
            "Ferriprotoporphyrin IX (FePPIX)",
            "Ferroprotoporphyrin IX (FePPIX)",
            "Chlorophyll a (Chl a)",
            "Chlorophyll b (Chl b)",
            "Bacteriochlorophyll a (BChl a)",
            "Bacteriochlorophyll b (BChl b)",
            "Porphobilinogen (PBG)",
            "Hydroxymethylbilane (HMB)",
            "Urobilinogen (UBG)",
            "Stercobilin (SCB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heme B (HB)",
                "Heme A (HA)",
                "Uroporphyrin I (UPI)",
                "Uroporphyrin III (UPIII)",
                "Coproporphyrin I (CPI)",
                "Coproporphyrin III (CPIII)",
                "Mesoporphyrin IX (MPIX)",
                "Deuteroporphyrin IX (DPIX)",
                "Chlorophyll a (Chl a)",
                "Chlorophyll b (Chl b)",
                "Bacteriochlorophyll a (BChl a)",
                "Bacteriochlorophyll b (BChl b)",
                "Urobilinogen (UBG)",
                "Stercobilin (SCB)"
            ],
            "mismatches": [
                "Protoporphyrin IX (PPIX)",
                "Protoporphyrin VII (PPII)",
                "Protoporphyrin III (PPIII)",
                "Vinylheme (VH)",
                "Ethylheme (EH)",
                "Methylheme (MH)",
                "Ferriprotoporphyrin IX (FePPIX)",
                "Ferroprotoporphyrin IX (FePPIX)",
                "Porphobilinogen (PBG)",
                "Hydroxymethylbilane (HMB)"
            ],
            "true_referents": [
                "(-)-stercobilin",
                "Coproporphyrin II",
                "D-Urobilinogen",
                "Deuteroporphyrin IX",
                "Fe-coproporphyrin III",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "chlorophyll a",
                "chlorophyll b",
                "coproporphyrin",
                "coproporphyrin I",
                "coproporphyrin III",
                "coproporphyrinogen I",
                "diporphyrin",
                "ferroheme",
                "heme a",
                "heme b",
                "hydrogenobyrinic acid",
                "hydrogenobyrinic acid a,c-diamide",
                "meso-meso-diporphyrin",
                "mesoporphyrin IX",
                "mesoporphyrins",
                "mycobilin b",
                "porphyrinogen",
                "porphyrinogens",
                "protoporphyrin",
                "protoporphyrins",
                "stercobilin",
                "stercobilinogen",
                "urobilin",
                "urobilinogen",
                "uroporphyrin",
                "uroporphyrin I",
                "uroporphyrin III",
                "uroporphyrinogen I",
                "uroporphyrinogen III"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Heme (HEM)",
            "Chlorophyll a (CHLa)",
            "Chlorophyll b (CHLb)",
            "Chlorophyll c (CHLc)",
            "Chlorophyll d (CHLd)",
            "Chlorophyll f (CHLf)",
            "Biliverdin (BVD)",
            "Phycocyanobilin (PCB)",
            "Phycoerythrobilin (PEB)",
            "Phycourobilin (PUB)",
            "Urobilin (UBN)",
            "Stercobilin (SBN)",
            "Protoporphyrin IX (PPIX)",
            "Cobalamin (Vitamin B12)",
            "Bilichrome",
            "Phylloerythrin",
            "Pheophytin a",
            "Pheophytin b",
            "Protochlorophyllide",
            "Bacteriochlorophyll a",
            "Bacteriochlorophyll b",
            "Bacteriochlorophyll c",
            "Bacteriochlorophyll d",
            "Bacteriochlorophyll e"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heme (HEM)",
                "Chlorophyll a (CHLa)",
                "Chlorophyll b (CHLb)",
                "Chlorophyll c (CHLc)",
                "Chlorophyll d (CHLd)",
                "Chlorophyll f (CHLf)",
                "Biliverdin (BVD)",
                "Phycocyanobilin (PCB)",
                "Phycoerythrobilin (PEB)",
                "Urobilin (UBN)",
                "Stercobilin (SBN)",
                "Cobalamin (Vitamin B12)",
                "Pheophytin a",
                "Pheophytin b",
                "Protochlorophyllide",
                "Bacteriochlorophyll a",
                "Bacteriochlorophyll b",
                "Bacteriochlorophyll c",
                "Bacteriochlorophyll e"
            ],
            "mismatches": [
                "Phycourobilin (PUB)",
                "Protoporphyrin IX (PPIX)",
                "Bilichrome",
                "Phylloerythrin",
                "Bacteriochlorophyll d"
            ],
            "true_referents": [
                "(-)-stercobilin",
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(4S,10Z,16R)-phycourobilin",
                "Chlorophyll c",
                "D-Urobilin",
                "Deuteroporphyrin IX",
                "PHYCOVIOLOBILIN",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "biladiene",
                "biladiene-ab",
                "biladiene-ac",
                "biliverdin",
                "biliverdin beta",
                "biliverdin delta",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll d",
                "chlorophyll f",
                "cobalamin",
                "heme",
                "methylcobalamin",
                "pheophytin",
                "pheophytin a",
                "pheophytin b",
                "phycocyanobilin",
                "phycoerythrobilin",
                "phycourobilin-bis-L-cysteine",
                "protochlorophyllide",
                "protoporphyrin",
                "protoporphyrins",
                "stercobilin",
                "stercobilinogen",
                "urobilin",
                "urobilinogen"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Heme (C1)",
            "Chlorophyll a (C2)",
            "Chlorophyll b (C3)",
            "Myoglobin (C4)",
            "Hemoglobin (C5)",
            "Cytochrome c (C6)",
            "Cobalamin (Vitamin B12) (C7)",
            "Porphyrin (C8)",
            "Biliverdin (C9)",
            "Bilirubin (C10)",
            "Vitamin B6 (Pyridoxal) (C11)",
            "Uroporphyrin (C12)",
            "Protoporphyrin IX (C13)",
            "Hemin (C14)",
            "Chlorophyll c (C15)",
            "Chlorophyll d (C16)",
            "Bacteriochlorophyll a (C17)",
            "Bacteriochlorophyll b (C18)",
            "Bacteriochlorophyll c (C19)",
            "Bacteriochlorophyll d (C20)",
            "Bacteriochlorophyll e (C21)",
            "Hematoporphyrin (C22)",
            "Manganese porphyrin (C23)",
            "Zinc protoporphyrin (C24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cobalamin (Vitamin B12) (C7)",
                "Porphyrin (C8)",
                "Biliverdin (C9)",
                "Uroporphyrin (C12)",
                "Hemin (C14)",
                "Chlorophyll c (C15)",
                "Chlorophyll d (C16)",
                "Bacteriochlorophyll a (C17)",
                "Bacteriochlorophyll b (C18)",
                "Bacteriochlorophyll c (C19)",
                "Bacteriochlorophyll e (C21)",
                "Hematoporphyrin (C22)",
                "Zinc protoporphyrin (C24)"
            ],
            "mismatches": [
                "Heme (C1)",
                "Chlorophyll a (C2)",
                "Chlorophyll b (C3)",
                "Myoglobin (C4)",
                "Hemoglobin (C5)",
                "Cytochrome c (C6)",
                "Bilirubin (C10)",
                "Vitamin B6 (Pyridoxal) (C11)",
                "Protoporphyrin IX (C13)",
                "Bacteriochlorophyll d (C20)",
                "Manganese porphyrin (C23)"
            ],
            "true_referents": [
                "(E,E)-bilirubin",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "Deuteroporphyrin IX",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll c2",
                "chlorophyll d",
                "cobalamin",
                "cobalt(II)-factor IV",
                "cytoporphyrin",
                "hematoporphyrin",
                "heme a",
                "heme b",
                "heme-cysteine",
                "hemin",
                "magnesium porphyrin",
                "methylcobalamin",
                "porphyrin",
                "protoporphyrin",
                "protoporphyrins",
                "uroporphyrin",
                "uroporphyrin I",
                "uroporphyrinogen",
                "zinc protoporphyrin"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Heme (Hm)",
            "Chlorophyll (Chl)",
            "Cobalamin (Cbl)",
            "Phycocyanobilin (PCB)",
            "Phycoerythrobilin (PEB)",
            "Phytochromobilin (P\u03a6B)",
            "Urobilinogen (Uro)",
            "Biliverdin (Bv)",
            "Cytochrome c (Cyt c)",
            "Cytochrome b (Cyt b)",
            "Cytochrome a (Cyt a)",
            "Cytochrome f (Cyt f)",
            "Cytochrome c1 (Cyt c1)",
            "Cytochrome b6 (Cyt b6)",
            "Cytochrome a3 (Cyt a3)",
            "Cytochrome c3 (Cyt c3)",
            "Cytochrome b5 (Cyt b5)",
            "Cytochrome P450 (CYP)",
            "Protoporphyrin IX (PPIX)",
            "Hemoglobin (Hb)",
            "Myoglobin (Mb)",
            "Catalase (Cat)",
            "Peroxidase (Prx)",
            "Hydrogenobyrinic acid (Hba)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heme (Hm)",
                "Chlorophyll (Chl)",
                "Cobalamin (Cbl)",
                "Phycocyanobilin (PCB)",
                "Phycoerythrobilin (PEB)",
                "Phytochromobilin (P\u03a6B)",
                "Urobilinogen (Uro)",
                "Biliverdin (Bv)",
                "Hydrogenobyrinic acid (Hba)"
            ],
            "mismatches": [
                "Cytochrome c (Cyt c)",
                "Cytochrome b (Cyt b)",
                "Cytochrome a (Cyt a)",
                "Cytochrome f (Cyt f)",
                "Cytochrome c1 (Cyt c1)",
                "Cytochrome b6 (Cyt b6)",
                "Cytochrome a3 (Cyt a3)",
                "Cytochrome c3 (Cyt c3)",
                "Cytochrome b5 (Cyt b5)",
                "Cytochrome P450 (CYP)",
                "Protoporphyrin IX (PPIX)",
                "Hemoglobin (Hb)",
                "Myoglobin (Mb)",
                "Catalase (Cat)",
                "Peroxidase (Prx)"
            ],
            "true_referents": [
                "(-)-stercobilin",
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(3E)-phytochromobilin",
                "(3Z)-phytochromobilin",
                "D-Urobilinogen",
                "Deuteroporphyrin IX",
                "Fe-coproporphyrin III",
                "S-phycoerythrobilin-L-cysteine",
                "biliverdin",
                "biliverdin beta",
                "biliverdin delta",
                "chlorophyll",
                "chlorophyll a",
                "chlorophyll c1",
                "chlorophyll f",
                "cobalamin",
                "cobalamins",
                "coproporphyrin III",
                "cytoporphyrin",
                "heme",
                "heme a",
                "heme b",
                "heme-cysteine",
                "hydrogenobyrinic acid",
                "hydrogenobyrinic acid a,c-diamide",
                "metalloporphyrin",
                "phycocyanobilin",
                "phycoerythrobilin",
                "phytochromobilin",
                "porphyrin",
                "protoporphyrin",
                "protoporphyrins",
                "urobilin",
                "urobilinogen"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Chlorophyll",
            "Heme",
            "Bilirubin",
            "Melanin",
            "Phycocyanin",
            "Phycoerythrin",
            "Phytochrome",
            "Phytoene",
            "Phytofluene",
            "Astaxanthin",
            "Lycopene",
            "Beta-carotene",
            "Zeaxanthin",
            "Lutein",
            "Canthaxanthin",
            "Crocin",
            "Safranal",
            "Bixin",
            "Norbixin",
            "Curcumin",
            "Indigo",
            "Indirubin",
            "Carmine",
            "Erythritol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chlorophyll",
                "Heme"
            ],
            "mismatches": [
                "Bilirubin",
                "Melanin",
                "Phycocyanin",
                "Phycoerythrin",
                "Phytochrome",
                "Phytoene",
                "Phytofluene",
                "Astaxanthin",
                "Lycopene",
                "Beta-carotene",
                "Zeaxanthin",
                "Lutein",
                "Canthaxanthin",
                "Crocin",
                "Safranal",
                "Bixin",
                "Norbixin",
                "Curcumin",
                "Indigo",
                "Indirubin",
                "Carmine",
                "Erythritol"
            ],
            "true_referents": [
                "(-)-stercobilin",
                "(-)-stercobilinogen",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(3E)-phytochromobilin",
                "(3Z)-phytochromobilin",
                "(E,E)-bilirubin",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "S-phycoerythrobilin-L-cysteine",
                "Zincphyrin",
                "anaerobilin",
                "bilin",
                "bilins",
                "biliverdin",
                "chlorin",
                "chlorophyll",
                "chlorophyll a",
                "chlorophyll f",
                "corrole",
                "heme",
                "mesobilirubin IXalpha",
                "pheophorbide",
                "pheophorbide a",
                "pheophorbide b",
                "phlorin",
                "phycocyanobilin",
                "phycoerythrobilin",
                "phytochromobilin",
                "porfimer",
                "stercobilin"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Porphyrin",
            "Heme (heme b)",
            "Cytochrome c",
            "Chlorophyll a",
            "Chlorophyll b",
            "Biliverdin",
            "Bilirubin",
            "Protoporphyrin IX",
            "Uroporphyrin",
            "Coproporphyrin",
            "Hemoglobin",
            "Myoglobin",
            "Cobalamin (Vitamin B12)",
            "Siroheme",
            "Bacteriochlorophyll a",
            "Bacteriochlorophyll b",
            "Phycocyanobilin",
            "Phycoerythrobilin",
            "F430",
            "Ferriprotoporphyrin",
            "Mesoheme",
            "Hematin",
            "Phyllobilins",
            "Verteporphyrin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Porphyrin",
                "Chlorophyll a",
                "Chlorophyll b",
                "Biliverdin",
                "Siroheme",
                "Bacteriochlorophyll a",
                "Bacteriochlorophyll b",
                "Phycocyanobilin",
                "Phycoerythrobilin",
                "Hematin"
            ],
            "mismatches": [
                "Heme (heme b)",
                "Cytochrome c",
                "Bilirubin",
                "Protoporphyrin IX",
                "Uroporphyrin",
                "Coproporphyrin",
                "Hemoglobin",
                "Myoglobin",
                "Cobalamin (Vitamin B12)",
                "F430",
                "Ferriprotoporphyrin",
                "Mesoheme",
                "Phyllobilins",
                "Verteporphyrin"
            ],
            "true_referents": [
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(E,E)-bilirubin",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "Deuteroporphyrin IX",
                "LSM-4252",
                "LSM-5035",
                "PHYCOVIOLOBILIN",
                "S-phycoerythrobilin-L-cysteine",
                "anaerobilin",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll a",
                "chlorophyll b",
                "chloroporphyrin",
                "cobalamin",
                "coenzyme F430",
                "coproporphyrin",
                "coproporphyrin III",
                "coproporphyrinogen",
                "cytoporphyrin",
                "ferroheme",
                "hematin",
                "heme b",
                "heme-amino acid",
                "mesoporphyrin IX",
                "metalloporphyrin",
                "metalloprotoporphyrin",
                "methylcobalamin",
                "mycobilin a",
                "phycocyanobilin",
                "phycoerythrobilin",
                "porphyrin",
                "protoporphyrin",
                "siroheme",
                "uroporphyrin",
                "uroporphyrin I",
                "uroporphyrin III"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Chlorophyll a (Chl a)",
            "Chlorophyll b (Chl b)",
            "Chlorophyll c (Chl c)",
            "Chlorophyll d (Chl d)",
            "Chlorophyll f (Chl f)",
            "Bacteriochlorophyll a (BChl a)",
            "Bacteriochlorophyll b (BChl b)",
            "Bacteriochlorophyll c (BChl c)",
            "Bacteriochlorophyll d (BChl d)",
            "Bacteriochlorophyll e (BChl e)",
            "Bacteriochlorophyll g (BChl g)",
            "Heme",
            "Hemoglobin",
            "Myoglobin",
            "Cytochrome c",
            "Phytochrome",
            "Phycocyanin",
            "Phycoerythrin",
            "Bilirubin",
            "Biliverdin",
            "Porphyrin",
            "Protoporphyrin IX",
            "Uroporphyrin",
            "Coproporphyrin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chlorophyll a (Chl a)",
                "Chlorophyll b (Chl b)",
                "Chlorophyll c (Chl c)",
                "Chlorophyll d (Chl d)",
                "Chlorophyll f (Chl f)",
                "Bacteriochlorophyll a (BChl a)",
                "Bacteriochlorophyll b (BChl b)",
                "Bacteriochlorophyll c (BChl c)",
                "Bacteriochlorophyll e (BChl e)",
                "Heme",
                "Biliverdin",
                "Porphyrin",
                "Uroporphyrin",
                "Coproporphyrin"
            ],
            "mismatches": [
                "Bacteriochlorophyll d (BChl d)",
                "Bacteriochlorophyll g (BChl g)",
                "Hemoglobin",
                "Myoglobin",
                "Cytochrome c",
                "Phytochrome",
                "Phycocyanin",
                "Phycoerythrin",
                "Bilirubin",
                "Protoporphyrin IX"
            ],
            "true_referents": [
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(3E)-phytochromobilin",
                "(3Z)-phytochromobilin",
                "(E,E)-bilirubin",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "Deuteroporphyrin IX",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "bacteriochlorophyllide g",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll d",
                "chlorophyll f",
                "chloroporphyrin",
                "coproporphyrin",
                "coproporphyrin III",
                "coproporphyrinogen",
                "cytoporphyrin",
                "heme",
                "heme b",
                "heme-amino acid",
                "mesoporphyrin IX",
                "metalloporphyrin",
                "phycocyanobilin",
                "phycoerythrobilin",
                "phytochromobilin",
                "porphyrin",
                "protoporphyrin",
                "uroporphyrin",
                "uroporphyrin I",
                "uroporphyrin III"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Bilirubin",
            "Biliverdin",
            "Chlorophyll a",
            "Chlorophyll b",
            "Chlorophyll c1",
            "Chlorophyll c2",
            "Chlorophyll d",
            "Chlorophyll f",
            "Bacteriochlorophyll a",
            "Bacteriochlorophyll b",
            "Bacteriochlorophyll c",
            "Bacteriochlorophyll d",
            "Bacteriochlorophyll e",
            "Bacteriochlorophyll g",
            "Heme b",
            "Heme a",
            "Heme c",
            "Heme d1",
            "Heme o",
            "Cobalamin (Vitamin B12)",
            "Coenzyme F430",
            "Siroheme",
            "Phycocyanobilin",
            "Phycoerythrobilin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Biliverdin",
                "Chlorophyll a",
                "Chlorophyll b",
                "Chlorophyll c1",
                "Chlorophyll c2",
                "Chlorophyll d",
                "Chlorophyll f",
                "Bacteriochlorophyll a",
                "Bacteriochlorophyll b",
                "Bacteriochlorophyll e",
                "Heme b",
                "Heme a",
                "Heme o",
                "Cobalamin (Vitamin B12)",
                "Coenzyme F430",
                "Siroheme",
                "Phycocyanobilin",
                "Phycoerythrobilin"
            ],
            "mismatches": [
                "Bilirubin",
                "Bacteriochlorophyll d",
                "Bacteriochlorophyll g",
                "Heme c",
                "Heme d1"
            ],
            "true_referents": [
                "(2R)-phycocyanobilin",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(E,E)-bilirubin",
                "15,17(3)-seco-F430-17(3)-acid",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "bacteriochlorophyllide g",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll c2",
                "chlorophyll d",
                "chlorophyll f",
                "cobalamin",
                "coenzyme F430",
                "heme a",
                "heme b",
                "heme o",
                "methylcobalamin",
                "phycocyanobilin",
                "phycoerythrobilin",
                "siroheme"
            ],
            "TP": 18,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Chlorophyll (Chl)",
            "Heme",
            "Cytochrome c",
            "Vitamin B12",
            "Bilirubin",
            "Biliverdin",
            "Phycobilins",
            "Phycoerythrin",
            "Phycocyanin",
            "Allophycocyanin",
            "Sirohydrochlorin",
            "Coenzyme F430",
            "Isobacteriochlorins",
            "Bacteriochlorophyll",
            "Chlorophyll d",
            "Chlorophyll f",
            "Pheophytin a",
            "Pheophytin b",
            "Pyropheophytin a",
            "Pyropheophytin b",
            "Protochlorophyllide",
            "Chlorophyllide a",
            "Chlorophyllide b",
            "Hematoporphyrin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heme",
                "Biliverdin",
                "Isobacteriochlorins",
                "Bacteriochlorophyll",
                "Chlorophyll d",
                "Chlorophyll f",
                "Pheophytin a",
                "Pheophytin b",
                "Pyropheophytin b",
                "Protochlorophyllide",
                "Chlorophyllide a",
                "Chlorophyllide b",
                "Hematoporphyrin",
                "Coenzyme F430"
            ],
            "mismatches": [
                "Chlorophyll (Chl)",
                "Cytochrome c",
                "Vitamin B12",
                "Bilirubin",
                "Phycobilins",
                "Phycoerythrin",
                "Phycocyanin",
                "Allophycocyanin",
                "Sirohydrochlorin",
                "Pyropheophytin a"
            ],
            "true_referents": [
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(E,E)-bilirubin",
                "132-hydroxy-(132-S)-phaeophytin A",
                "15,17(3)-seco-F430-17(3)-acid",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "PHYCOVIOLOBILIN",
                "Pyropheophytin b",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll",
                "bacteriochlorophyll c",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll",
                "chlorophyll d",
                "chlorophyll f",
                "chlorophyllide a",
                "chlorophyllide b",
                "cobalamin",
                "cobalt-sirohydrochlorin",
                "coenzyme F430",
                "cytoporphyrin",
                "hematoporphyrin",
                "heme",
                "isobacteriochlorin",
                "isobacteriochlorins",
                "methylcobalamin",
                "pheophytin",
                "pheophytin a",
                "pheophytin b",
                "phycocyanobilin",
                "phycoerythrobilin",
                "porphyrin",
                "protochlorophyllide",
                "pyropheophorbide a",
                "sirohydrochlorin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Chlorophyll a (Chl a)",
            "Chlorophyll b (Chl b)",
            "Heme",
            "Vitamin B12 (Cobalamin)",
            "Cytochrome c",
            "Protoporphyrin IX",
            "Bilirubin",
            "Biliverdin",
            "Phycoerythrin",
            "Phycocyanin",
            "Hemoglobin",
            "Myoglobin",
            "Catalase",
            "Peroxidase",
            "Cytochrome P450",
            "Ferredoxin",
            "Siroheme",
            "Coenzyme F430",
            "Corrin",
            "Chlorophyll c1 (Chl c1)",
            "Chlorophyll c2 (Chl c2)",
            "Chlorophyll d (Chl d)",
            "Chlorophyll f (Chl f)",
            "Bacteriochlorophyll a (Bchl a)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chlorophyll a (Chl a)",
                "Chlorophyll b (Chl b)",
                "Heme",
                "Vitamin B12 (Cobalamin)",
                "Biliverdin",
                "Siroheme",
                "Coenzyme F430",
                "Corrin",
                "Chlorophyll c1 (Chl c1)",
                "Chlorophyll c2 (Chl c2)",
                "Chlorophyll d (Chl d)",
                "Chlorophyll f (Chl f)",
                "Bacteriochlorophyll a (Bchl a)"
            ],
            "mismatches": [
                "Cytochrome c",
                "Protoporphyrin IX",
                "Bilirubin",
                "Phycoerythrin",
                "Phycocyanin",
                "Hemoglobin",
                "Myoglobin",
                "Catalase",
                "Peroxidase",
                "Cytochrome P450",
                "Ferredoxin"
            ],
            "true_referents": [
                "(1S)-primary fluorescent chlorophyll catabolite",
                "(3E)-phycocyanobilin",
                "(3E)-phycoerythrobilin",
                "(E,E)-bilirubin",
                "15,17(3)-seco-F430-17(3)-acid",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Biliverdin IX",
                "Chlorophyll c",
                "Deuteroporphyrin IX",
                "S-phycoerythrobilin-L-cysteine",
                "bacteriochlorophyll a",
                "bacteriochlorophyll c",
                "biliverdin",
                "biliverdin beta",
                "chlorophyll",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll c2",
                "chlorophyll d",
                "chlorophyll f",
                "cobalamin",
                "coenzyme F430",
                "corrin",
                "corrins",
                "cytoporphyrin",
                "heme",
                "heme b",
                "heme-amino acid",
                "mesoporphyrin IX",
                "metalloporphyrin",
                "methylcobalamin",
                "phenylporphyrin",
                "phycocyanobilin",
                "phycoerythrobilin",
                "porphyrin",
                "protoporphyrin",
                "siroheme"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": "[\n    \"Heme (Hb)\", \n    \"Heme (Cytochrome)\", \n    \"Heme (Myoglobin)\", \n    \"Heme (Cytochrome c)\", \n    \"Heme (Cytochrome b)\", \n    \"Heme (Cytochrome oxidase)\", \n    \"Heme (Cytochrome P450)\", \n    \"Heme (Ferritin)\", \n    \"Heme (Hemoglobin)\", \n    \"Heme (Hemocyanin)\", \n    \"Heme (Hemosiderin)\", \n    \"Heme (Lactoferrin)\", \n    \"Heme (Myeloperoxidase)\", \n    \"Heme (Porphyrin)\", \n    \"Heme (Protoporphyrin)\", \n    \"Heme (Sulfhemoglobin)\", \n    \"Heme (Uroporphyrin)\", \n    \"Heme (Vitamin B12)\", \n    \"Heme (Xanthochromic)\", \n    \"Heme (Xanthophyll)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthophylline)\", \n    \"Heme (Xanthoph",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            "Biliverdin (BV)",
            "Bilirubin (BR)",
            "Heme a",
            "Heme b",
            "Heme c",
            "Heme o",
            "Chlorophyll a",
            "Chlorophyll b",
            "Chlorophyll c1",
            "Chlorophyll c2",
            "Chlorophyll d",
            "Bacteriochlorophyll a",
            "Bacteriochlorophyll b",
            "Bacteriochlorophyll c",
            "Bacteriochlorophyll d",
            "Bacteriochlorophyll e",
            "Bacteriochlorophyll f",
            "Pheophytin a",
            "Pheophytin b",
            "Purpurin-18",
            "Purpurin-7",
            "Coproheme III",
            "Coproheme I",
            "Coproheme II"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "biliverdin",
                "heme a",
                "heme b",
                "heme o",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll c2",
                "chlorophyll d",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "pheophytin a",
                "pheophytin b"
            ],
            "mismatches": [
                "bilirubin (BR)",
                "heme c",
                "bacteriochlorophyll d",
                "bacteriochlorophyll f",
                "purpurin-18",
                "purpurin-7",
                "coproheme III",
                "coproheme I",
                "coproheme II"
            ],
            "true_referents": [
                "(E,E)-bilirubin",
                "15-oxo-beta-bilirubin",
                "5-oxo-delta-bilirubin",
                "Coproporphyrin II",
                "D-Urobilin",
                "bacteriochlorophyll a",
                "bacteriochlorophyll b",
                "bacteriochlorophyll c",
                "bacteriochlorophyll e",
                "bacteriochlorophyllide d",
                "bacteriochlorophyllide f",
                "biliverdin",
                "biliverdin beta",
                "biliverdin delta",
                "chlorophyll a",
                "chlorophyll b",
                "chlorophyll c1",
                "chlorophyll c2",
                "chlorophyll d",
                "coproporphyrin",
                "coproporphyrin I",
                "coproporphyrin III",
                "coproporphyrinogen",
                "coproporphyrinogen I",
                "coproporphyrinogen III",
                "ferriheme a3",
                "heme a",
                "heme b",
                "heme o",
                "pheophytin",
                "pheophytin a",
                "pheophytin b",
                "precorrin-7",
                "urobilin",
                "uroporphyrinogen I"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "tetrapyrrole",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "heme",
                "Canonical Name": "Heme"
            },
            {
                "Referent": "chlorophyll",
                "Canonical Name": "Chlorophyll"
            },
            {
                "Referent": "bilirubin",
                "Canonical Name": "Bilirubin"
            },
            {
                "Referent": "cytochrome c",
                "Canonical Name": "Cytochrome c"
            },
            {
                "Referent": "hemoglobin",
                "Canonical Name": "Hemoglobin"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            },
            {
                "Referent": "catalase",
                "Canonical Name": "Catalase"
            },
            {
                "Referent": "tyrosinase",
                "Canonical Name": "Tyrosinase"
            },
            {
                "Referent": "lipoxygenase",
                "Canonical Name": "Lipoxygenase"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "heme",
                "chlorophyll"
            ],
            "mismatches": [
                "bilirubin",
                "cytochrome c",
                "hemoglobin",
                "catalase",
                "tyrosinase",
                "lipoxygenase"
            ],
            "true_referents": [
                "(E,E)-bilirubin",
                "4E,15Z-bilirubin IXa",
                "5-oxo-delta-bilirubin",
                "7(1)-hydroxychlorophyll a",
                "chlorophyll",
                "heme",
                "heme b",
                "heme-cysteine"
            ],
            "TP": 2,
            "FP": 6,
            "FN": 0
        }
    }
]