[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "erythroblast (EB)",
            "normoblast",
            "reticulocyte (Ret)",
            "erythrocyte (RBC)",
            "orthochromatic erythroblast",
            "prorhombroid erythroblast",
            "basophilic erythroblast",
            "polychromatophilic erythroblast",
            "karyorrhexis erythroblast",
            "erythroid colony forming unit (CFU-E)",
            "proerythroblast",
            "basophilic normoblast",
            "polychromatophilic normoblast",
            "orthochromatic normoblast",
            "erythrocyte progenitor cell",
            "erythroid burst forming unit (BFU-E)",
            "erythroid precursor cell",
            "erythrocyte stem cell",
            "erythroid-committed progenitor",
            "erythroid progenitor",
            "erythroid-committed cell",
            "erythroid-committed precursor cell",
            "erythroid-committed stem cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "erythroblast (EB)",
                "normoblast",
                "reticulocyte (Ret)",
                "erythrocyte (RBC)",
                "orthochromatic erythroblast",
                "prorhombroid erythroblast",
                "basophilic erythroblast",
                "polychromatophilic erythroblast",
                "karyorrhexis erythroblast",
                "erythroid colony forming unit (CFU-E)",
                "proerythroblast",
                "basophilic normoblast",
                "polychromatophilic normoblast",
                "orthochromatic normoblast",
                "erythrocyte progenitor cell",
                "erythroid burst forming unit (BFU-E)",
                "erythroid precursor cell",
                "erythrocyte stem cell",
                "erythroid-committed progenitor",
                "erythroid progenitor",
                "erythroid-committed cell",
                "erythroid-committed precursor cell",
                "erythroid-committed stem cell"
            ],
            "mismatches": [],
            "true_referents": [
                "basophilic erythroblast",
                "basophilic normoblast",
                "erythroblast (EB)",
                "erythrocyte (RBC)",
                "erythrocyte progenitor cell",
                "erythrocyte stem cell",
                "erythroid burst forming unit (BFU-E)",
                "erythroid colony forming unit (CFU-E)",
                "erythroid precursor cell",
                "erythroid progenitor",
                "erythroid-committed cell",
                "erythroid-committed precursor cell",
                "erythroid-committed progenitor",
                "erythroid-committed stem cell",
                "karyorrhexis erythroblast",
                "normoblast",
                "orthochromatic erythroblast",
                "orthochromatic normoblast",
                "polychromatophilic erythroblast",
                "polychromatophilic normoblast",
                "proerythroblast",
                "prorhombroid erythroblast",
                "reticulocyte (Ret)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Proerythroblast (Basophilic erythroblast)",
            "Basophilic erythroblast",
            "Polychromatic erythroblast",
            "Orthochromatic erythroblast (Normoblast)",
            "Reticulocyte",
            "Mature erythrocyte (Red blood cell)",
            "Erythroid progenitor cell",
            "Erythroid burst-forming unit (BFU-E)",
            "Erythroid colony-forming unit (CFU-E)",
            "Early erythroid progenitor",
            "Late erythroid progenitor",
            "Erythrocyte precursor cell",
            "Erythroblast",
            "Nucleated red blood cell",
            "Immature red blood cell",
            "Erythrocyte precursor",
            "Erythrocyte stem cell",
            "Erythroid stem cell",
            "Erythrocyte progenitor cell",
            "Erythrocyte precursor stage",
            "Erythrocyte lineage cell",
            "Erythroid lineage cell",
            "Reticulocyte stage cell",
            "Mature erythrocyte stage cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Proerythroblast (Basophilic erythroblast)",
                "Basophilic erythroblast",
                "Polychromatic erythroblast",
                "Orthochromatic erythroblast (Normoblast)",
                "Reticulocyte",
                "Mature erythrocyte (Red blood cell)",
                "Erythroid progenitor cell",
                "Erythroid burst-forming unit (BFU-E)",
                "Erythroid colony-forming unit (CFU-E)",
                "Early erythroid progenitor",
                "Late erythroid progenitor",
                "Erythrocyte precursor cell",
                "Erythroblast",
                "Nucleated red blood cell",
                "Immature red blood cell",
                "Erythrocyte precursor",
                "Erythrocyte stem cell",
                "Erythroid stem cell",
                "Erythrocyte progenitor cell",
                "Erythrocyte precursor stage",
                "Erythrocyte lineage cell",
                "Erythroid lineage cell",
                "Reticulocyte stage cell",
                "Mature erythrocyte stage cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic erythroblast",
                "Early erythroid progenitor",
                "Erythroblast",
                "Erythrocyte lineage cell",
                "Erythrocyte precursor",
                "Erythrocyte precursor cell",
                "Erythrocyte precursor stage",
                "Erythrocyte progenitor cell",
                "Erythrocyte stem cell",
                "Erythroid burst-forming unit (BFU-E)",
                "Erythroid colony-forming unit (CFU-E)",
                "Erythroid lineage cell",
                "Erythroid progenitor cell",
                "Erythroid stem cell",
                "Immature red blood cell",
                "Late erythroid progenitor",
                "Mature erythrocyte (Red blood cell)",
                "Mature erythrocyte stage cell",
                "Nucleated red blood cell",
                "Orthochromatic erythroblast (Normoblast)",
                "Polychromatic erythroblast",
                "Proerythroblast (Basophilic erythroblast)",
                "Reticulocyte",
                "Reticulocyte stage cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Erythroblast (Proerythroblast)",
            "Basophilic Erythroblast",
            "Polychromatophilic Erythroblast",
            "Orthochromatic Erythroblast",
            "Reticulocyte",
            "Normoblast",
            "Erythrocyte",
            "Megakaryocyte Erythroid Progenitor",
            "Common Myeloid Progenitor",
            "Erythroid Colony-Forming Unit",
            "Burst-Forming Unit-Erythroid",
            "Colony-Forming Unit-Erythroid",
            "Erythroid Progenitor Cell",
            "Erythroid Blast",
            "Erythroid Precursor",
            "Erythroid Colony",
            "Erythroid Burst",
            "Erythroid Colony-Forming Unit (CFU-E)",
            "Erythroid Progenitor (EP)",
            "Erythroid Colony-Forming Unit (CFU-E)",
            "Erythroid Blast Forming Unit (BFU-E)",
            "Erythroid Colony-Forming Unit (CFU-E)",
            "Erythroid Blast",
            "Erythroid Precursor"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythroblast (Proerythroblast)",
                "Basophilic Erythroblast",
                "Polychromatophilic Erythroblast",
                "Orthochromatic Erythroblast",
                "Reticulocyte",
                "Normoblast",
                "Erythrocyte",
                "Megakaryocyte Erythroid Progenitor",
                "Common Myeloid Progenitor",
                "Erythroid Colony-Forming Unit",
                "Burst-Forming Unit-Erythroid",
                "Colony-Forming Unit-Erythroid",
                "Erythroid Progenitor Cell",
                "Erythroid Blast",
                "Erythroid Precursor",
                "Erythroid Colony",
                "Erythroid Burst",
                "Erythroid Colony-Forming Unit (CFU-E)",
                "Erythroid Progenitor (EP)",
                "Erythroid Blast Forming Unit (BFU-E)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic Erythroblast",
                "Burst-Forming Unit-Erythroid",
                "Colony-Forming Unit-Erythroid",
                "Common Myeloid Progenitor",
                "Erythroblast (Proerythroblast)",
                "Erythrocyte",
                "Erythroid Blast",
                "Erythroid Blast Forming Unit (BFU-E)",
                "Erythroid Burst",
                "Erythroid Colony",
                "Erythroid Colony-Forming Unit",
                "Erythroid Colony-Forming Unit (CFU-E)",
                "Erythroid Precursor",
                "Erythroid Progenitor (EP)",
                "Erythroid Progenitor Cell",
                "Megakaryocyte Erythroid Progenitor",
                "Normoblast",
                "Orthochromatic Erythroblast",
                "Polychromatophilic Erythroblast",
                "Reticulocyte"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Proerythroblast (ProE)",
            "Basophilic Erythroblast (BasoE)",
            "Polychromatic Erythroblast (PolyE)",
            "Orthochromatic Erythroblast (OrthoE)",
            "Reticulocyte (Ret)",
            "Erythrocyte (RBC)",
            "Erythroblast CFU-E (CFU-E)",
            "Erythroblast BFU-E (BFU-E)",
            "Erythroblast Progenitor Cell",
            "Erythrocyte Precursor Cell",
            "Normoblast (general term for erythroblasts)",
            "Hemoglobin-containing Erythroblast",
            "Enucleated Erythrocyte Precursor",
            "Late Erythroblast",
            "Early Erythroblast",
            "Anucleate Reticulocyte",
            "Mature Erythrocyte",
            "Human Erythrocyte",
            "Mouse Erythrocyte",
            "Chicken Erythrocyte",
            "Fetal Erythroblast",
            "Adult Erythroblast",
            "Erythrocyte Ghost Cell",
            "Spherocyte (abnormal RBC)",
            "Poikilocytic Erythrocyte (abnormal RBC shape)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Proerythroblast (ProE)",
                "Basophilic Erythroblast (BasoE)",
                "Polychromatic Erythroblast (PolyE)",
                "Orthochromatic Erythroblast (OrthoE)",
                "Reticulocyte (Ret)",
                "Erythrocyte (RBC)",
                "Erythroblast CFU-E (CFU-E)",
                "Erythroblast BFU-E (BFU-E)",
                "Erythroblast Progenitor Cell",
                "Erythrocyte Precursor Cell",
                "Normoblast (general term for erythroblasts)",
                "Hemoglobin-containing Erythroblast",
                "Enucleated Erythrocyte Precursor",
                "Late Erythroblast",
                "Early Erythroblast",
                "Anucleate Reticulocyte",
                "Mature Erythrocyte",
                "Human Erythrocyte",
                "Mouse Erythrocyte",
                "Chicken Erythrocyte",
                "Fetal Erythroblast",
                "Adult Erythroblast",
                "Erythrocyte Ghost Cell",
                "Spherocyte (abnormal RBC)"
            ],
            "mismatches": [
                "Poikilocytic Erythrocyte (abnormal RBC shape)"
            ],
            "true_referents": [
                "Adult Erythroblast",
                "Anucleate Reticulocyte",
                "Basophilic Erythroblast (BasoE)",
                "Chicken Erythrocyte",
                "Early Erythroblast",
                "Enucleated Erythrocyte Precursor",
                "Erythroblast BFU-E (BFU-E)",
                "Erythroblast CFU-E (CFU-E)",
                "Erythroblast Progenitor Cell",
                "Erythrocyte (RBC)",
                "Erythrocyte Ghost Cell",
                "Erythrocyte Precursor Cell",
                "Fetal Erythroblast",
                "Hemoglobin-containing Erythroblast",
                "Human Erythrocyte",
                "Late Erythroblast",
                "Mature Erythrocyte",
                "Mouse Erythrocyte",
                "Normoblast (general term for erythroblasts)",
                "Orthochromatic Erythroblast (OrthoE)",
                "Polychromatic Erythroblast (PolyE)",
                "Proerythroblast (ProE)",
                "Reticulocyte (Ret)",
                "Spherocyte (abnormal RBC)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Erythroblast",
            "Proerythroblast",
            "Basophilic erythroblast",
            "Polychromatic erythroblast",
            "Orthochromatic erythroblast",
            "Reticulocyte",
            "Normoblast",
            "Pronormoblast",
            "Rubriblast",
            "Prorubricyte",
            "Basophilic normoblast",
            "Polychromatophilic normoblast",
            "Orthochromatophilic normoblast",
            "Erythrocyte",
            "Colony-forming unit-erythroid (CFU-E)",
            "Burst-forming unit-erythroid (BFU-E)",
            "Hemocytoblast",
            "Erythroid progenitor cell",
            "Erythroid precursor cell",
            "Erythroid stem cell",
            "Erythroid lineage cell",
            "Late erythroblast",
            "Early erythroblast",
            "Intermediate erythroblast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythroblast",
                "Proerythroblast",
                "Basophilic erythroblast",
                "Polychromatic erythroblast",
                "Orthochromatic erythroblast",
                "Reticulocyte",
                "Normoblast",
                "Pronormoblast",
                "Rubriblast",
                "Prorubricyte",
                "Basophilic normoblast",
                "Polychromatophilic normoblast",
                "Orthochromatophilic normoblast",
                "Erythrocyte",
                "Colony-forming unit-erythroid (CFU-E)",
                "Burst-forming unit-erythroid (BFU-E)",
                "Hemocytoblast",
                "Erythroid progenitor cell",
                "Erythroid precursor cell",
                "Erythroid stem cell",
                "Erythroid lineage cell",
                "Late erythroblast",
                "Early erythroblast",
                "Intermediate erythroblast"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic erythroblast",
                "Basophilic normoblast",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Early erythroblast",
                "Erythroblast",
                "Erythrocyte",
                "Erythroid lineage cell",
                "Erythroid precursor cell",
                "Erythroid progenitor cell",
                "Erythroid stem cell",
                "Hemocytoblast",
                "Intermediate erythroblast",
                "Late erythroblast",
                "Normoblast",
                "Orthochromatic erythroblast",
                "Orthochromatophilic normoblast",
                "Polychromatic erythroblast",
                "Polychromatophilic normoblast",
                "Proerythroblast",
                "Pronormoblast",
                "Prorubricyte",
                "Reticulocyte",
                "Rubriblast"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Proerythroblast (PE)",
            "Basophilic Erythroblast (BE)",
            "Polychromatic Erythroblast (PE)",
            "Orthochromatic Erythroblast (OE)",
            "Reticulocyte (RE)",
            "Erythrocyte (E)",
            "Hemocytoblast (HC)",
            "Erythroid Colony-forming Unit (CFU-E)",
            "Erythroid Progenitor Cell (EPC)",
            "Myeloid Progenitor Cell (MPC)",
            "Burst-forming Unit Erythroid (BFU-E)",
            "Erythrocyte Precursor Cell (EPC)",
            "Mature Erythrocyte (ME)",
            "Erythroblast (EB)",
            "Erythroid Stem Cell (ESC)",
            "Erythroid Lineage Cell (ELC)",
            "Erythrocytic Cell (EC)",
            "Early Erythroblast (EE)",
            "Late Erythroblast (LE)",
            "Erythropoietic Cell (EpC)",
            "Nucleated Red Blood Cell (NRBC)",
            "Immature Erythrocyte (IE)",
            "Erythrocytic Progenitor (EP)",
            "Erythropoiesis-committed Cell (ECC)",
            "Erythrocyte Precursor (EP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Proerythroblast (PE)",
                "Basophilic Erythroblast (BE)",
                "Polychromatic Erythroblast (PE)",
                "Orthochromatic Erythroblast (OE)",
                "Reticulocyte (RE)",
                "Erythrocyte (E)",
                "Hemocytoblast (HC)",
                "Erythroid Colony-forming Unit (CFU-E)",
                "Erythroid Progenitor Cell (EPC)",
                "Myeloid Progenitor Cell (MPC)",
                "Burst-forming Unit Erythroid (BFU-E)",
                "Erythrocyte Precursor Cell (EPC)",
                "Mature Erythrocyte (ME)",
                "Erythroblast (EB)",
                "Erythroid Stem Cell (ESC)",
                "Erythroid Lineage Cell (ELC)",
                "Erythrocytic Cell (EC)",
                "Early Erythroblast (EE)",
                "Late Erythroblast (LE)",
                "Erythropoietic Cell (EpC)",
                "Nucleated Red Blood Cell (NRBC)",
                "Immature Erythrocyte (IE)",
                "Erythrocytic Progenitor (EP)",
                "Erythropoiesis-committed Cell (ECC)"
            ],
            "mismatches": [
                "Erythrocyte Precursor (EP)"
            ],
            "true_referents": [
                "Basophilic Erythroblast (BE)",
                "Burst-forming Unit Erythroid (BFU-E)",
                "Early Erythroblast (EE)",
                "Erythroblast (EB)",
                "Erythrocyte (E)",
                "Erythrocyte Precursor Cell (EPC)",
                "Erythrocytic Cell (EC)",
                "Erythrocytic Progenitor (EP)",
                "Erythroid Colony-forming Unit (CFU-E)",
                "Erythroid Lineage Cell (ELC)",
                "Erythroid Progenitor Cell (EPC)",
                "Erythroid Stem Cell (ESC)",
                "Erythropoiesis-committed Cell (ECC)",
                "Erythropoietic Cell (EpC)",
                "Hemocytoblast (HC)",
                "Immature Erythrocyte (IE)",
                "Late Erythroblast (LE)",
                "Mature Erythrocyte (ME)",
                "Myeloid Progenitor Cell (MPC)",
                "Nucleated Red Blood Cell (NRBC)",
                "Orthochromatic Erythroblast (OE)",
                "Polychromatic Erythroblast (PE)",
                "Proerythroblast (PE)",
                "Reticulocyte (RE)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Proerythroblast (ProE)",
            "Basophilic Erythroblast (BasoE)",
            "Polychromatophilic Erythroblast (PolyE)",
            "Orthochromatic Erythroblast (OrthoE)",
            "Reticulocyte (Retic)",
            "Mature Red Blood Cell (RBC)",
            "Erythroid Progenitor Cell (EPC)",
            "CFU-E (Colony Forming Unit-Erythroid)",
            "BFU-E (Burst Forming Unit-Erythroid)",
            "Multipotent Hematopoietic Stem Cell (HSC)",
            "Common Myeloid Progenitor (CMP)",
            "Megakaryocyte-Erythroid Progenitor (MEP)",
            "Primitive Erythroblast",
            "Erythroid Precursor Cell",
            "Late Basophilic Erythroblast",
            "Late Polychromatophilic Erythroblast",
            "Late Orthochromatic Erythroblast",
            "Early Basophilic Erythroblast",
            "Early Polychromatophilic Erythroblast",
            "Early Orthochromatic Erythroblast",
            "Late Reticulocyte",
            "Early Reticulocyte",
            "Late Erythroblast",
            "Early Erythroblast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Proerythroblast (ProE)",
                "Basophilic Erythroblast (BasoE)",
                "Polychromatophilic Erythroblast (PolyE)",
                "Orthochromatic Erythroblast (OrthoE)",
                "Reticulocyte (Retic)",
                "Mature Red Blood Cell (RBC)",
                "Erythroid Progenitor Cell (EPC)",
                "CFU-E (Colony Forming Unit-Erythroid)",
                "BFU-E (Burst Forming Unit-Erythroid)",
                "Multipotent Hematopoietic Stem Cell (HSC)",
                "Common Myeloid Progenitor (CMP)",
                "Megakaryocyte-Erythroid Progenitor (MEP)",
                "Primitive Erythroblast",
                "Erythroid Precursor Cell",
                "Late Basophilic Erythroblast",
                "Late Polychromatophilic Erythroblast",
                "Late Orthochromatic Erythroblast",
                "Early Basophilic Erythroblast",
                "Early Polychromatophilic Erythroblast",
                "Early Orthochromatic Erythroblast",
                "Late Reticulocyte",
                "Early Reticulocyte",
                "Late Erythroblast",
                "Early Erythroblast"
            ],
            "mismatches": [],
            "true_referents": [
                "BFU-E (Burst Forming Unit-Erythroid)",
                "Basophilic Erythroblast (BasoE)",
                "CFU-E (Colony Forming Unit-Erythroid)",
                "Common Myeloid Progenitor (CMP)",
                "Early Basophilic Erythroblast",
                "Early Erythroblast",
                "Early Orthochromatic Erythroblast",
                "Early Polychromatophilic Erythroblast",
                "Early Reticulocyte",
                "Erythroid Precursor Cell",
                "Erythroid Progenitor Cell (EPC)",
                "Late Basophilic Erythroblast",
                "Late Erythroblast",
                "Late Orthochromatic Erythroblast",
                "Late Polychromatophilic Erythroblast",
                "Late Reticulocyte",
                "Mature Red Blood Cell (RBC)",
                "Megakaryocyte-Erythroid Progenitor (MEP)",
                "Multipotent Hematopoietic Stem Cell (HSC)",
                "Orthochromatic Erythroblast (OrthoE)",
                "Polychromatophilic Erythroblast (PolyE)",
                "Primitive Erythroblast",
                "Proerythroblast (ProE)",
                "Reticulocyte (Retic)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "erythroblast",
            "normoblast",
            "reticulocyte",
            "mature red blood cell",
            "proerythroblast",
            "basophilic erythroblast",
            "polychromatophilic erythroblast",
            "orthochromic erythroblast",
            "nucleated red blood cell",
            "megaloblast",
            "microcyte",
            "spherocyte",
            "ovalocyte",
            "target cell",
            "elliptocyte",
            "schistocyte",
            "acanthocyte",
            "drepanocyte",
            "teardrop cell",
            "stomatocyte",
            "pappenheimer body",
            "heinz body",
            "howell-jolly body",
            "cabot ring"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "erythroblast",
                "normoblast",
                "reticulocyte",
                "mature red blood cell",
                "proerythroblast",
                "basophilic erythroblast",
                "polychromatophilic erythroblast",
                "orthochromic erythroblast",
                "nucleated red blood cell",
                "megaloblast",
                "microcyte",
                "spherocyte",
                "ovalocyte",
                "target cell",
                "elliptocyte",
                "schistocyte",
                "acanthocyte",
                "drepanocyte",
                "teardrop cell",
                "stomatocyte",
                "pappenheimer body",
                "heinz body",
                "howell-jolly body",
                "cabot ring"
            ],
            "mismatches": [],
            "true_referents": [
                "acanthocyte",
                "basophilic erythroblast",
                "cabot ring",
                "drepanocyte",
                "elliptocyte",
                "erythroblast",
                "heinz body",
                "howell-jolly body",
                "mature red blood cell",
                "megaloblast",
                "microcyte",
                "normoblast",
                "nucleated red blood cell",
                "orthochromic erythroblast",
                "ovalocyte",
                "pappenheimer body",
                "polychromatophilic erythroblast",
                "proerythroblast",
                "reticulocyte",
                "schistocyte",
                "spherocyte",
                "stomatocyte",
                "target cell",
                "teardrop cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Hematopoietic stem cell (HSC)",
            "Common myeloid progenitor (CMP)",
            "Megakaryocyte-erythroid progenitor (MEP)",
            "Burst-forming unit-erythroid (BFU-E)",
            "Colony-forming unit-erythroid (CFU-E)",
            "Erythroid progenitor cell",
            "Proerythroblast",
            "Basophilic erythroblast",
            "Polychromatic erythroblast",
            "Orthochromatic erythroblast (Normoblast)",
            "Reticulocyte",
            "Erythrocyte (RBC)",
            "Erythroblast",
            "Normoblast",
            "Erythropoietin-responsive progenitor",
            "Erythroid colony-forming unit (ECFU)",
            "K562 cell line",
            "HEL cell line",
            "Human erythroid progenitor cell",
            "Mouse erythroid progenitor cell",
            "Erythropoietic precursor cell",
            "Late erythroblast",
            "Early erythroblast",
            "Erythroid precursor cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hematopoietic stem cell (HSC)",
                "Common myeloid progenitor (CMP)",
                "Megakaryocyte-erythroid progenitor (MEP)",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Erythroid progenitor cell",
                "Proerythroblast",
                "Basophilic erythroblast",
                "Polychromatic erythroblast",
                "Orthochromatic erythroblast (Normoblast)",
                "Reticulocyte",
                "Erythrocyte (RBC)",
                "Erythroblast",
                "Normoblast",
                "Erythropoietin-responsive progenitor",
                "Erythroid colony-forming unit (ECFU)",
                "K562 cell line",
                "HEL cell line",
                "Human erythroid progenitor cell",
                "Mouse erythroid progenitor cell",
                "Erythropoietic precursor cell",
                "Late erythroblast",
                "Early erythroblast",
                "Erythroid precursor cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic erythroblast",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Common myeloid progenitor (CMP)",
                "Early erythroblast",
                "Erythroblast",
                "Erythrocyte (RBC)",
                "Erythroid colony-forming unit (ECFU)",
                "Erythroid precursor cell",
                "Erythroid progenitor cell",
                "Erythropoietic precursor cell",
                "Erythropoietin-responsive progenitor",
                "HEL cell line",
                "Hematopoietic stem cell (HSC)",
                "Human erythroid progenitor cell",
                "K562 cell line",
                "Late erythroblast",
                "Megakaryocyte-erythroid progenitor (MEP)",
                "Mouse erythroid progenitor cell",
                "Normoblast",
                "Orthochromatic erythroblast (Normoblast)",
                "Polychromatic erythroblast",
                "Proerythroblast",
                "Reticulocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Hematopoietic stem cell (HSC)",
            "Multipotent progenitor cell (MPP)",
            "Common myeloid progenitor (CMP)",
            "Megakaryocyte-erythroid progenitor (MEP)",
            "Burst-forming unit-erythroid (BFU-E)",
            "Colony-forming unit-erythroid (CFU-E)",
            "Proerythroblast",
            "Basophilic erythroblast",
            "Polychromatic erythroblast",
            "Orthochromatic erythroblast",
            "Reticulocyte",
            "Mature erythrocyte (RBC)",
            "Nucleated red blood cell (nRBC)",
            "Erythroid island macrophage",
            "Stress erythroid progenitor (SEP)",
            "Erythroid Kruppel-like factor (EKLF)",
            "Erythropoietin-responsive progenitor cell",
            "Erythroid denucleating cell",
            "Erythroid nuclear extrusion body",
            "Erythroid enucleation",
            "Erythroid mitochondria",
            "Erythroid membrane skeleton",
            "Erythroid spectrin",
            "Erythroid ankyrin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hematopoietic stem cell (HSC)",
                "Multipotent progenitor cell (MPP)",
                "Common myeloid progenitor (CMP)",
                "Megakaryocyte-erythroid progenitor (MEP)",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Proerythroblast",
                "Basophilic erythroblast",
                "Polychromatic erythroblast",
                "Orthochromatic erythroblast",
                "Reticulocyte",
                "Mature erythrocyte (RBC)",
                "Nucleated red blood cell (nRBC)",
                "Erythroid island macrophage",
                "Stress erythroid progenitor (SEP)",
                "Erythroid Kruppel-like factor (EKLF)",
                "Erythropoietin-responsive progenitor cell",
                "Erythroid denucleating cell",
                "Erythroid nuclear extrusion body",
                "Erythroid enucleation",
                "Erythroid mitochondria",
                "Erythroid membrane skeleton",
                "Erythroid spectrin",
                "Erythroid ankyrin"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic erythroblast",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Common myeloid progenitor (CMP)",
                "Erythroid Kruppel-like factor (EKLF)",
                "Erythroid ankyrin",
                "Erythroid denucleating cell",
                "Erythroid enucleation",
                "Erythroid island macrophage",
                "Erythroid membrane skeleton",
                "Erythroid mitochondria",
                "Erythroid nuclear extrusion body",
                "Erythroid spectrin",
                "Erythropoietin-responsive progenitor cell",
                "Hematopoietic stem cell (HSC)",
                "Mature erythrocyte (RBC)",
                "Megakaryocyte-erythroid progenitor (MEP)",
                "Multipotent progenitor cell (MPP)",
                "Nucleated red blood cell (nRBC)",
                "Orthochromatic erythroblast",
                "Polychromatic erythroblast",
                "Proerythroblast",
                "Reticulocyte",
                "Stress erythroid progenitor (SEP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Hematopoietic stem cell (HSC)",
            "Common myeloid progenitor (CMP)",
            "Megakaryocyte-erythrocyte progenitor (MEP)",
            "Burst-forming unit-erythroid (BFU-E)",
            "Colony-forming unit-erythroid (CFU-E)",
            "Proerythroblast",
            "Basophilic erythroblast",
            "Polychromatic erythroblast",
            "Orthochromatic erythroblast",
            "Reticulocyte",
            "Mature red blood cell (Erythrocyte)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hematopoietic stem cell (HSC)",
                "Common myeloid progenitor (CMP)",
                "Megakaryocyte-erythrocyte progenitor (MEP)",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Proerythroblast",
                "Basophilic erythroblast",
                "Polychromatic erythroblast",
                "Orthochromatic erythroblast",
                "Reticulocyte",
                "Mature red blood cell (Erythrocyte)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic erythroblast",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Common myeloid progenitor (CMP)",
                "Hematopoietic stem cell (HSC)",
                "Mature red blood cell (Erythrocyte)",
                "Megakaryocyte-erythrocyte progenitor (MEP)",
                "Orthochromatic erythroblast",
                "Polychromatic erythroblast",
                "Proerythroblast",
                "Reticulocyte"
            ],
            "TP": 11,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Proerythroblast (ProEB)",
            "Basophilic erythroblast (BasoEB)",
            "Polychromatic erythroblast (PolyEB)",
            "Orthochromatic erythroblast (OrthoEB)",
            "Reticulocyte (Retic)",
            "Erythrocyte (RBC)",
            "Burst-forming unit-erythroid (BFU-E)",
            "Colony-forming unit-erythroid (CFU-E)",
            "Erythroid progenitor cell",
            "Erythroid precursor cell",
            "Hematopoietic stem cell (HSC)",
            "Multipotent progenitor cell (MPP)",
            "Common myeloid progenitor (CMP)",
            "Megakaryocyte-erythroid progenitor (MEP)",
            "Erythropoietin-responsive cell",
            "Erythropoietin receptor-expressing cell",
            "Hemoglobin-producing cell",
            "Enucleated cell (in mammals)",
            "Biconcave disc-shaped cell",
            "Anucleate cell (in mammals)",
            "Erythroid burst colony",
            "Erythroid colony-forming cell",
            "Erythroid colony",
            "Erythroid lineage cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Proerythroblast (ProEB)",
                "Basophilic erythroblast (BasoEB)",
                "Polychromatic erythroblast (PolyEB)",
                "Orthochromatic erythroblast (OrthoEB)",
                "Reticulocyte (Retic)",
                "Erythrocyte (RBC)",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Erythroid progenitor cell",
                "Erythroid precursor cell",
                "Hematopoietic stem cell (HSC)",
                "Multipotent progenitor cell (MPP)",
                "Common myeloid progenitor (CMP)",
                "Megakaryocyte-erythroid progenitor (MEP)",
                "Erythropoietin-responsive cell",
                "Erythropoietin receptor-expressing cell",
                "Hemoglobin-producing cell",
                "Enucleated cell (in mammals)",
                "Biconcave disc-shaped cell",
                "Anucleate cell (in mammals)",
                "Erythroid burst colony",
                "Erythroid colony-forming cell",
                "Erythroid colony",
                "Erythroid lineage cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Anucleate cell (in mammals)",
                "Basophilic erythroblast (BasoEB)",
                "Biconcave disc-shaped cell",
                "Burst-forming unit-erythroid (BFU-E)",
                "Colony-forming unit-erythroid (CFU-E)",
                "Common myeloid progenitor (CMP)",
                "Enucleated cell (in mammals)",
                "Erythrocyte (RBC)",
                "Erythroid burst colony",
                "Erythroid colony",
                "Erythroid colony-forming cell",
                "Erythroid lineage cell",
                "Erythroid precursor cell",
                "Erythroid progenitor cell",
                "Erythropoietin receptor-expressing cell",
                "Erythropoietin-responsive cell",
                "Hematopoietic stem cell (HSC)",
                "Hemoglobin-producing cell",
                "Megakaryocyte-erythroid progenitor (MEP)",
                "Multipotent progenitor cell (MPP)",
                "Orthochromatic erythroblast (OrthoEB)",
                "Polychromatic erythroblast (PolyEB)",
                "Proerythroblast (ProEB)",
                "Reticulocyte (Retic)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Erythrocyte (RBC)",
            "Reticulocyte",
            "Normoblast",
            "Proerythroblast",
            "Erythroblast",
            "Polychromatophilic erythroblast",
            "Orthochromatic erythroblast",
            "Erythroid progenitor cell",
            "Erythroid precursor cell",
            "Erythroid stem cell",
            "Erythroid colony-forming unit (CFU-E)",
            "Erythroid burst-forming unit (BFU-E)",
            "Hematopoietic stem cell (HSC)",
            "Myeloid progenitor cell",
            "Myeloid precursor cell",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band neutrophil",
            "Segmented neutrophil",
            "Eosinophil",
            "Basophil",
            "Monocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythrocyte (RBC)",
                "Reticulocyte",
                "Normoblast",
                "Proerythroblast",
                "Erythroblast",
                "Polychromatophilic erythroblast",
                "Orthochromatic erythroblast",
                "Erythroid progenitor cell",
                "Erythroid precursor cell",
                "Erythroid stem cell",
                "Erythroid colony-forming unit (CFU-E)",
                "Erythroid burst-forming unit (BFU-E)",
                "Hematopoietic stem cell (HSC)",
                "Myeloid progenitor cell",
                "Myeloid precursor cell",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band neutrophil",
                "Segmented neutrophil",
                "Eosinophil",
                "Basophil",
                "Monocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Band neutrophil",
                "Basophil",
                "Eosinophil",
                "Erythroblast",
                "Erythrocyte (RBC)",
                "Erythroid burst-forming unit (BFU-E)",
                "Erythroid colony-forming unit (CFU-E)",
                "Erythroid precursor cell",
                "Erythroid progenitor cell",
                "Erythroid stem cell",
                "Hematopoietic stem cell (HSC)",
                "Metamyelocyte",
                "Monocyte",
                "Myeloblast",
                "Myelocyte",
                "Myeloid precursor cell",
                "Myeloid progenitor cell",
                "Normoblast",
                "Orthochromatic erythroblast",
                "Polychromatophilic erythroblast",
                "Proerythroblast",
                "Promyelocyte",
                "Reticulocyte",
                "Segmented neutrophil"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Erythroblast (Erb)",
            "Proerythroblast",
            "Basophilic erythroblast",
            "Polychromatophilic erythroblast",
            "Orthochromatic erythroblast",
            "Reticulocyte",
            "Erythroid progenitor cell",
            "Erythroid precursor cell",
            "Erythroid stem cell",
            "Fetal erythroblast",
            "Fetal erythrocyte",
            "Erythroid colony-forming unit (CFU-E)",
            "Erythroid burst-forming unit (BFU-E)",
            "Erythroid progenitor",
            "Erythroid precursor",
            "Erythroid stem",
            "Erythroid precursor cell of the bone marrow",
            "Erythroid progenitor cell of the bone marrow",
            "Erythroid stem cell of the bone marrow",
            "Fetal erythroid progenitor cell",
            "Fetal erythroid precursor cell",
            "Fetal erythroid stem cell",
            "Erythroid precursor cell of the fetal liver",
            "Erythroid progenitor cell of the fetal liver",
            "Erythroid stem cell of the fetal liver"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Erythroblast (Erb)",
                "Proerythroblast",
                "Basophilic erythroblast",
                "Polychromatophilic erythroblast",
                "Orthochromatic erythroblast",
                "Reticulocyte",
                "Erythroid progenitor cell",
                "Erythroid precursor cell",
                "Erythroid stem cell",
                "Fetal erythroblast",
                "Fetal erythrocyte",
                "Erythroid colony-forming unit (CFU-E)",
                "Erythroid burst-forming unit (BFU-E)",
                "Erythroid progenitor",
                "Erythroid precursor",
                "Erythroid stem",
                "Erythroid precursor cell of the bone marrow",
                "Erythroid progenitor cell of the bone marrow",
                "Erythroid stem cell of the bone marrow",
                "Fetal erythroid progenitor cell",
                "Fetal erythroid precursor cell",
                "Fetal erythroid stem cell",
                "Erythroid precursor cell of the fetal liver",
                "Erythroid progenitor cell of the fetal liver"
            ],
            "mismatches": [
                "Erythroid stem cell of the fetal liver"
            ],
            "true_referents": [
                "Basophilic erythroblast",
                "Erythroblast (Erb)",
                "Erythroid burst-forming unit (BFU-E)",
                "Erythroid colony-forming unit (CFU-E)",
                "Erythroid precursor",
                "Erythroid precursor cell",
                "Erythroid precursor cell of the bone marrow",
                "Erythroid precursor cell of the fetal liver",
                "Erythroid progenitor",
                "Erythroid progenitor cell",
                "Erythroid progenitor cell of the bone marrow",
                "Erythroid progenitor cell of the fetal liver",
                "Erythroid stem",
                "Erythroid stem cell",
                "Erythroid stem cell of the bone marrow",
                "Fetal erythroblast",
                "Fetal erythrocyte",
                "Fetal erythroid precursor cell",
                "Fetal erythroid progenitor cell",
                "Fetal erythroid stem cell",
                "Orthochromatic erythroblast",
                "Polychromatophilic erythroblast",
                "Proerythroblast",
                "Reticulocyte"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": [
            "Proerythroblast (BFU-E)",
            "Early normoblast (Ery-A)",
            "Intermediate normoblast (Ery-B)",
            "Late normoblast (Ery-C)",
            "Reticulocyte",
            "Metarubricyte",
            "Orthochromatic erythroblast",
            "Polychromatic erythroblast",
            "Basophilic erythroblast",
            "Chromophilic erythroblast",
            "Hemocytoblast",
            "Primitive erythroblast",
            "Definitive erythroblast",
            "Hemangioblast",
            "Hemogenic endothelial cell",
            "Mesodermal hematopoietic cell",
            "Early hematopoietic stem cell",
            "Hematopoietic stem cell",
            "Multipotent hematopoietic progenitor",
            "Common myeloid progenitor",
            "Granulocyte-monocyte progenitor",
            "Colony-forming unit-erythroid (CFU-E)",
            "Colony-forming unit-granulocyte, erythroid, monocyte, and megakaryocyte (CFU-GEMM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Proerythroblast (BFU-E)",
                "Early normoblast (Ery-A)",
                "Intermediate normoblast (Ery-B)",
                "Late normoblast (Ery-C)",
                "Reticulocyte",
                "Metarubricyte",
                "Orthochromatic erythroblast",
                "Polychromatic erythroblast",
                "Basophilic erythroblast",
                "Chromophilic erythroblast",
                "Hemocytoblast",
                "Primitive erythroblast",
                "Definitive erythroblast",
                "Hemangioblast",
                "Hemogenic endothelial cell",
                "Mesodermal hematopoietic cell",
                "Early hematopoietic stem cell",
                "Hematopoietic stem cell",
                "Multipotent hematopoietic progenitor",
                "Common myeloid progenitor",
                "Granulocyte-monocyte progenitor",
                "Colony-forming unit-erythroid (CFU-E)",
                "Colony-forming unit-granulocyte, erythroid, monocyte, and megakaryocyte (CFU-GEMM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basophilic erythroblast",
                "Chromophilic erythroblast",
                "Colony-forming unit-erythroid (CFU-E)",
                "Colony-forming unit-granulocyte, erythroid, monocyte, and megakaryocyte (CFU-GEMM)",
                "Common myeloid progenitor",
                "Definitive erythroblast",
                "Early hematopoietic stem cell",
                "Early normoblast (Ery-A)",
                "Granulocyte-monocyte progenitor",
                "Hemangioblast",
                "Hematopoietic stem cell",
                "Hemocytoblast",
                "Hemogenic endothelial cell",
                "Intermediate normoblast (Ery-B)",
                "Late normoblast (Ery-C)",
                "Mesodermal hematopoietic cell",
                "Metarubricyte",
                "Multipotent hematopoietic progenitor",
                "Orthochromatic erythroblast",
                "Polychromatic erythroblast",
                "Primitive erythroblast",
                "Proerythroblast (BFU-E)",
                "Reticulocyte"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "erythroid cell",
        "domain": "biology",
        "response": {
            "referent": "erythrocyte"
        },
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "erythrocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "referent: erythrocyte"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]