[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Eosinophil",
            "Basophil",
            "Monocyte",
            "Macrophage",
            "Dendritic cell",
            "Myeloid progenitor cell (MPC)",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band cell",
            "Granulocyte",
            "Myeloid dendritic cell",
            "Conventional dendritic cell",
            "Plasmacytoid dendritic cell",
            "Neutrophilic myelocyte",
            "Neutrophilic metamyelocyte",
            "Neutrophilic band cell",
            "Eosinophilic myelocyte",
            "Eosinophilic metamyelocyte",
            "Eosinophilic band cell",
            "Basophilic myelocyte",
            "Basophilic metamyelocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Eosinophil",
                "Basophil",
                "Monocyte",
                "Macrophage",
                "Dendritic cell",
                "Myeloid progenitor cell (MPC)",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band cell",
                "Granulocyte",
                "Myeloid dendritic cell",
                "Conventional dendritic cell",
                "Plasmacytoid dendritic cell",
                "Neutrophilic myelocyte",
                "Neutrophilic metamyelocyte",
                "Neutrophilic band cell",
                "Eosinophilic myelocyte",
                "Eosinophilic metamyelocyte",
                "Eosinophilic band cell",
                "Basophilic myelocyte",
                "Basophilic metamyelocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Band cell",
                "Basophil",
                "Basophilic metamyelocyte",
                "Basophilic myelocyte",
                "Conventional dendritic cell",
                "Dendritic cell",
                "Eosinophil",
                "Eosinophilic band cell",
                "Eosinophilic metamyelocyte",
                "Eosinophilic myelocyte",
                "Granulocyte",
                "Macrophage",
                "Metamyelocyte",
                "Monocyte",
                "Myeloblast",
                "Myelocyte",
                "Myeloid dendritic cell",
                "Myeloid progenitor cell (MPC)",
                "Neutrophil (PMN)",
                "Neutrophilic band cell",
                "Neutrophilic metamyelocyte",
                "Neutrophilic myelocyte",
                "Plasmacytoid dendritic cell",
                "Promyelocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Monocyte (CD14+ cell)",
            "Dendritic cell (DC)",
            "Macrophage (M\u03a6)",
            "Mast cell (MC)",
            "Granulocyte (e.g., Neutrophil, Eosinophil, Basophil)",
            "Neutrophil (PMN)",
            "Eosinophil",
            "Basophil",
            "Mast cell (Mastocyte)",
            "Erythrocyte (Red blood cell)",
            "Megakaryocyte",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band cell (Stab cell)",
            "Monoblast",
            "Promonocyte",
            "Osteoclast",
            "Microglia",
            "Kupffer cell",
            "Alveolar macrophage",
            "Tissue macrophage",
            "Langerhans cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Monocyte (CD14+ cell)",
                "Dendritic cell (DC)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Granulocyte (e.g., Neutrophil, Eosinophil, Basophil)",
                "Neutrophil (PMN)",
                "Eosinophil",
                "Basophil",
                "Mast cell (Mastocyte)",
                "Erythrocyte (Red blood cell)",
                "Megakaryocyte",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band cell (Stab cell)",
                "Monoblast",
                "Promonocyte",
                "Osteoclast",
                "Microglia",
                "Kupffer cell",
                "Alveolar macrophage",
                "Tissue macrophage",
                "Langerhans cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Band cell (Stab cell)",
                "Basophil",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Erythrocyte (Red blood cell)",
                "Granulocyte (e.g., Neutrophil, Eosinophil, Basophil)",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Mast cell (Mastocyte)",
                "Megakaryocyte",
                "Metamyelocyte",
                "Microglia",
                "Monoblast",
                "Monocyte (CD14+ cell)",
                "Myeloblast",
                "Myelocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Promonocyte",
                "Promyelocyte",
                "Tissue macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Monocyte",
            "Macrophage",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Mast Cell",
            "Dendritic Cell",
            "Erythroblast",
            "Megakaryocyte",
            "Platelet",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band Cell",
            "Segmented Neutrophil",
            "Osteoclast",
            "Langerhans Cell",
            "Interdigitating Dendritic Cell",
            "Follicular Dendritic Cell",
            "Plasmacytoid Dendritic Cell",
            "Mast Cell Progenitor",
            "Common Myeloid Progenitor (CMP)",
            "Granulocyte-Macrophage Progenitor (GMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Monocyte",
                "Macrophage",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Mast Cell",
                "Dendritic Cell",
                "Erythroblast",
                "Megakaryocyte",
                "Platelet",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band Cell",
                "Segmented Neutrophil",
                "Osteoclast",
                "Langerhans Cell",
                "Interdigitating Dendritic Cell",
                "Follicular Dendritic Cell",
                "Plasmacytoid Dendritic Cell",
                "Mast Cell Progenitor",
                "Common Myeloid Progenitor (CMP)",
                "Granulocyte-Macrophage Progenitor (GMP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Band Cell",
                "Basophil",
                "Common Myeloid Progenitor (CMP)",
                "Dendritic Cell",
                "Eosinophil",
                "Erythroblast",
                "Follicular Dendritic Cell",
                "Granulocyte-Macrophage Progenitor (GMP)",
                "Interdigitating Dendritic Cell",
                "Langerhans Cell",
                "Macrophage",
                "Mast Cell",
                "Mast Cell Progenitor",
                "Megakaryocyte",
                "Metamyelocyte",
                "Monocyte",
                "Myeloblast",
                "Myelocyte",
                "Neutrophil",
                "Osteoclast",
                "Plasmacytoid Dendritic Cell",
                "Platelet",
                "Promyelocyte",
                "Segmented Neutrophil"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Eosinophil (EOS)",
            "Basophil (BAS)",
            "Mast Cell (MC)",
            "Monocyte (MON)",
            "Macrophage (M\u03a6)",
            "Dendritic Cell (DC)",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band Neutrophil",
            "Granulocyte-Macrophage Progenitor (GMP)",
            "Megakaryocyte-Erythrocyte Progenitor (MEP)",
            "Common Myeloid Progenitor (CMP)",
            "Granulocyte Monocyte Progenitor (GMP)",
            "Histiocyte",
            "Langerhans Cell",
            "Interstitial Dendritic Cell",
            "Plasmacytoid Dendritic Cell (pDC)",
            "Conventional Dendritic Cell (cDC)",
            "Osteoclast",
            "Alveolar Macrophage",
            "Microglia"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Eosinophil (EOS)",
                "Basophil (BAS)",
                "Mast Cell (MC)",
                "Monocyte (MON)",
                "Macrophage (M\u03a6)",
                "Dendritic Cell (DC)",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band Neutrophil",
                "Granulocyte-Macrophage Progenitor (GMP)",
                "Megakaryocyte-Erythrocyte Progenitor (MEP)",
                "Common Myeloid Progenitor (CMP)",
                "Granulocyte Monocyte Progenitor (GMP)",
                "Histiocyte",
                "Langerhans Cell",
                "Interstitial Dendritic Cell",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Conventional Dendritic Cell (cDC)",
                "Osteoclast",
                "Alveolar Macrophage",
                "Microglia"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage",
                "Band Neutrophil",
                "Basophil (BAS)",
                "Common Myeloid Progenitor (CMP)",
                "Conventional Dendritic Cell (cDC)",
                "Dendritic Cell (DC)",
                "Eosinophil (EOS)",
                "Granulocyte Monocyte Progenitor (GMP)",
                "Granulocyte-Macrophage Progenitor (GMP)",
                "Histiocyte",
                "Interstitial Dendritic Cell",
                "Langerhans Cell",
                "Macrophage (M\u03a6)",
                "Mast Cell (MC)",
                "Megakaryocyte-Erythrocyte Progenitor (MEP)",
                "Metamyelocyte",
                "Microglia",
                "Monocyte (MON)",
                "Myeloblast",
                "Myelocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Promyelocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Monocyte",
            "Macrophage",
            "Dendritic Cell",
            "Mast Cell",
            "Megakaryocyte",
            "Erythrocyte",
            "Myeloid-Derived Suppressor Cell (MDSC)",
            "Granulocyte",
            "Promyelocyte",
            "Myeloblast",
            "Band Cell",
            "Reticulocyte",
            "Platelet",
            "Langerhans Cell",
            "Kupffer Cell",
            "Osteoclast",
            "Alveolar Macrophage",
            "Microglia",
            "Histiocyte",
            "Sinusoidal Endothelial Cell",
            "Polymorphonuclear Leukocyte (PMN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Monocyte",
                "Macrophage",
                "Dendritic Cell",
                "Mast Cell",
                "Megakaryocyte",
                "Erythrocyte",
                "Myeloid-Derived Suppressor Cell (MDSC)",
                "Granulocyte",
                "Promyelocyte",
                "Myeloblast",
                "Band Cell",
                "Reticulocyte",
                "Platelet",
                "Langerhans Cell",
                "Kupffer Cell",
                "Osteoclast",
                "Alveolar Macrophage",
                "Microglia",
                "Histiocyte",
                "Sinusoidal Endothelial Cell",
                "Polymorphonuclear Leukocyte (PMN)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage",
                "Band Cell",
                "Basophil",
                "Dendritic Cell",
                "Eosinophil",
                "Erythrocyte",
                "Granulocyte",
                "Histiocyte",
                "Kupffer Cell",
                "Langerhans Cell",
                "Macrophage",
                "Mast Cell",
                "Megakaryocyte",
                "Microglia",
                "Monocyte",
                "Myeloblast",
                "Myeloid-Derived Suppressor Cell (MDSC)",
                "Neutrophil",
                "Osteoclast",
                "Platelet",
                "Polymorphonuclear Leukocyte (PMN)",
                "Promyelocyte",
                "Reticulocyte",
                "Sinusoidal Endothelial Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Monocyte (MON)",
            "Macrophage (M\u03a6)",
            "Neutrophil (NEUT)",
            "Eosinophil (EOS)",
            "Basophil (BASO)",
            "Dendritic cell (DC)",
            "Myeloid-derived suppressor cell (MDSC)",
            "Granulocyte (GRA)",
            "Megakaryocyte (MK)",
            "Erythrocyte (RBC)",
            "Platelet (PLT)",
            "Bone marrow stromal cell (BMSC)",
            "Myeloid progenitor cell (CMP)",
            "Common myeloid progenitor (CMP)",
            "Immature dendritic cell (IDC)",
            "Tissue-resident macrophage (TRM)",
            "Alveolar macrophage (AM)",
            "Kupffer cell (KC)",
            "Microglia (MG)",
            "Osteoclast (OC)",
            "Mast cell (MC)",
            "Langerhans cell (LC)",
            "Fetal liver macrophage (FLM)",
            "Tumor-associated macrophage (TAM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Monocyte (MON)",
                "Macrophage (M\u03a6)",
                "Neutrophil (NEUT)",
                "Eosinophil (EOS)",
                "Basophil (BASO)",
                "Dendritic cell (DC)",
                "Myeloid-derived suppressor cell (MDSC)",
                "Granulocyte (GRA)",
                "Megakaryocyte (MK)",
                "Erythrocyte (RBC)",
                "Platelet (PLT)",
                "Bone marrow stromal cell (BMSC)",
                "Myeloid progenitor cell (CMP)",
                "Common myeloid progenitor (CMP)",
                "Immature dendritic cell (IDC)",
                "Tissue-resident macrophage (TRM)",
                "Alveolar macrophage (AM)",
                "Kupffer cell (KC)",
                "Microglia (MG)",
                "Osteoclast (OC)",
                "Mast cell (MC)",
                "Langerhans cell (LC)",
                "Fetal liver macrophage (FLM)",
                "Tumor-associated macrophage (TAM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage (AM)",
                "Basophil (BASO)",
                "Bone marrow stromal cell (BMSC)",
                "Common myeloid progenitor (CMP)",
                "Dendritic cell (DC)",
                "Eosinophil (EOS)",
                "Erythrocyte (RBC)",
                "Fetal liver macrophage (FLM)",
                "Granulocyte (GRA)",
                "Immature dendritic cell (IDC)",
                "Kupffer cell (KC)",
                "Langerhans cell (LC)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Megakaryocyte (MK)",
                "Microglia (MG)",
                "Monocyte (MON)",
                "Myeloid progenitor cell (CMP)",
                "Myeloid-derived suppressor cell (MDSC)",
                "Neutrophil (NEUT)",
                "Osteoclast (OC)",
                "Platelet (PLT)",
                "Tissue-resident macrophage (TRM)",
                "Tumor-associated macrophage (TAM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophils (NEU)",
            "Eosinophils (EOS)",
            "Basophils (BASO)",
            "Monocytes (MO)",
            "Mast Cells (MC)",
            "Dendritic Cells (DC)",
            "Macrophages (M\u03a6)",
            "Megakaryocytes (MK)",
            "Erythroblasts (EB)",
            "Myeloblasts (MB)",
            "Promyelocytes (PM)",
            "Myelocytes (MYC)",
            "Metamyelocytes (MM)",
            "Band Cells (BC)",
            "Platelets (PLT)",
            "Red Blood Cells (RBC)",
            "Microglia (MG)",
            "Osteoclasts (OC)",
            "Kupffer Cells (KC)",
            "Langerhans Cells (LC)",
            "Alveolar Macrophages (AM)",
            "Interstitial Macrophages (IM)",
            "Perivascular Macrophages (PVM)",
            "Sinusoidal Macrophages (SM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophils (NEU)",
                "Eosinophils (EOS)",
                "Basophils (BASO)",
                "Monocytes (MO)",
                "Mast Cells (MC)",
                "Dendritic Cells (DC)",
                "Macrophages (M\u03a6)",
                "Megakaryocytes (MK)",
                "Erythroblasts (EB)",
                "Myeloblasts (MB)",
                "Promyelocytes (PM)",
                "Myelocytes (MYC)",
                "Metamyelocytes (MM)",
                "Band Cells (BC)",
                "Platelets (PLT)",
                "Red Blood Cells (RBC)",
                "Microglia (MG)",
                "Osteoclasts (OC)",
                "Kupffer Cells (KC)",
                "Langerhans Cells (LC)",
                "Alveolar Macrophages (AM)",
                "Interstitial Macrophages (IM)",
                "Perivascular Macrophages (PVM)",
                "Sinusoidal Macrophages (SM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophages (AM)",
                "Band Cells (BC)",
                "Basophils (BASO)",
                "Dendritic Cells (DC)",
                "Eosinophils (EOS)",
                "Erythroblasts (EB)",
                "Interstitial Macrophages (IM)",
                "Kupffer Cells (KC)",
                "Langerhans Cells (LC)",
                "Macrophages (M\u03a6)",
                "Mast Cells (MC)",
                "Megakaryocytes (MK)",
                "Metamyelocytes (MM)",
                "Microglia (MG)",
                "Monocytes (MO)",
                "Myeloblasts (MB)",
                "Myelocytes (MYC)",
                "Neutrophils (NEU)",
                "Osteoclasts (OC)",
                "Perivascular Macrophages (PVM)",
                "Platelets (PLT)",
                "Promyelocytes (PM)",
                "Red Blood Cells (RBC)",
                "Sinusoidal Macrophages (SM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Monocyte",
            "Macrophage",
            "Dendritic cell",
            "Mast cell",
            "Granulocyte",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band cell",
            "Polymorphonuclear leukocyte",
            "Plasmacytoid dendritic cell",
            "Langerhans cell",
            "Microglia",
            "Osteoclast",
            "Kupffer cell",
            "Alveolar macrophage",
            "Peritoneal macrophage",
            "Histiocyte",
            "Splenic macrophage",
            "Red pulp macrophage"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Monocyte",
                "Macrophage",
                "Dendritic cell",
                "Mast cell",
                "Granulocyte",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band cell",
                "Polymorphonuclear leukocyte",
                "Plasmacytoid dendritic cell",
                "Langerhans cell",
                "Microglia",
                "Osteoclast",
                "Kupffer cell",
                "Alveolar macrophage",
                "Peritoneal macrophage",
                "Histiocyte",
                "Splenic macrophage",
                "Red pulp macrophage"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Band cell",
                "Basophil",
                "Dendritic cell",
                "Eosinophil",
                "Granulocyte",
                "Histiocyte",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage",
                "Mast cell",
                "Metamyelocyte",
                "Microglia",
                "Monocyte",
                "Myeloblast",
                "Myelocyte",
                "Neutrophil",
                "Osteoclast",
                "Peritoneal macrophage",
                "Plasmacytoid dendritic cell",
                "Polymorphonuclear leukocyte",
                "Promyelocyte",
                "Red pulp macrophage",
                "Splenic macrophage"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (NEU)",
            "Eosinophil (EOS)",
            "Basophil (BASO)",
            "Monocyte (MONO)",
            "Macrophage",
            "Dendritic Cell (DC)",
            "Mast Cell",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band Neutrophil",
            "Plasma Cell",
            "Megakaryocyte",
            "Erythroblast",
            "Granulocyte",
            "Myelomonocyte",
            "Myeloid-Derived Suppressor Cell (MDSC)",
            "Langerhans Cell",
            "Microglia",
            "Osteoclast",
            "Promonocyte",
            "Plasmatocyte",
            "Basophilic Granulocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (NEU)",
                "Eosinophil (EOS)",
                "Basophil (BASO)",
                "Monocyte (MONO)",
                "Macrophage",
                "Dendritic Cell (DC)",
                "Mast Cell",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band Neutrophil",
                "Plasma Cell",
                "Megakaryocyte",
                "Erythroblast",
                "Granulocyte",
                "Myelomonocyte",
                "Myeloid-Derived Suppressor Cell (MDSC)",
                "Langerhans Cell",
                "Microglia",
                "Osteoclast",
                "Promonocyte",
                "Plasmatocyte",
                "Basophilic Granulocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Band Neutrophil",
                "Basophil (BASO)",
                "Basophilic Granulocyte",
                "Dendritic Cell (DC)",
                "Eosinophil (EOS)",
                "Erythroblast",
                "Granulocyte",
                "Langerhans Cell",
                "Macrophage",
                "Mast Cell",
                "Megakaryocyte",
                "Metamyelocyte",
                "Microglia",
                "Monocyte (MONO)",
                "Myeloblast",
                "Myelocyte",
                "Myeloid-Derived Suppressor Cell (MDSC)",
                "Myelomonocyte",
                "Neutrophil (NEU)",
                "Osteoclast",
                "Plasma Cell",
                "Plasmatocyte",
                "Promonocyte",
                "Promyelocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Monocyte",
            "Macrophage",
            "Dendritic cell (DC)",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Megakaryocyte",
            "Erythrocyte",
            "Myeloid-derived suppressor cell (MDSC)",
            "Osteoclast",
            "Kupffer cell",
            "Alveolar macrophage",
            "Microglia",
            "Langerhans cell",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band neutrophil",
            "Promonocyte",
            "Monoblast",
            "Erythroblast",
            "Megakaryoblast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Monocyte",
                "Macrophage",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Megakaryocyte",
                "Erythrocyte",
                "Myeloid-derived suppressor cell (MDSC)",
                "Osteoclast",
                "Kupffer cell",
                "Alveolar macrophage",
                "Microglia",
                "Langerhans cell",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band neutrophil",
                "Promonocyte",
                "Monoblast",
                "Erythroblast",
                "Megakaryoblast"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Band neutrophil",
                "Basophil",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Erythroblast",
                "Erythrocyte",
                "Kupffer cell",
                "Langerhans cell",
                "Macrophage",
                "Mast cell",
                "Megakaryoblast",
                "Megakaryocyte",
                "Metamyelocyte",
                "Microglia",
                "Monoblast",
                "Monocyte",
                "Myeloblast",
                "Myelocyte",
                "Myeloid-derived suppressor cell (MDSC)",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Promonocyte",
                "Promyelocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Eosinophil",
            "Basophil",
            "Monocyte",
            "Macrophage (M\u03a6)",
            "Dendritic cell (DC)",
            "Langerhans cell (LC)",
            "Microglia",
            "Osteoclast",
            "Mast cell",
            "Megakaryocyte",
            "Erythrocyte",
            "Myeloblast",
            "Monoblast",
            "Promonocyte",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band cell",
            "Kupffer cell",
            "Alveolar macrophage",
            "Histiocyte",
            "Hematopoietic stem cell (HSC)",
            "Common myeloid progenitor (CMP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Eosinophil",
                "Basophil",
                "Monocyte",
                "Macrophage (M\u03a6)",
                "Dendritic cell (DC)",
                "Langerhans cell (LC)",
                "Microglia",
                "Osteoclast",
                "Mast cell",
                "Megakaryocyte",
                "Erythrocyte",
                "Myeloblast",
                "Monoblast",
                "Promonocyte",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band cell",
                "Kupffer cell",
                "Alveolar macrophage",
                "Histiocyte",
                "Hematopoietic stem cell (HSC)",
                "Common myeloid progenitor (CMP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar macrophage",
                "Band cell",
                "Basophil",
                "Common myeloid progenitor (CMP)",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Erythrocyte",
                "Hematopoietic stem cell (HSC)",
                "Histiocyte",
                "Kupffer cell",
                "Langerhans cell (LC)",
                "Macrophage (M\u03a6)",
                "Mast cell",
                "Megakaryocyte",
                "Metamyelocyte",
                "Microglia",
                "Monoblast",
                "Monocyte",
                "Myeloblast",
                "Myelocyte",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Promonocyte",
                "Promyelocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (PMN)",
            "Eosinophil",
            "Basophil",
            "Monocyte",
            "Mast Cell",
            "Dendritic Cell",
            "Macrophage",
            "Osteoclast",
            "Microglia",
            "Langerhans Cell",
            "Megakaryocyte",
            "Erythrocyte (RBC)",
            "Platelets",
            "Myeloblast",
            "Promyelocyte",
            "Myelocyte",
            "Metamyelocyte",
            "Band Cell",
            "Monoblast",
            "Promonocyte",
            "Monocyte Precursor",
            "Myeloid-derived Suppressor Cell (MDSC)",
            "Myeloid Progenitor Cell",
            "Hematopoietic Stem Cell (HSC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (PMN)",
                "Eosinophil",
                "Basophil",
                "Monocyte",
                "Mast Cell",
                "Dendritic Cell",
                "Macrophage",
                "Osteoclast",
                "Microglia",
                "Langerhans Cell",
                "Megakaryocyte",
                "Erythrocyte (RBC)",
                "Platelets",
                "Myeloblast",
                "Promyelocyte",
                "Myelocyte",
                "Metamyelocyte",
                "Band Cell",
                "Monoblast",
                "Promonocyte",
                "Monocyte Precursor",
                "Myeloid-derived Suppressor Cell (MDSC)",
                "Myeloid Progenitor Cell",
                "Hematopoietic Stem Cell (HSC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Band Cell",
                "Basophil",
                "Dendritic Cell",
                "Eosinophil",
                "Erythrocyte (RBC)",
                "Hematopoietic Stem Cell (HSC)",
                "Langerhans Cell",
                "Macrophage",
                "Mast Cell",
                "Megakaryocyte",
                "Metamyelocyte",
                "Microglia",
                "Monoblast",
                "Monocyte",
                "Monocyte Precursor",
                "Myeloblast",
                "Myelocyte",
                "Myeloid Progenitor Cell",
                "Myeloid-derived Suppressor Cell (MDSC)",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Platelets",
                "Promonocyte",
                "Promyelocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Neutrophil (NEUT)",
            "Eosinophil (EOS)",
            "Basophil (BASO)",
            "Monocyte (MONO)",
            "Macrophage (M\u03a6)",
            "Dendritic Cell (DC)",
            "Mast Cell (MC)",
            "Osteoclast (OC)",
            "Microglia (MG)",
            "Kupffer Cell (KC)",
            "Alveolar Macrophage (AM)",
            "Histiocyte (HIST)",
            "Langerhans Cell (LC)",
            "Myeloid-Derived Suppressor Cell (MDSC)",
            "Tumor-Associated Macrophage (TAM)",
            "Inflammatory Monocyte (iMONO)",
            "Resident Macrophage (rM\u03a6)",
            "Interstitial Dendritic Cell (iDC)",
            "Plasmacytoid Dendritic Cell (pDC)",
            "Myeloid Progenitor Cell (MPC)",
            "Common Myeloid Progenitor (CMP)",
            "Granulocyte-Monocyte Progenitor (GMP)",
            "Megakaryocyte-Erythroid Progenitor (MEP)",
            "Myeloid Stem Cell (MSC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neutrophil (NEUT)",
                "Eosinophil (EOS)",
                "Basophil (BASO)",
                "Monocyte (MONO)",
                "Macrophage (M\u03a6)",
                "Dendritic Cell (DC)",
                "Mast Cell (MC)",
                "Osteoclast (OC)",
                "Microglia (MG)",
                "Kupffer Cell (KC)",
                "Alveolar Macrophage (AM)",
                "Histiocyte (HIST)",
                "Langerhans Cell (LC)",
                "Myeloid-Derived Suppressor Cell (MDSC)",
                "Tumor-Associated Macrophage (TAM)",
                "Inflammatory Monocyte (iMONO)",
                "Resident Macrophage (rM\u03a6)",
                "Interstitial Dendritic Cell (iDC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Myeloid Progenitor Cell (MPC)",
                "Common Myeloid Progenitor (CMP)",
                "Granulocyte-Monocyte Progenitor (GMP)",
                "Megakaryocyte-Erythroid Progenitor (MEP)",
                "Myeloid Stem Cell (MSC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alveolar Macrophage (AM)",
                "Basophil (BASO)",
                "Common Myeloid Progenitor (CMP)",
                "Dendritic Cell (DC)",
                "Eosinophil (EOS)",
                "Granulocyte-Monocyte Progenitor (GMP)",
                "Histiocyte (HIST)",
                "Inflammatory Monocyte (iMONO)",
                "Interstitial Dendritic Cell (iDC)",
                "Kupffer Cell (KC)",
                "Langerhans Cell (LC)",
                "Macrophage (M\u03a6)",
                "Mast Cell (MC)",
                "Megakaryocyte-Erythroid Progenitor (MEP)",
                "Microglia (MG)",
                "Monocyte (MONO)",
                "Myeloid Progenitor Cell (MPC)",
                "Myeloid Stem Cell (MSC)",
                "Myeloid-Derived Suppressor Cell (MDSC)",
                "Neutrophil (NEUT)",
                "Osteoclast (OC)",
                "Plasmacytoid Dendritic Cell (pDC)",
                "Resident Macrophage (rM\u03a6)",
                "Tumor-Associated Macrophage (TAM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Dendritic cells (DCs)",
            "Monocytes",
            "Macrophages",
            "Granulocytes",
            "Neutrophils",
            "Eosinophils",
            "Basophils",
            "Mast cells",
            "Myeloid-derived suppressor cells (MDSCs)",
            "Myeloid cells in the bone marrow",
            "Myeloid progenitor cells",
            "Myeloblasts",
            "Promyelocytes",
            "Myelocytes",
            "Metamyelocytes",
            "Band cells",
            "Segmented neutrophils",
            "Eosinophilic granulocytes",
            "Basophilic granulocytes",
            "Myeloid leukemia cells",
            "Acute myeloid leukemia (AML) cells",
            "Chronic myeloid leukemia (CML) cells",
            "Myeloid-derived growth factors",
            "Myeloid-specific transcription factors",
            "Myeloid cell-specific surface markers"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Dendritic cells (DCs)",
                "Monocytes",
                "Macrophages",
                "Granulocytes",
                "Neutrophils",
                "Eosinophils",
                "Basophils",
                "Mast cells",
                "Myeloid-derived suppressor cells (MDSCs)",
                "Myeloid cells in the bone marrow",
                "Myeloid progenitor cells",
                "Myeloblasts",
                "Promyelocytes",
                "Myelocytes",
                "Metamyelocytes",
                "Band cells",
                "Segmented neutrophils",
                "Eosinophilic granulocytes",
                "Basophilic granulocytes",
                "Myeloid leukemia cells",
                "Acute myeloid leukemia (AML) cells",
                "Chronic myeloid leukemia (CML) cells",
                "Myeloid-derived growth factors",
                "Myeloid-specific transcription factors"
            ],
            "mismatches": [
                "Myeloid cell-specific surface markers"
            ],
            "true_referents": [
                "Acute myeloid leukemia (AML) cells",
                "Band cells",
                "Basophilic granulocytes",
                "Basophils",
                "Chronic myeloid leukemia (CML) cells",
                "Dendritic cells (DCs)",
                "Eosinophilic granulocytes",
                "Eosinophils",
                "Granulocytes",
                "Macrophages",
                "Mast cells",
                "Metamyelocytes",
                "Monocytes",
                "Myeloblasts",
                "Myelocytes",
                "Myeloid cells in the bone marrow",
                "Myeloid leukemia cells",
                "Myeloid progenitor cells",
                "Myeloid-derived growth factors",
                "Myeloid-derived suppressor cells (MDSCs)",
                "Myeloid-specific transcription factors",
                "Neutrophils",
                "Promyelocytes",
                "Segmented neutrophils"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": [
            "Monocyte (CD14+)",
            "Macrophage (M\u03a6)",
            "Neutrophil (PMN)",
            "Eosinophil",
            "Basophil",
            "Dendritic cell (DC)",
            "Myeloid-derived suppressor cell (MDSC)",
            "Osteoclast",
            "Tumor-associated macrophage (TAM)",
            "Bone marrow-derived macrophage (BMDM)",
            "Kupffer cell",
            "Langerhans cell",
            "Microglia",
            " Foam cell",
            "M2 macrophage",
            "Classically activated macrophage (CAM)",
            "Alternatively activated macrophage (AAM)",
            "Macrophage-1 (M\u03c61)",
            "Macrophage-2 (M\u03c62)",
            "Interferon-\u03b3-activated macrophage (IFN-\u03b3-AM)",
            "Il-4-activated macrophage (IL-4-AM)",
            "Immunosuppressive macrophage",
            "Pro-inflammatory macrophage",
            "Tissue-resident macrophage"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Monocyte (CD14+)",
                "Macrophage (M\u03a6)",
                "Neutrophil (PMN)",
                "Eosinophil",
                "Basophil",
                "Dendritic cell (DC)",
                "Myeloid-derived suppressor cell (MDSC)",
                "Osteoclast",
                "Tumor-associated macrophage (TAM)",
                "Bone marrow-derived macrophage (BMDM)",
                "Kupffer cell",
                "Langerhans cell",
                "Microglia",
                " Foam cell",
                "M2 macrophage",
                "Classically activated macrophage (CAM)",
                "Alternatively activated macrophage (AAM)",
                "Macrophage-1 (M\u03c61)",
                "Macrophage-2 (M\u03c62)",
                "Interferon-\u03b3-activated macrophage (IFN-\u03b3-AM)",
                "Il-4-activated macrophage (IL-4-AM)",
                "Immunosuppressive macrophage",
                "Pro-inflammatory macrophage",
                "Tissue-resident macrophage"
            ],
            "mismatches": [],
            "true_referents": [
                " Foam cell",
                "Alternatively activated macrophage (AAM)",
                "Basophil",
                "Bone marrow-derived macrophage (BMDM)",
                "Classically activated macrophage (CAM)",
                "Dendritic cell (DC)",
                "Eosinophil",
                "Il-4-activated macrophage (IL-4-AM)",
                "Immunosuppressive macrophage",
                "Interferon-\u03b3-activated macrophage (IFN-\u03b3-AM)",
                "Kupffer cell",
                "Langerhans cell",
                "M2 macrophage",
                "Macrophage (M\u03a6)",
                "Macrophage-1 (M\u03c61)",
                "Macrophage-2 (M\u03c62)",
                "Microglia",
                "Monocyte (CD14+)",
                "Myeloid-derived suppressor cell (MDSC)",
                "Neutrophil (PMN)",
                "Osteoclast",
                "Pro-inflammatory macrophage",
                "Tissue-resident macrophage",
                "Tumor-associated macrophage (TAM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "myeloid cell",
        "domain": "biology",
        "response": "[\n    {\n        \"Canonical name\": \"Basophil\" (BASO)\n    },\n    {\n        \"Canonical name\": \"Eosinophil\" (EOS)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Monocyte\" (MONO)\n    },\n    {\n        \"Canonical name\": \"Lymphocyte\" (LYMPH)\n    },\n    {\n        \"Canonical name\": \"Myeloblast\" (MYELO)\n    },\n    {\n        \"Canonical name\": \"Promyelocyte\" (PROMO)\n    },\n    {\n        \"Canonical name\": \"Myelocyte\" (MYELO)\n    },\n    {\n        \"Canonical name\": \"Metamyelocyte\" (METAMYELO)\n    },\n    {\n        \"Canonical name\": \"Band cell\" (BAND)\n    },\n    {\n        \"Canonical name\": \"Eosinophil\" (EOS)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    },\n    {\n        \"Canonical name\": \"Neutrophil\" (NEU)\n    }\n]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]