[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B cell (B)",
            "Plasma cell",
            "Memory B cell",
            "Pre-B cell",
            "Immature B cell",
            "Follicular B cell",
            "Marginal zone B cell",
            "B-1 cell",
            "B-2 cell",
            "Germinal center B cell",
            "Transitional B cell",
            "Splenic B cell",
            "Tonsillar B cell",
            "Mucosal B cell",
            "Bronchus-associated lymphoid tissue (BALT) B cell",
            "Gut-associated lymphoid tissue (GALT) B cell",
            "Peripheral B cell",
            "Central memory B cell",
            "Effector memory B cell",
            "Antigen-experienced B cell",
            "Na\u00efve B cell",
            "Isotype-switched B cell",
            "Unswitched B cell",
            "Plasmablast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B cell (B)",
                "Plasma cell",
                "Memory B cell",
                "Pre-B cell",
                "Immature B cell",
                "Follicular B cell",
                "Marginal zone B cell",
                "B-1 cell",
                "B-2 cell",
                "Germinal center B cell",
                "Transitional B cell",
                "Splenic B cell",
                "Tonsillar B cell",
                "Mucosal B cell",
                "Bronchus-associated lymphoid tissue (BALT) B cell",
                "Gut-associated lymphoid tissue (GALT) B cell",
                "Peripheral B cell",
                "Central memory B cell",
                "Effector memory B cell",
                "Antigen-experienced B cell",
                "Na\u00efve B cell",
                "Isotype-switched B cell",
                "Unswitched B cell",
                "Plasmablast"
            ],
            "mismatches": [],
            "true_referents": [
                "Antigen-experienced B cell",
                "B cell (B)",
                "B-1 cell",
                "B-2 cell",
                "Bronchus-associated lymphoid tissue (BALT) B cell",
                "Central memory B cell",
                "Effector memory B cell",
                "Follicular B cell",
                "Germinal center B cell",
                "Gut-associated lymphoid tissue (GALT) B cell",
                "Immature B cell",
                "Isotype-switched B cell",
                "Marginal zone B cell",
                "Memory B cell",
                "Mucosal B cell",
                "Na\u00efve B cell",
                "Peripheral B cell",
                "Plasma cell",
                "Plasmablast",
                "Pre-B cell",
                "Splenic B cell",
                "Tonsillar B cell",
                "Transitional B cell",
                "Unswitched B cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B cell (B lymphocyte)",
            "Plasma cell",
            "Memory B cell",
            "Activated B cell",
            "Naive B cell",
            "Marginal zone B cell",
            "Follicular B cell",
            "Germinal center B cell",
            "B-1 cell",
            "B-2 cell",
            "B10 cell",
            "Breg cell (B regulatory cell)",
            "CD5+ B cell",
            "CD27+ B cell",
            "CD19+ B cell",
            "CD20+ B cell",
            "CD38+ B cell",
            "CD138+ B cell",
            "IgM+ B cell",
            "IgD+ B cell",
            "IgG+ B cell",
            "IgA+ B cell",
            "IgE+ B cell",
            "IgM+ IgD+ B cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B cell (B lymphocyte)",
                "Plasma cell",
                "Memory B cell",
                "Activated B cell",
                "Naive B cell",
                "Marginal zone B cell",
                "Follicular B cell",
                "Germinal center B cell",
                "B-1 cell",
                "B-2 cell",
                "B10 cell",
                "Breg cell (B regulatory cell)",
                "CD5+ B cell",
                "CD27+ B cell",
                "CD19+ B cell",
                "CD20+ B cell",
                "CD38+ B cell",
                "CD138+ B cell",
                "IgM+ B cell",
                "IgD+ B cell",
                "IgG+ B cell",
                "IgA+ B cell",
                "IgE+ B cell",
                "IgM+ IgD+ B cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B cell",
                "B cell (B lymphocyte)",
                "B-1 cell",
                "B-2 cell",
                "B10 cell",
                "Breg cell (B regulatory cell)",
                "CD138+ B cell",
                "CD19+ B cell",
                "CD20+ B cell",
                "CD27+ B cell",
                "CD38+ B cell",
                "CD5+ B cell",
                "Follicular B cell",
                "Germinal center B cell",
                "IgA+ B cell",
                "IgD+ B cell",
                "IgE+ B cell",
                "IgG+ B cell",
                "IgM+ B cell",
                "IgM+ IgD+ B cell",
                "Marginal zone B cell",
                "Memory B cell",
                "Naive B cell",
                "Plasma cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B cell (B lymphocyte)",
            "Plasma cell",
            "Memory B cell",
            "Follicular B cell",
            "Marginal zone B cell",
            "B-1a cell",
            "B-1b cell",
            "Plasmacytoid dendritic cell",
            "Naive B cell",
            "Germinal center B cell",
            "Activated B cell",
            "Memory B-1 cell",
            "Memory B-2 cell",
            "B regulatory cell",
            "Memory plasma cell",
            "T follicular helper cell (Tfh cell)",
            "T follicular regulatory cell (Tfr cell)",
            "CD5+ B cell",
            "CD27+ memory B cell",
            "CD27- memory B cell",
            "CD138+ plasma cell",
            "CD38+ plasma cell",
            "CD38- plasma cell",
            "Immature B cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B cell (B lymphocyte)",
                "Plasma cell",
                "Memory B cell",
                "Follicular B cell",
                "Marginal zone B cell",
                "B-1a cell",
                "B-1b cell",
                "Plasmacytoid dendritic cell",
                "Naive B cell",
                "Germinal center B cell",
                "Activated B cell",
                "Memory B-1 cell",
                "Memory B-2 cell",
                "B regulatory cell",
                "Memory plasma cell",
                "T follicular helper cell (Tfh cell)",
                "T follicular regulatory cell (Tfr cell)",
                "CD5+ B cell",
                "CD27+ memory B cell",
                "CD27- memory B cell",
                "CD138+ plasma cell",
                "CD38+ plasma cell",
                "CD38- plasma cell",
                "Immature B cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B cell",
                "B cell (B lymphocyte)",
                "B regulatory cell",
                "B-1a cell",
                "B-1b cell",
                "CD138+ plasma cell",
                "CD27+ memory B cell",
                "CD27- memory B cell",
                "CD38+ plasma cell",
                "CD38- plasma cell",
                "CD5+ B cell",
                "Follicular B cell",
                "Germinal center B cell",
                "Immature B cell",
                "Marginal zone B cell",
                "Memory B cell",
                "Memory B-1 cell",
                "Memory B-2 cell",
                "Memory plasma cell",
                "Naive B cell",
                "Plasma cell",
                "Plasmacytoid dendritic cell",
                "T follicular helper cell (Tfh cell)",
                "T follicular regulatory cell (Tfr cell)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B lymphocyte (B cell)",
            "Plasma cell",
            "Memory B cell",
            "Marginal zone B cell",
            "B-1 B cell",
            "Follicular dendritic cell (FDC) - antigen presentation to B cells",
            "Pro-B cell",
            "Pre-B cell",
            "Immature B cell",
            "Transitional B cell",
            "Mature naive B cell",
            "Activated B cell",
            "Plasma blasts",
            "IgM-secreting B cells",
            "IgG-secreting B cells",
            "IgA-secreting B cells",
            "IgE-secreting B cells",
            "B cell chronic lymphocytic leukemia (B-CLL) cell",
            "Multiple myeloma cell",
            "Waldenstr\u00f6m macroglobulinemia cell",
            "B cell lymphoma cell (various subtypes)",
            "Human B cell line (e.g., Raji, Daudi)",
            "Mouse B cell line (e.g., Sp2/0, NS0)",
            "Hybridoma cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B lymphocyte (B cell)",
                "Plasma cell",
                "Memory B cell",
                "Marginal zone B cell",
                "B-1 B cell",
                "Follicular dendritic cell (FDC) - antigen presentation to B cells",
                "Pro-B cell",
                "Pre-B cell",
                "Immature B cell",
                "Transitional B cell",
                "Mature naive B cell",
                "Activated B cell",
                "Plasma blasts",
                "IgM-secreting B cells",
                "IgG-secreting B cells",
                "IgA-secreting B cells",
                "IgE-secreting B cells",
                "B cell chronic lymphocytic leukemia (B-CLL) cell",
                "Multiple myeloma cell",
                "Waldenstr\u00f6m macroglobulinemia cell",
                "B cell lymphoma cell (various subtypes)",
                "Human B cell line (e.g., Raji, Daudi)",
                "Mouse B cell line (e.g., Sp2/0, NS0)",
                "Hybridoma cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B cell",
                "B cell chronic lymphocytic leukemia (B-CLL) cell",
                "B cell lymphoma cell (various subtypes)",
                "B lymphocyte (B cell)",
                "B-1 B cell",
                "Follicular dendritic cell (FDC) - antigen presentation to B cells",
                "Human B cell line (e.g., Raji, Daudi)",
                "Hybridoma cell",
                "IgA-secreting B cells",
                "IgE-secreting B cells",
                "IgG-secreting B cells",
                "IgM-secreting B cells",
                "Immature B cell",
                "Marginal zone B cell",
                "Mature naive B cell",
                "Memory B cell",
                "Mouse B cell line (e.g., Sp2/0, NS0)",
                "Multiple myeloma cell",
                "Plasma blasts",
                "Plasma cell",
                "Pre-B cell",
                "Pro-B cell",
                "Transitional B cell",
                "Waldenstr\u00f6m macroglobulinemia cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B Cell (BC)",
            "Plasma Cell (PC)",
            "Memory B Cell (MBC)",
            "Naive B Cell (NBC)",
            "Activated B Cell (ABC)",
            "Follicular B Cell (FOB)",
            "Marginal Zone B Cell (MZB)",
            "Regulatory B Cell (Breg)",
            "B-1 Cell (B1)",
            "B-2 Cell (B2)",
            "Germinal Center B Cell (GCB)",
            "Transitional B Cell (TBC)",
            "B Cell Subset 1 (BCS1)",
            "B Cell Subset 2 (BCS2)",
            "B Cell Subset 3 (BCS3)",
            "B Cell Subset 4 (BCS4)",
            "B Cell Subset 5 (BCS5)",
            "B Cell Subset 6 (BCS6)",
            "B Cell Subset 7 (BCS7)",
            "B Cell Subset 8 (BCS8)",
            "B Cell Subset 9 (BCS9)",
            "B Cell Subset 10 (BCS10)",
            "B Cell Subset 11 (BCS11)",
            "B Cell Subset 12 (BCS12)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B Cell (BC)",
                "Plasma Cell (PC)",
                "Memory B Cell (MBC)",
                "Naive B Cell (NBC)",
                "Activated B Cell (ABC)",
                "Follicular B Cell (FOB)",
                "Marginal Zone B Cell (MZB)",
                "Regulatory B Cell (Breg)",
                "B-1 Cell (B1)",
                "B-2 Cell (B2)",
                "Germinal Center B Cell (GCB)",
                "Transitional B Cell (TBC)",
                "B Cell Subset 1 (BCS1)",
                "B Cell Subset 2 (BCS2)",
                "B Cell Subset 3 (BCS3)",
                "B Cell Subset 4 (BCS4)",
                "B Cell Subset 5 (BCS5)",
                "B Cell Subset 6 (BCS6)",
                "B Cell Subset 7 (BCS7)",
                "B Cell Subset 8 (BCS8)",
                "B Cell Subset 9 (BCS9)",
                "B Cell Subset 10 (BCS10)",
                "B Cell Subset 11 (BCS11)",
                "B Cell Subset 12 (BCS12)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B Cell (ABC)",
                "B Cell (BC)",
                "B Cell Subset 1 (BCS1)",
                "B Cell Subset 10 (BCS10)",
                "B Cell Subset 11 (BCS11)",
                "B Cell Subset 12 (BCS12)",
                "B Cell Subset 2 (BCS2)",
                "B Cell Subset 3 (BCS3)",
                "B Cell Subset 4 (BCS4)",
                "B Cell Subset 5 (BCS5)",
                "B Cell Subset 6 (BCS6)",
                "B Cell Subset 7 (BCS7)",
                "B Cell Subset 8 (BCS8)",
                "B Cell Subset 9 (BCS9)",
                "B-1 Cell (B1)",
                "B-2 Cell (B2)",
                "Follicular B Cell (FOB)",
                "Germinal Center B Cell (GCB)",
                "Marginal Zone B Cell (MZB)",
                "Memory B Cell (MBC)",
                "Naive B Cell (NBC)",
                "Plasma Cell (PC)",
                "Regulatory B Cell (Breg)",
                "Transitional B Cell (TBC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B Lymphocyte (B cell)",
            "Plasma Cell",
            "Memory B Cell",
            "Follicular B Cell",
            "Marginal Zone B Cell",
            "Activated B Cell",
            "Germinal Center B Cell",
            "Transitional B Cell",
            "Regulatory B Cell",
            "IgM B Cell",
            "IgG B Cell",
            "IgA B Cell",
            "IgE B Cell",
            "CD19+ B Cell",
            "CD20+ B Cell",
            "CD27+ Memory B Cell",
            "CD138+ Plasma Cell",
            "Naive B Cell",
            "Autoantibody-producing B Cell",
            "Vaccine-induced B Cell",
            "T-dependent B Cell",
            "T-independent B Cell",
            "B1 Cell",
            "B2 Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B Lymphocyte (B cell)",
                "Plasma Cell",
                "Memory B Cell",
                "Follicular B Cell",
                "Marginal Zone B Cell",
                "Activated B Cell",
                "Germinal Center B Cell",
                "Transitional B Cell",
                "Regulatory B Cell",
                "IgM B Cell",
                "IgG B Cell",
                "IgA B Cell",
                "IgE B Cell",
                "CD19+ B Cell",
                "CD20+ B Cell",
                "CD27+ Memory B Cell",
                "CD138+ Plasma Cell",
                "Naive B Cell",
                "Autoantibody-producing B Cell",
                "Vaccine-induced B Cell",
                "T-dependent B Cell",
                "T-independent B Cell",
                "B1 Cell",
                "B2 Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B Cell",
                "Autoantibody-producing B Cell",
                "B Lymphocyte (B cell)",
                "B1 Cell",
                "B2 Cell",
                "CD138+ Plasma Cell",
                "CD19+ B Cell",
                "CD20+ B Cell",
                "CD27+ Memory B Cell",
                "Follicular B Cell",
                "Germinal Center B Cell",
                "IgA B Cell",
                "IgE B Cell",
                "IgG B Cell",
                "IgM B Cell",
                "Marginal Zone B Cell",
                "Memory B Cell",
                "Naive B Cell",
                "Plasma Cell",
                "Regulatory B Cell",
                "T-dependent B Cell",
                "T-independent B Cell",
                "Transitional B Cell",
                "Vaccine-induced B Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B Cell (B lymphocyte)",
            "Plasma Cell",
            "Memory B Cell",
            "Follicular B Cell",
            "Marginal Zone B Cell",
            "B1 Cell",
            "B2 Cell",
            "Activated B Cell",
            "Naive B Cell",
            "Regulatory B Cell (Breg)",
            "Transitional B Cell",
            "Germinative Center B Cell",
            "Memory Plasma Cell",
            "Long-lived Plasma Cell",
            "Short-lived Plasma Cell",
            "Mature B Cell",
            "Immature B Cell",
            "Pro-B Cell",
            "Pre-B Cell",
            "Large Pre-BII Cell",
            "Small Pre-BII Cell",
            "Plasmablast",
            "Early Plasmablast",
            "Late Plasmablast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B Cell (B lymphocyte)",
                "Plasma Cell",
                "Memory B Cell",
                "Follicular B Cell",
                "Marginal Zone B Cell",
                "B1 Cell",
                "B2 Cell",
                "Activated B Cell",
                "Naive B Cell",
                "Regulatory B Cell (Breg)",
                "Transitional B Cell",
                "Germinative Center B Cell",
                "Memory Plasma Cell",
                "Long-lived Plasma Cell",
                "Short-lived Plasma Cell",
                "Mature B Cell",
                "Immature B Cell",
                "Pro-B Cell",
                "Pre-B Cell",
                "Large Pre-BII Cell",
                "Small Pre-BII Cell",
                "Plasmablast",
                "Early Plasmablast",
                "Late Plasmablast"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B Cell",
                "B Cell (B lymphocyte)",
                "B1 Cell",
                "B2 Cell",
                "Early Plasmablast",
                "Follicular B Cell",
                "Germinative Center B Cell",
                "Immature B Cell",
                "Large Pre-BII Cell",
                "Late Plasmablast",
                "Long-lived Plasma Cell",
                "Marginal Zone B Cell",
                "Mature B Cell",
                "Memory B Cell",
                "Memory Plasma Cell",
                "Naive B Cell",
                "Plasma Cell",
                "Plasmablast",
                "Pre-B Cell",
                "Pro-B Cell",
                "Regulatory B Cell (Breg)",
                "Short-lived Plasma Cell",
                "Small Pre-BII Cell",
                "Transitional B Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B cell",
            "T cell",
            "Natural killer cell",
            "Plasma cell",
            "Memory B cell",
            "Memory T cell",
            "Regulatory T cell",
            "Dendritic cell",
            "Macrophage",
            "Neutrophil",
            "Eosinophil",
            "Basophil",
            "Mast cell",
            "Monocyte",
            "Lymphoblast",
            "Pre-B cell",
            "Pre-T cell",
            "Pro-B cell",
            "Pro-T cell",
            "Double positive thymocyte",
            "Double negative thymocyte",
            "Naive B cell",
            "Naive T cell",
            "Follicular dendritic cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B cell",
                "T cell",
                "Natural killer cell",
                "Plasma cell",
                "Memory B cell",
                "Memory T cell",
                "Regulatory T cell",
                "Dendritic cell",
                "Macrophage",
                "Neutrophil",
                "Eosinophil",
                "Basophil",
                "Mast cell",
                "Monocyte",
                "Lymphoblast",
                "Pre-B cell",
                "Pre-T cell",
                "Pro-B cell",
                "Pro-T cell",
                "Double positive thymocyte",
                "Double negative thymocyte",
                "Naive B cell",
                "Naive T cell",
                "Follicular dendritic cell"
            ],
            "mismatches": [],
            "true_referents": [
                "B cell",
                "Basophil",
                "Dendritic cell",
                "Double negative thymocyte",
                "Double positive thymocyte",
                "Eosinophil",
                "Follicular dendritic cell",
                "Lymphoblast",
                "Macrophage",
                "Mast cell",
                "Memory B cell",
                "Memory T cell",
                "Monocyte",
                "Naive B cell",
                "Naive T cell",
                "Natural killer cell",
                "Neutrophil",
                "Plasma cell",
                "Pre-B cell",
                "Pre-T cell",
                "Pro-B cell",
                "Pro-T cell",
                "Regulatory T cell",
                "T cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "Na\u00efve B cell",
            "Plasma cell (PC)",
            "Memory B cell",
            "Germinal center B cell",
            "Follicular B cell",
            "Marginal zone B cell",
            "B-1 cell",
            "B-2 cell",
            "Regulatory B cell (B_REG)",
            "Activated B cell",
            "Transitional B cell",
            "Plasmablast",
            "Pre-B cell",
            "IgM-secreting B cell",
            "IgG-secreting B cell",
            "IgA-secreting B cell",
            "Marginal zone precursor B cell",
            "B cell acute lymphoblastic leukemia cell",
            "Burkitt lymphoma B cell line",
            "Diffuse large B cell lymphoma cell",
            "Chronic lymphocytic leukemia B cell",
            "Plasmacyte",
            "Innate-like B cell",
            "B-lymphocyte",
            "B cell progenitor"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Na\u00efve B cell",
                "Plasma cell (PC)",
                "Memory B cell",
                "Germinal center B cell",
                "Follicular B cell",
                "Marginal zone B cell",
                "B-1 cell",
                "B-2 cell",
                "Regulatory B cell (B_REG)",
                "Activated B cell",
                "Transitional B cell",
                "Plasmablast",
                "Pre-B cell",
                "IgM-secreting B cell",
                "IgG-secreting B cell",
                "IgA-secreting B cell",
                "Marginal zone precursor B cell",
                "B cell acute lymphoblastic leukemia cell",
                "Burkitt lymphoma B cell line",
                "Diffuse large B cell lymphoma cell",
                "Chronic lymphocytic leukemia B cell",
                "Plasmacyte",
                "Innate-like B cell",
                "B-lymphocyte"
            ],
            "mismatches": [
                "B cell progenitor"
            ],
            "true_referents": [
                "Activated B cell",
                "B cell acute lymphoblastic leukemia cell",
                "B-1 cell",
                "B-2 cell",
                "B-lymphocyte",
                "Burkitt lymphoma B cell line",
                "Chronic lymphocytic leukemia B cell",
                "Diffuse large B cell lymphoma cell",
                "Follicular B cell",
                "Germinal center B cell",
                "IgA-secreting B cell",
                "IgG-secreting B cell",
                "IgM-secreting B cell",
                "Innate-like B cell",
                "Marginal zone B cell",
                "Marginal zone precursor B cell",
                "Memory B cell",
                "Na\u00efve B cell",
                "Plasma cell (PC)",
                "Plasmablast",
                "Plasmacyte",
                "Pre-B cell",
                "Regulatory B cell (B_REG)",
                "Transitional B cell"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B lymphocyte (B cell)",
            "Plasma cell",
            "Memory B cell",
            "Follicular B cell",
            "Marginal zone B cell",
            "B-1 cell",
            "Regulatory B cell (Breg)",
            "Plasmablast",
            "Germinal center B cell",
            "Transitional B cell",
            "Naive B cell",
            "Activated B cell",
            "Antibody-secreting cell (ASC)",
            "Long-lived plasma cell",
            "Short-lived plasma cell",
            "Immature B cell",
            "Pre-B cell",
            "Pro-B cell",
            "B-2 cell",
            "Mature B cell",
            "Effector B cell",
            "IgM-secreting B cell",
            "IgG-secreting B cell",
            "IgA-secreting B cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B lymphocyte (B cell)",
                "Plasma cell",
                "Memory B cell",
                "Follicular B cell",
                "Marginal zone B cell",
                "B-1 cell",
                "Regulatory B cell (Breg)",
                "Plasmablast",
                "Germinal center B cell",
                "Transitional B cell",
                "Naive B cell",
                "Activated B cell",
                "Antibody-secreting cell (ASC)",
                "Long-lived plasma cell",
                "Short-lived plasma cell",
                "Immature B cell",
                "Pre-B cell",
                "Pro-B cell",
                "B-2 cell",
                "Mature B cell",
                "Effector B cell",
                "IgM-secreting B cell",
                "IgG-secreting B cell",
                "IgA-secreting B cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B cell",
                "Antibody-secreting cell (ASC)",
                "B lymphocyte (B cell)",
                "B-1 cell",
                "B-2 cell",
                "Effector B cell",
                "Follicular B cell",
                "Germinal center B cell",
                "IgA-secreting B cell",
                "IgG-secreting B cell",
                "IgM-secreting B cell",
                "Immature B cell",
                "Long-lived plasma cell",
                "Marginal zone B cell",
                "Mature B cell",
                "Memory B cell",
                "Naive B cell",
                "Plasma cell",
                "Plasmablast",
                "Pre-B cell",
                "Pro-B cell",
                "Regulatory B cell (Breg)",
                "Short-lived plasma cell",
                "Transitional B cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B lymphocyte (B cell)",
            "Plasma cell",
            "Memory B cell",
            "Follicular B cell",
            "Marginal zone B cell",
            "B-1 cell",
            "B-2 cell",
            "Regulatory B cell (Breg)",
            "Transitional B cell",
            "Naive B cell",
            "Germinal center B cell",
            "Plasmablast",
            "Long-lived plasma cell",
            "Short-lived plasma cell",
            "IgM-expressing B cell",
            "IgD-expressing B cell",
            "IgG-expressing B cell",
            "IgA-expressing B cell",
            "IgE-expressing B cell",
            "CD19+ B cell",
            "CD20+ B cell",
            "CD21+ B cell",
            "CD22+ B cell",
            "CD27+ B cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B lymphocyte (B cell)",
                "Plasma cell",
                "Memory B cell",
                "Follicular B cell",
                "Marginal zone B cell",
                "B-1 cell",
                "B-2 cell",
                "Regulatory B cell (Breg)",
                "Transitional B cell",
                "Naive B cell",
                "Germinal center B cell",
                "Plasmablast",
                "Long-lived plasma cell",
                "Short-lived plasma cell",
                "IgM-expressing B cell",
                "IgD-expressing B cell",
                "IgG-expressing B cell",
                "IgA-expressing B cell",
                "IgE-expressing B cell",
                "CD19+ B cell",
                "CD20+ B cell",
                "CD21+ B cell",
                "CD22+ B cell",
                "CD27+ B cell"
            ],
            "mismatches": [],
            "true_referents": [
                "B lymphocyte (B cell)",
                "B-1 cell",
                "B-2 cell",
                "CD19+ B cell",
                "CD20+ B cell",
                "CD21+ B cell",
                "CD22+ B cell",
                "CD27+ B cell",
                "Follicular B cell",
                "Germinal center B cell",
                "IgA-expressing B cell",
                "IgD-expressing B cell",
                "IgE-expressing B cell",
                "IgG-expressing B cell",
                "IgM-expressing B cell",
                "Long-lived plasma cell",
                "Marginal zone B cell",
                "Memory B cell",
                "Naive B cell",
                "Plasma cell",
                "Plasmablast",
                "Regulatory B cell (Breg)",
                "Short-lived plasma cell",
                "Transitional B cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B lymphocyte (B cell)",
            "Plasma cell",
            "Memory B cell",
            "Marginal zone B cell",
            "Follicular B cell",
            "Regulatory B cell",
            "Breg cell",
            "Immature B cell",
            "Transitional B cell",
            "Naive B cell",
            "Activated B cell",
            "Plasmablast",
            "IgM+ B cell",
            "IgG+ B cell",
            "IgA+ B cell",
            "IgE+ B cell",
            "IgD+ B cell",
            "Bone marrow B cell",
            "Peripheral blood B cell",
            "Splenic B cell",
            "Lymph node B cell",
            "Mucosal B cell",
            "Peritoneal B cell",
            "Bursal B cell (in birds)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B lymphocyte (B cell)",
                "Plasma cell",
                "Memory B cell",
                "Marginal zone B cell",
                "Follicular B cell",
                "Regulatory B cell",
                "Breg cell",
                "Immature B cell",
                "Transitional B cell",
                "Naive B cell",
                "Activated B cell",
                "Plasmablast",
                "IgM+ B cell",
                "IgG+ B cell",
                "IgA+ B cell",
                "IgE+ B cell",
                "IgD+ B cell",
                "Bone marrow B cell",
                "Peripheral blood B cell",
                "Splenic B cell",
                "Lymph node B cell",
                "Mucosal B cell",
                "Peritoneal B cell",
                "Bursal B cell (in birds)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B cell",
                "B lymphocyte (B cell)",
                "Bone marrow B cell",
                "Breg cell",
                "Bursal B cell (in birds)",
                "Follicular B cell",
                "IgA+ B cell",
                "IgD+ B cell",
                "IgE+ B cell",
                "IgG+ B cell",
                "IgM+ B cell",
                "Immature B cell",
                "Lymph node B cell",
                "Marginal zone B cell",
                "Memory B cell",
                "Mucosal B cell",
                "Naive B cell",
                "Peripheral blood B cell",
                "Peritoneal B cell",
                "Plasma cell",
                "Plasmablast",
                "Regulatory B cell",
                "Splenic B cell",
                "Transitional B cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "Plasma Cell (PC)",
            "B Lymphocyte (B Cell)",
            "Memory B Cell",
            "Follicular B Cell",
            "Marginal Zone B Cell",
            "Germinal Center B Cell",
            "Plasmablast",
            "Naive B Cell",
            "Regulatory B Cell (Breg)",
            "Innate-like B Cell",
            "B-1 Cell",
            "B-2 Cell",
            "Antibody-Secreting Cell (ASC)",
            "Plasma Blast",
            "Plasma Cell Precursor",
            "Activated B Cell",
            "Antigen-Experienced B Cell",
            "Antigen-Specific B Cell",
            "Isotype-Switched B Cell",
            "IgM Memory B Cell",
            "IgG Memory B Cell",
            "IgA Memory B Cell",
            "IgE Memory B Cell",
            "Transitional B Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Plasma Cell (PC)",
                "B Lymphocyte (B Cell)",
                "Memory B Cell",
                "Follicular B Cell",
                "Marginal Zone B Cell",
                "Germinal Center B Cell",
                "Plasmablast",
                "Naive B Cell",
                "Regulatory B Cell (Breg)",
                "Innate-like B Cell",
                "B-1 Cell",
                "B-2 Cell",
                "Antibody-Secreting Cell (ASC)",
                "Plasma Blast",
                "Plasma Cell Precursor",
                "Activated B Cell",
                "Antigen-Experienced B Cell",
                "Antigen-Specific B Cell",
                "Isotype-Switched B Cell",
                "IgM Memory B Cell",
                "IgG Memory B Cell",
                "IgA Memory B Cell",
                "IgE Memory B Cell",
                "Transitional B Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B Cell",
                "Antibody-Secreting Cell (ASC)",
                "Antigen-Experienced B Cell",
                "Antigen-Specific B Cell",
                "B Lymphocyte (B Cell)",
                "B-1 Cell",
                "B-2 Cell",
                "Follicular B Cell",
                "Germinal Center B Cell",
                "IgA Memory B Cell",
                "IgE Memory B Cell",
                "IgG Memory B Cell",
                "IgM Memory B Cell",
                "Innate-like B Cell",
                "Isotype-Switched B Cell",
                "Marginal Zone B Cell",
                "Memory B Cell",
                "Naive B Cell",
                "Plasma Blast",
                "Plasma Cell (PC)",
                "Plasma Cell Precursor",
                "Plasmablast",
                "Regulatory B Cell (Breg)",
                "Transitional B Cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B cell (B lymphocyte)",
            "Plasma cell",
            "Activated B cell",
            "B lymphocyte",
            "B cell precursor",
            "Immunoblast",
            "Large granular lymphocyte",
            "Marginal zone B cell",
            "Follicular B cell",
            "Activated plasma cell",
            "Plasmablast",
            "Antigen-presenting B cell",
            "Memory B cell",
            "Naive B cell",
            "Transitional B cell",
            "T-independent B cell",
            "T-dependent B cell",
            "B1 B cell",
            "B2 B cell",
            "CD19+ B cell",
            "CD20+ B cell",
            "CD21+ B cell",
            "CD22+ B cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B cell (B lymphocyte)",
                "Plasma cell",
                "Activated B cell",
                "B lymphocyte",
                "B cell precursor",
                "Immunoblast",
                "Large granular lymphocyte",
                "Marginal zone B cell",
                "Follicular B cell",
                "Activated plasma cell",
                "Plasmablast",
                "Antigen-presenting B cell",
                "Memory B cell",
                "Naive B cell",
                "Transitional B cell",
                "T-independent B cell",
                "T-dependent B cell",
                "B1 B cell",
                "B2 B cell",
                "CD19+ B cell",
                "CD20+ B cell",
                "CD21+ B cell",
                "CD22+ B cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated B cell",
                "Activated plasma cell",
                "Antigen-presenting B cell",
                "B cell (B lymphocyte)",
                "B cell precursor",
                "B lymphocyte",
                "B1 B cell",
                "B2 B cell",
                "CD19+ B cell",
                "CD20+ B cell",
                "CD21+ B cell",
                "CD22+ B cell",
                "Follicular B cell",
                "Immunoblast",
                "Large granular lymphocyte",
                "Marginal zone B cell",
                "Memory B cell",
                "Naive B cell",
                "Plasma cell",
                "Plasmablast",
                "T-dependent B cell",
                "T-independent B cell",
                "Transitional B cell"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            "B cell (B)",
            "Plasmablast (PB)",
            "Naive B cell (NBC)",
            "Activated B cell (ABC)",
            "Memory B cell (MBC)",
            "Plasma cell (PC)",
            "Marginal zone B cell (MZB)",
            "Follicular B cell (FBC)",
            "CD5+ B cell",
            "B-1 cell",
            "B-2 cell",
            "IgD+ CD27+ B cell",
            "IgM+ CD27+ B cell",
            "IgM+ CD27- B cell",
            " Transitional B cell (T1, T2, T3)",
            "Regulatory B cell (Breg)",
            "B cell receptor edited cell",
            "Anergic B cell",
            "Effector B cell",
            "Central memory B cell (CMBC)",
            "Effector memory B cell (EMBC)",
            "Tissue-like memory B cell",
            "Stem cell memory B cell",
            "Antibody-secreting cell (ASC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "B cell (B)",
                "Plasmablast (PB)",
                "Naive B cell (NBC)",
                "Activated B cell (ABC)",
                "Memory B cell (MBC)",
                "Plasma cell (PC)",
                "Marginal zone B cell (MZB)",
                "Follicular B cell (FBC)",
                "CD5+ B cell",
                "B-1 cell",
                "B-2 cell",
                "IgD+ CD27+ B cell",
                "IgM+ CD27+ B cell",
                "IgM+ CD27- B cell",
                "Transitional B cell (T1, T2, T3)",
                "Regulatory B cell (Breg)",
                "B cell receptor edited cell",
                "Anergic B cell",
                "Effector B cell",
                "Central memory B cell (CMBC)",
                "Effector memory B cell (EMBC)",
                "Tissue-like memory B cell",
                "Stem cell memory B cell",
                "Antibody-secreting cell (ASC)"
            ],
            "mismatches": [],
            "true_referents": [
                " Transitional B cell (T1, T2, T3)",
                "Activated B cell (ABC)",
                "Anergic B cell",
                "Antibody-secreting cell (ASC)",
                "B cell (B)",
                "B cell receptor edited cell",
                "B-1 cell",
                "B-2 cell",
                "CD5+ B cell",
                "Central memory B cell (CMBC)",
                "Effector B cell",
                "Effector memory B cell (EMBC)",
                "Follicular B cell (FBC)",
                "IgD+ CD27+ B cell",
                "IgM+ CD27+ B cell",
                "IgM+ CD27- B cell",
                "Marginal zone B cell (MZB)",
                "Memory B cell (MBC)",
                "Naive B cell (NBC)",
                "Plasma cell (PC)",
                "Plasmablast (PB)",
                "Regulatory B cell (Breg)",
                "Stem cell memory B cell",
                "Tissue-like memory B cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "antibody-producing cell",
        "domain": "biology",
        "response": [
            {
                "Referent": "lymphocyte",
                "Canonical Name": "Lymphocyte"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "lymphocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"lymphocyte\", \"Canonical Name\": \"Lymphocyte\"}"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]