[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (K)",
            "Melanocyte (M)",
            "Langerhans cell (LC)",
            "Merkel cell (MC)",
            "Eccrine sweat gland duct cell (SGD)",
            "Eccrine sweat gland myoepithelial cell (SGME)",
            "Sebaceous gland cell (SGC)",
            "Hair matrix cell (HMC)",
            "Hair shaft cell (HSC)",
            "Hair follicle bulge cell (HFC)",
            "Caf\u00e9-au-lait spot cell (CLS)",
            "Nail matrix cell (NMC)",
            "Nail bed cell (NBC)",
            "Nail plate cell (NPC)",
            "Stratum corneum cell (SCC)",
            "Stratum lucidum cell (SLC)",
            "Stratum granulosum cell (SGC)",
            "Stratum spinosum cell (SSC)",
            "Stratum basale cell (SBC)",
            "Epidermal dendritic cell (EDC)",
            "Epidermal dendritic cell (EDC)",
            "Epidermal dendritic cell (EDC)",
            "Epidermal dendritic cell (EDC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (K)",
                "Melanocyte (M)",
                "Langerhans cell (LC)",
                "Merkel cell (MC)",
                "Eccrine sweat gland duct cell (SGD)",
                "Eccrine sweat gland myoepithelial cell (SGME)",
                "Sebaceous gland cell (SGC)",
                "Hair matrix cell (HMC)",
                "Hair shaft cell (HSC)",
                "Hair follicle bulge cell (HFC)",
                "Caf\u00e9-au-lait spot cell (CLS)",
                "Nail matrix cell (NMC)",
                "Nail bed cell (NBC)",
                "Nail plate cell (NPC)",
                "Stratum corneum cell (SCC)",
                "Stratum lucidum cell (SLC)",
                "Stratum granulosum cell (SGC)",
                "Stratum spinosum cell (SSC)",
                "Stratum basale cell (SBC)",
                "Epidermal dendritic cell (EDC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Caf\u00e9-au-lait spot cell (CLS)",
                "Eccrine sweat gland duct cell (SGD)",
                "Eccrine sweat gland myoepithelial cell (SGME)",
                "Epidermal dendritic cell (EDC)",
                "Hair follicle bulge cell (HFC)",
                "Hair matrix cell (HMC)",
                "Hair shaft cell (HSC)",
                "Keratinocyte (K)",
                "Langerhans cell (LC)",
                "Melanocyte (M)",
                "Merkel cell (MC)",
                "Nail bed cell (NBC)",
                "Nail matrix cell (NMC)",
                "Nail plate cell (NPC)",
                "Sebaceous gland cell (SGC)",
                "Stratum basale cell (SBC)",
                "Stratum corneum cell (SCC)",
                "Stratum granulosum cell (SGC)",
                "Stratum lucidum cell (SLC)",
                "Stratum spinosum cell (SSC)"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (Keratinocyte)",
            "Stratum corneum cell (Stratum corneum cell)",
            "Corneocyte (Corneocyte)",
            "Desmosome (Desmosome)",
            "Lamellar body (Lamellar body)",
            "Filaggrin (Filaggrin)",
            "Involucrin (Involucrin)",
            "Loricrin (Loricrin)",
            "Keratohyalin granule (Keratohyalin granule)",
            "Granular cell (Granular cell)",
            "Enucleated keratinocyte (Enucleated keratinocyte)",
            "Cornified envelope (Cornified envelope)",
            "Profilaggrin (Profilaggrin)",
            "Transglutaminase (Transglutaminase)",
            "Natural moisturizing factor (NMF)",
            "Lipid bilayer (Lipid bilayer)",
            "Sphingomyelin (Sphingomyelin)",
            "Ceramide (Ceramide)",
            "Cholesterol (Cholesterol)",
            "Free fatty acid (FFA)",
            "Elastin (Elastin)",
            "Collagen type VII (Collagen VII)",
            "Laminin-5 (Laminin-5)",
            "Integrin (Integrin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (Keratinocyte)",
                "Stratum corneum cell (Stratum corneum cell)",
                "Corneocyte (Corneocyte)",
                "Desmosome (Desmosome)",
                "Lamellar body (Lamellar body)",
                "Filaggrin (Filaggrin)",
                "Involucrin (Involucrin)",
                "Loricrin (Loricrin)",
                "Keratohyalin granule (Keratohyalin granule)",
                "Granular cell (Granular cell)",
                "Enucleated keratinocyte (Enucleated keratinocyte)",
                "Cornified envelope (Cornified envelope)",
                "Profilaggrin (Profilaggrin)",
                "Transglutaminase (Transglutaminase)",
                "Natural moisturizing factor (NMF)",
                "Lipid bilayer (Lipid bilayer)",
                "Sphingomyelin (Sphingomyelin)",
                "Ceramide (Ceramide)",
                "Cholesterol (Cholesterol)",
                "Free fatty acid (FFA)",
                "Elastin (Elastin)",
                "Collagen type VII (Collagen VII)",
                "Laminin-5 (Laminin-5)",
                "Integrin (Integrin)"
            ],
            "mismatches": [],
            "true_referents": [
                "Ceramide (Ceramide)",
                "Cholesterol (Cholesterol)",
                "Collagen type VII (Collagen VII)",
                "Corneocyte (Corneocyte)",
                "Cornified envelope (Cornified envelope)",
                "Desmosome (Desmosome)",
                "Elastin (Elastin)",
                "Enucleated keratinocyte (Enucleated keratinocyte)",
                "Filaggrin (Filaggrin)",
                "Free fatty acid (FFA)",
                "Granular cell (Granular cell)",
                "Integrin (Integrin)",
                "Involucrin (Involucrin)",
                "Keratinocyte (Keratinocyte)",
                "Keratohyalin granule (Keratohyalin granule)",
                "Lamellar body (Lamellar body)",
                "Laminin-5 (Laminin-5)",
                "Lipid bilayer (Lipid bilayer)",
                "Loricrin (Loricrin)",
                "Natural moisturizing factor (NMF)",
                "Profilaggrin (Profilaggrin)",
                "Sphingomyelin (Sphingomyelin)",
                "Stratum corneum cell (Stratum corneum cell)",
                "Transglutaminase (Transglutaminase)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte",
            "Melanocyte",
            "Langerhans cell",
            "Merkel cell",
            "Epidermal stem cell",
            "Basal cell",
            "Stratum corneum cell",
            "Stratum lucidum cell",
            "Stratum granulosum cell",
            "Stratum spinosum cell",
            "Stratum basale cell",
            "Epidermal dendritic cell",
            "Epidermal dendritic cell",
            "Epidermal fibroblast",
            "Epidermal Schwann cell",
            "Epidermal immune cell",
            "Epidermal macrophage",
            "Epidermal T cell",
            "Epidermal B cell",
            "Epidermal natural killer cell",
            "Epidermal dendritic cell",
            "Epidermal Langerhans cell",
            "Epidermal Merkel cell",
            "Epidermal melanocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte",
                "Melanocyte",
                "Langerhans cell",
                "Merkel cell",
                "Epidermal stem cell",
                "Basal cell",
                "Stratum corneum cell",
                "Stratum lucidum cell",
                "Stratum granulosum cell",
                "Stratum spinosum cell",
                "Stratum basale cell",
                "Epidermal dendritic cell",
                "Epidermal fibroblast",
                "Epidermal Schwann cell",
                "Epidermal immune cell",
                "Epidermal macrophage",
                "Epidermal T cell",
                "Epidermal B cell",
                "Epidermal natural killer cell",
                "Epidermal Langerhans cell",
                "Epidermal Merkel cell",
                "Epidermal melanocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell",
                "Epidermal B cell",
                "Epidermal Langerhans cell",
                "Epidermal Merkel cell",
                "Epidermal Schwann cell",
                "Epidermal T cell",
                "Epidermal dendritic cell",
                "Epidermal fibroblast",
                "Epidermal immune cell",
                "Epidermal macrophage",
                "Epidermal melanocyte",
                "Epidermal natural killer cell",
                "Epidermal stem cell",
                "Keratinocyte",
                "Langerhans cell",
                "Melanocyte",
                "Merkel cell",
                "Stratum basale cell",
                "Stratum corneum cell",
                "Stratum granulosum cell",
                "Stratum lucidum cell",
                "Stratum spinosum cell"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (KRT)",
            "Stratum corneum cell",
            "Basal cell keratinocyte (BCK)",
            "Squamous cell keratinocyte (SCK)",
            "Granular cell keratinocyte (GCK)",
            "Prickle cell keratinocyte (PCK)",
            "Differentiated keratinocyte",
            "Undifferentiated keratinocyte",
            "Epidermal keratinocyte",
            "Keratinized cell",
            "Non-pigmenting keratinocyte",
            "Suprabasal keratinocyte",
            "Tonofilament-containing cell",
            "Cell producing filaggrin",
            "Cell producing loricrin",
            "Cell producing involucrin",
            "Cell expressing E-cadherin",
            "Cell undergoing cornification",
            "Cell forming epidermal barrier",
            "Cell contributing to skin waterproofing",
            "Cell involved in wound healing (epidermal)",
            "Cell sensitive to UV radiation",
            "Cell capable of apoptosis (epidermal)",
            "Cell participating in immune response (epidermal)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (KRT)",
                "Stratum corneum cell",
                "Basal cell keratinocyte (BCK)",
                "Squamous cell keratinocyte (SCK)",
                "Granular cell keratinocyte (GCK)",
                "Prickle cell keratinocyte (PCK)",
                "Differentiated keratinocyte",
                "Undifferentiated keratinocyte",
                "Epidermal keratinocyte",
                "Keratinized cell",
                "Non-pigmenting keratinocyte",
                "Suprabasal keratinocyte",
                "Tonofilament-containing cell",
                "Cell producing filaggrin",
                "Cell producing loricrin",
                "Cell producing involucrin",
                "Cell expressing E-cadherin",
                "Cell undergoing cornification",
                "Cell forming epidermal barrier",
                "Cell contributing to skin waterproofing",
                "Cell involved in wound healing (epidermal)",
                "Cell sensitive to UV radiation",
                "Cell capable of apoptosis (epidermal)",
                "Cell participating in immune response (epidermal)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell keratinocyte (BCK)",
                "Cell capable of apoptosis (epidermal)",
                "Cell contributing to skin waterproofing",
                "Cell expressing E-cadherin",
                "Cell forming epidermal barrier",
                "Cell involved in wound healing (epidermal)",
                "Cell participating in immune response (epidermal)",
                "Cell producing filaggrin",
                "Cell producing involucrin",
                "Cell producing loricrin",
                "Cell sensitive to UV radiation",
                "Cell undergoing cornification",
                "Differentiated keratinocyte",
                "Epidermal keratinocyte",
                "Granular cell keratinocyte (GCK)",
                "Keratinized cell",
                "Keratinocyte (KRT)",
                "Non-pigmenting keratinocyte",
                "Prickle cell keratinocyte (PCK)",
                "Squamous cell keratinocyte (SCK)",
                "Stratum corneum cell",
                "Suprabasal keratinocyte",
                "Tonofilament-containing cell",
                "Undifferentiated keratinocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (KC)",
            "Melanocyte (MC)",
            "Langerhans cell (LC)",
            "Merkel cell (MeC)",
            "Basal cell (BC)",
            "Squamous cell (SC)",
            "Granular cell (GC)",
            "Prickle cell (PC)",
            "Clear cell (ClC)",
            "Dendritic cell (DC)",
            "Epidermal stem cell (ESC)",
            "Stratum corneum cell (SCC)",
            "Stratum lucidum cell (SLC)",
            "Stratum granulosum cell (SGC)",
            "Stratum spinosum cell (SSpC)",
            "Stratum basale cell (SBC)",
            "Corneocyte (CoC)",
            "Horny cell (HC)",
            "Epidermal keratinocyte (EKC)",
            "Epidermal melanocyte (EMC)",
            "Epidermal dendritic cell (EDC)",
            "Epidermal Merkel cell (EMeC)",
            "Epidermal Langerhans cell (ELC)",
            "Epidermal clear cell (EClC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (KC)",
                "Melanocyte (MC)",
                "Langerhans cell (LC)",
                "Merkel cell (MeC)",
                "Basal cell (BC)",
                "Squamous cell (SC)",
                "Granular cell (GC)",
                "Prickle cell (PC)",
                "Clear cell (ClC)",
                "Dendritic cell (DC)",
                "Epidermal stem cell (ESC)",
                "Stratum corneum cell (SCC)",
                "Stratum lucidum cell (SLC)",
                "Stratum granulosum cell (SGC)",
                "Stratum spinosum cell (SSpC)",
                "Stratum basale cell (SBC)",
                "Corneocyte (CoC)",
                "Horny cell (HC)",
                "Epidermal keratinocyte (EKC)",
                "Epidermal melanocyte (EMC)",
                "Epidermal dendritic cell (EDC)",
                "Epidermal Merkel cell (EMeC)",
                "Epidermal Langerhans cell (ELC)",
                "Epidermal clear cell (EClC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell (BC)",
                "Clear cell (ClC)",
                "Corneocyte (CoC)",
                "Dendritic cell (DC)",
                "Epidermal Langerhans cell (ELC)",
                "Epidermal Merkel cell (EMeC)",
                "Epidermal clear cell (EClC)",
                "Epidermal dendritic cell (EDC)",
                "Epidermal keratinocyte (EKC)",
                "Epidermal melanocyte (EMC)",
                "Epidermal stem cell (ESC)",
                "Granular cell (GC)",
                "Horny cell (HC)",
                "Keratinocyte (KC)",
                "Langerhans cell (LC)",
                "Melanocyte (MC)",
                "Merkel cell (MeC)",
                "Prickle cell (PC)",
                "Squamous cell (SC)",
                "Stratum basale cell (SBC)",
                "Stratum corneum cell (SCC)",
                "Stratum granulosum cell (SGC)",
                "Stratum lucidum cell (SLC)",
                "Stratum spinosum cell (SSpC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (K1)",
            "Melanocyte (M1)",
            "Langerhans cell (L1)",
            "Merkel cell (M1)",
            "Basal cell (B1)",
            "Squamous cell (S1)",
            "Sebocyte (S2)",
            "Adipocyte (A1)",
            "Dendritic cell (D1)",
            "Fibroblast (F1)",
            "Endothelial cell (E1)",
            "Epidermal stem cell (E2)",
            "Pacinian corpuscle cell (P1)",
            "Ruffini ending cell (R1)",
            "Hair follicle stem cell (H1)",
            "Matrix cell (M2)",
            "Keratin-producing cell (K2)",
            "Stratum corneum cell (S3)",
            "Stratum granulosum cell (S4)",
            "Stratum spinosum cell (S5)",
            "Stratum basale cell (S6)",
            "Lipid-laden cell (L2)",
            "Immune cell (I1)",
            "Inflammatory cell (I2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (K1)",
                "Melanocyte (M1)",
                "Langerhans cell (L1)",
                "Merkel cell (M1)",
                "Basal cell (B1)",
                "Squamous cell (S1)",
                "Sebocyte (S2)",
                "Adipocyte (A1)",
                "Dendritic cell (D1)",
                "Fibroblast (F1)",
                "Endothelial cell (E1)",
                "Epidermal stem cell (E2)",
                "Pacinian corpuscle cell (P1)",
                "Ruffini ending cell (R1)",
                "Hair follicle stem cell (H1)",
                "Matrix cell (M2)",
                "Keratin-producing cell (K2)",
                "Stratum corneum cell (S3)",
                "Stratum granulosum cell (S4)",
                "Stratum spinosum cell (S5)",
                "Stratum basale cell (S6)",
                "Lipid-laden cell (L2)",
                "Immune cell (I1)",
                "Inflammatory cell (I2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (A1)",
                "Basal cell (B1)",
                "Dendritic cell (D1)",
                "Endothelial cell (E1)",
                "Epidermal stem cell (E2)",
                "Fibroblast (F1)",
                "Hair follicle stem cell (H1)",
                "Immune cell (I1)",
                "Inflammatory cell (I2)",
                "Keratin-producing cell (K2)",
                "Keratinocyte (K1)",
                "Langerhans cell (L1)",
                "Lipid-laden cell (L2)",
                "Matrix cell (M2)",
                "Melanocyte (M1)",
                "Merkel cell (M1)",
                "Pacinian corpuscle cell (P1)",
                "Ruffini ending cell (R1)",
                "Sebocyte (S2)",
                "Squamous cell (S1)",
                "Stratum basale cell (S6)",
                "Stratum corneum cell (S3)",
                "Stratum granulosum cell (S4)",
                "Stratum spinosum cell (S5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (KC)",
            "Melanocyte (MC)",
            "Langerhans cell (LC)",
            "Merkel cell (MerkC)",
            "Stem cell (SC)",
            "Basal cell (BC)",
            "Transit amplifying cell (TAC)",
            "Spinous cell (SpC)",
            "Granular cell (GC)",
            "Corneocyte (CorC)",
            "Melanosome (MelS)",
            "Melanoblast (MelB)",
            "Melanoma cell (MelC)",
            "Epidermal dendritic cell (EDC)",
            "Epidermal T cell (ETC)",
            "Epidermal B cell (EBC)",
            "Epidermal Natural Killer cell (ENKC)",
            "Epidermal Macrophage (EMa)",
            "Epidermal Neutrophil (EN)",
            "Epidermal Monocyte (EMo)",
            "Epidermal Lymphocyte (EL)",
            "Epidermal Basophil (EB)",
            "Epidermal Eosinophil (EE)",
            "Epidermal Mast cell (EMaC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (KC)",
                "Melanocyte (MC)",
                "Langerhans cell (LC)",
                "Merkel cell (MerkC)",
                "Stem cell (SC)",
                "Basal cell (BC)",
                "Transit amplifying cell (TAC)",
                "Spinous cell (SpC)",
                "Granular cell (GC)",
                "Corneocyte (CorC)",
                "Melanosome (MelS)",
                "Melanoblast (MelB)",
                "Melanoma cell (MelC)",
                "Epidermal dendritic cell (EDC)",
                "Epidermal T cell (ETC)",
                "Epidermal B cell (EBC)",
                "Epidermal Natural Killer cell (ENKC)",
                "Epidermal Macrophage (EMa)",
                "Epidermal Neutrophil (EN)",
                "Epidermal Monocyte (EMo)",
                "Epidermal Lymphocyte (EL)",
                "Epidermal Basophil (EB)",
                "Epidermal Eosinophil (EE)",
                "Epidermal Mast cell (EMaC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell (BC)",
                "Corneocyte (CorC)",
                "Epidermal B cell (EBC)",
                "Epidermal Basophil (EB)",
                "Epidermal Eosinophil (EE)",
                "Epidermal Lymphocyte (EL)",
                "Epidermal Macrophage (EMa)",
                "Epidermal Mast cell (EMaC)",
                "Epidermal Monocyte (EMo)",
                "Epidermal Natural Killer cell (ENKC)",
                "Epidermal Neutrophil (EN)",
                "Epidermal T cell (ETC)",
                "Epidermal dendritic cell (EDC)",
                "Granular cell (GC)",
                "Keratinocyte (KC)",
                "Langerhans cell (LC)",
                "Melanoblast (MelB)",
                "Melanocyte (MC)",
                "Melanoma cell (MelC)",
                "Melanosome (MelS)",
                "Merkel cell (MerkC)",
                "Spinous cell (SpC)",
                "Stem cell (SC)",
                "Transit amplifying cell (TAC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte",
            "Melanocyte",
            "Langerhans cell",
            "Merkel cell",
            "Squamous cell",
            "Basal cell",
            "Epidermal cell",
            "Stratum corneum cell",
            "Stratum granulosum cell",
            "Stratum spinosum cell",
            "Stratum basale cell",
            "Dendritic cell",
            "Fibroblast",
            "Sebocyte",
            "Sweat gland cell",
            "Hair follicle cell",
            "Epidermal stem cell",
            "Keratocyte",
            "Desquamated cell",
            "Corneocyte",
            "Epithelial cell",
            "Cutaneous cell",
            "Skin cell",
            "Epidermal keratinocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte",
                "Melanocyte",
                "Langerhans cell",
                "Merkel cell",
                "Squamous cell",
                "Basal cell",
                "Epidermal cell",
                "Stratum corneum cell",
                "Stratum granulosum cell",
                "Stratum spinosum cell",
                "Stratum basale cell",
                "Dendritic cell",
                "Fibroblast",
                "Sebocyte",
                "Sweat gland cell",
                "Hair follicle cell",
                "Epidermal stem cell",
                "Keratocyte",
                "Desquamated cell",
                "Corneocyte",
                "Epithelial cell",
                "Cutaneous cell",
                "Skin cell",
                "Epidermal keratinocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell",
                "Corneocyte",
                "Cutaneous cell",
                "Dendritic cell",
                "Desquamated cell",
                "Epidermal cell",
                "Epidermal keratinocyte",
                "Epidermal stem cell",
                "Epithelial cell",
                "Fibroblast",
                "Hair follicle cell",
                "Keratinocyte",
                "Keratocyte",
                "Langerhans cell",
                "Melanocyte",
                "Merkel cell",
                "Sebocyte",
                "Skin cell",
                "Squamous cell",
                "Stratum basale cell",
                "Stratum corneum cell",
                "Stratum granulosum cell",
                "Stratum spinosum cell",
                "Sweat gland cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Corneocyte (CC)",
            "Dead Keratinocyte",
            "Compact Corneocyte",
            "Amorphous Corneocyte",
            "Lamellar Corneocyte",
            "Hydrated Corneocyte",
            "Dehydrated Corneocyte",
            "Cornified Corneocyte",
            "Reconstituted Corneocyte",
            "Damaged Corneocyte",
            "UV-Exposed Corneocyte",
            "Inflamed Corneocyte",
            "Aging Corneocyte",
            "Hyperkeratotic Corneocyte",
            "Hypokeratotic Corneocyte",
            "Barrier Corneocyte",
            "Scaly Corneocyte",
            "Frictional Corneocyte",
            "Squamous Corneocyte",
            "Mutated Corneocyte",
            "Phytoncide Corneocyte",
            "Corneocyte from Human Epidermis",
            "Corneocyte from Mouse Epidermis",
            "Antigen-Presenting Corneocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Corneocyte (CC)",
                "Dead Keratinocyte",
                "Compact Corneocyte",
                "Amorphous Corneocyte",
                "Lamellar Corneocyte",
                "Hydrated Corneocyte",
                "Dehydrated Corneocyte",
                "Cornified Corneocyte",
                "Reconstituted Corneocyte",
                "Damaged Corneocyte",
                "UV-Exposed Corneocyte",
                "Inflamed Corneocyte",
                "Aging Corneocyte",
                "Hyperkeratotic Corneocyte",
                "Hypokeratotic Corneocyte",
                "Barrier Corneocyte",
                "Scaly Corneocyte",
                "Frictional Corneocyte",
                "Squamous Corneocyte",
                "Mutated Corneocyte",
                "Phytoncide Corneocyte",
                "Corneocyte from Human Epidermis",
                "Corneocyte from Mouse Epidermis",
                "Antigen-Presenting Corneocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Aging Corneocyte",
                "Amorphous Corneocyte",
                "Antigen-Presenting Corneocyte",
                "Barrier Corneocyte",
                "Compact Corneocyte",
                "Corneocyte (CC)",
                "Corneocyte from Human Epidermis",
                "Corneocyte from Mouse Epidermis",
                "Cornified Corneocyte",
                "Damaged Corneocyte",
                "Dead Keratinocyte",
                "Dehydrated Corneocyte",
                "Frictional Corneocyte",
                "Hydrated Corneocyte",
                "Hyperkeratotic Corneocyte",
                "Hypokeratotic Corneocyte",
                "Inflamed Corneocyte",
                "Lamellar Corneocyte",
                "Mutated Corneocyte",
                "Phytoncide Corneocyte",
                "Reconstituted Corneocyte",
                "Scaly Corneocyte",
                "Squamous Corneocyte",
                "UV-Exposed Corneocyte"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte",
            "Melanocyte",
            "Langerhans cell",
            "Merkel cell",
            "Basal cell",
            "Spinous cell",
            "Granular cell",
            "Stratum corneum cell",
            "Epidermal stem cell",
            "Transit amplifying cell",
            "Squamous cell",
            "Dendritic cell (epidermal)",
            "Clear cell (Toker cell)",
            "Suprabasal cell",
            "Corneocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte",
                "Melanocyte",
                "Langerhans cell",
                "Merkel cell",
                "Basal cell",
                "Spinous cell",
                "Granular cell",
                "Stratum corneum cell",
                "Epidermal stem cell",
                "Transit amplifying cell",
                "Squamous cell",
                "Dendritic cell (epidermal)",
                "Clear cell (Toker cell)",
                "Suprabasal cell",
                "Corneocyte"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell",
                "Clear cell (Toker cell)",
                "Corneocyte",
                "Dendritic cell (epidermal)",
                "Epidermal stem cell",
                "Granular cell",
                "Keratinocyte",
                "Langerhans cell",
                "Melanocyte",
                "Merkel cell",
                "Spinous cell",
                "Squamous cell",
                "Stratum corneum cell",
                "Suprabasal cell",
                "Transit amplifying cell"
            ],
            "TP": 15,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte",
            "Melanocyte",
            "Langerhans cell",
            "Merkel cell",
            "Corneocyte",
            "Spinous cell",
            "Granular cell",
            "Basal cell",
            "Stem cell of epidermis",
            "Epidermal dendritic cell",
            "Epidermal T cell",
            "Epidermal \u03b3\u03b4 T cell",
            "CD8+ T cell in epidermis",
            "Intraepidermal nerve fiber",
            "Intraepidermal sweat duct cell",
            "Intraepidermal sebaceous gland cell",
            "Intraepidermal hair follicle cell",
            "Intraepidermal arrector pili muscle cell",
            "Intraepidermal apocrine gland cell",
            "Intraepidermal eccrine gland cell",
            "Tonofilament in epidermal cell",
            "Desmosome in epidermal cell",
            "Melanosome in epidermal cell",
            "Keratin filament in epidermal cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte",
                "Melanocyte",
                "Langerhans cell",
                "Merkel cell",
                "Corneocyte",
                "Spinous cell",
                "Granular cell",
                "Basal cell",
                "Stem cell of epidermis",
                "Epidermal dendritic cell",
                "Epidermal T cell",
                "Epidermal \u03b3\u03b4 T cell",
                "CD8+ T cell in epidermis",
                "Intraepidermal nerve fiber",
                "Intraepidermal sweat duct cell",
                "Intraepidermal sebaceous gland cell",
                "Intraepidermal hair follicle cell",
                "Intraepidermal arrector pili muscle cell",
                "Intraepidermal apocrine gland cell",
                "Intraepidermal eccrine gland cell",
                "Tonofilament in epidermal cell",
                "Desmosome in epidermal cell",
                "Melanosome in epidermal cell",
                "Keratin filament in epidermal cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal cell",
                "CD8+ T cell in epidermis",
                "Corneocyte",
                "Desmosome in epidermal cell",
                "Epidermal T cell",
                "Epidermal dendritic cell",
                "Epidermal \u03b3\u03b4 T cell",
                "Granular cell",
                "Intraepidermal apocrine gland cell",
                "Intraepidermal arrector pili muscle cell",
                "Intraepidermal eccrine gland cell",
                "Intraepidermal hair follicle cell",
                "Intraepidermal nerve fiber",
                "Intraepidermal sebaceous gland cell",
                "Intraepidermal sweat duct cell",
                "Keratin filament in epidermal cell",
                "Keratinocyte",
                "Langerhans cell",
                "Melanocyte",
                "Melanosome in epidermal cell",
                "Merkel cell",
                "Spinous cell",
                "Stem cell of epidermis",
                "Tonofilament in epidermal cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (KC)",
            "Merkel cell (MC)",
            "Melanocyte (MC)",
            "Langerhans cell (LC)",
            "Dendritic epidermal T cell (DETC)",
            "Lymphocyte (LC)",
            "Fibroblast (FB)",
            "Adipocyte (AC)",
            "Mast cell (MC)",
            "Macrophage (M\u03a6)",
            "Endothelial cell (EC)",
            "Pericyte (PC)",
            "Smooth muscle cell (SMC)",
            "Nerve cell (NC)",
            "Stem cell (SC)",
            "Transit amplifying cell (TAC)",
            "Corneocyte (CC)",
            "Basal cell (BC)",
            "Spinous cell (SC)",
            "Granular cell (GC)",
            "Stratum corneum cell (SCC)",
            "Stratum lucidum cell (SLC)",
            "Stratum granulosum cell (SGC)",
            "Stratum spinosum cell (SSC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (KC)",
                "Merkel cell (MC)",
                "Melanocyte (MC)",
                "Langerhans cell (LC)",
                "Dendritic epidermal T cell (DETC)",
                "Lymphocyte (LC)",
                "Fibroblast (FB)",
                "Adipocyte (AC)",
                "Mast cell (MC)",
                "Macrophage (M\u03a6)",
                "Endothelial cell (EC)",
                "Pericyte (PC)",
                "Smooth muscle cell (SMC)",
                "Nerve cell (NC)",
                "Stem cell (SC)",
                "Transit amplifying cell (TAC)",
                "Corneocyte (CC)",
                "Basal cell (BC)",
                "Spinous cell (SC)",
                "Granular cell (GC)",
                "Stratum corneum cell (SCC)",
                "Stratum lucidum cell (SLC)",
                "Stratum granulosum cell (SGC)",
                "Stratum spinosum cell (SSC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AC)",
                "Basal cell (BC)",
                "Corneocyte (CC)",
                "Dendritic epidermal T cell (DETC)",
                "Endothelial cell (EC)",
                "Fibroblast (FB)",
                "Granular cell (GC)",
                "Keratinocyte (KC)",
                "Langerhans cell (LC)",
                "Lymphocyte (LC)",
                "Macrophage (M\u03a6)",
                "Mast cell (MC)",
                "Melanocyte (MC)",
                "Merkel cell (MC)",
                "Nerve cell (NC)",
                "Pericyte (PC)",
                "Smooth muscle cell (SMC)",
                "Spinous cell (SC)",
                "Stem cell (SC)",
                "Stratum corneum cell (SCC)",
                "Stratum granulosum cell (SGC)",
                "Stratum lucidum cell (SLC)",
                "Stratum spinosum cell (SSC)",
                "Transit amplifying cell (TAC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (KC)",
            "Melanocyte (MC)",
            "Langerhans Cell (LC)",
            "Merkel Cell (MRC)",
            "Corneocyte",
            "Basal Cell (BC)",
            "Spinous Cell (SC)",
            "Granular Cell (GC)",
            "Stratum Corneum Cell (SCC)",
            "Epidermal Stem Cell (ESC)",
            "Epidermal Melanocyte (EMC)",
            "Epidermal Langerhans Cell (ELC)",
            "Epidermal Merkel Cell (EMrC)",
            "Epidermal Basal Cell (EBC)",
            "Epidermal Spinous Cell (ESC)",
            "Epidermal Granular Cell (EGC)",
            "Epidermal Stratum Corneum Cell (ESCC)",
            "Epidermis Keratinocyte (EK)",
            "Epidermis Melanocyte (EM)",
            "Epidermis Langerhans Cell (ELC)",
            "Epidermis Merkel Cell (EMrC)",
            "Epidermis Basal Cell (EBC)",
            "Epidermis Spinous Cell (ESC)",
            "Epidermis Granular Cell (EGC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (KC)",
                "Melanocyte (MC)",
                "Langerhans Cell (LC)",
                "Merkel Cell (MRC)",
                "Corneocyte",
                "Basal Cell (BC)",
                "Spinous Cell (SC)",
                "Granular Cell (GC)",
                "Stratum Corneum Cell (SCC)",
                "Epidermal Stem Cell (ESC)",
                "Epidermal Melanocyte (EMC)",
                "Epidermal Langerhans Cell (ELC)",
                "Epidermal Merkel Cell (EMrC)",
                "Epidermal Basal Cell (EBC)",
                "Epidermal Spinous Cell (ESC)",
                "Epidermal Granular Cell (EGC)",
                "Epidermal Stratum Corneum Cell (ESCC)",
                "Epidermis Keratinocyte (EK)",
                "Epidermis Melanocyte (EM)",
                "Epidermis Langerhans Cell (ELC)",
                "Epidermis Merkel Cell (EMrC)",
                "Epidermis Basal Cell (EBC)",
                "Epidermis Spinous Cell (ESC)",
                "Epidermis Granular Cell (EGC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basal Cell (BC)",
                "Corneocyte",
                "Epidermal Basal Cell (EBC)",
                "Epidermal Granular Cell (EGC)",
                "Epidermal Langerhans Cell (ELC)",
                "Epidermal Melanocyte (EMC)",
                "Epidermal Merkel Cell (EMrC)",
                "Epidermal Spinous Cell (ESC)",
                "Epidermal Stem Cell (ESC)",
                "Epidermal Stratum Corneum Cell (ESCC)",
                "Epidermis Basal Cell (EBC)",
                "Epidermis Granular Cell (EGC)",
                "Epidermis Keratinocyte (EK)",
                "Epidermis Langerhans Cell (ELC)",
                "Epidermis Melanocyte (EM)",
                "Epidermis Merkel Cell (EMrC)",
                "Epidermis Spinous Cell (ESC)",
                "Granular Cell (GC)",
                "Keratinocyte (KC)",
                "Langerhans Cell (LC)",
                "Melanocyte (MC)",
                "Merkel Cell (MRC)",
                "Spinous Cell (SC)",
                "Stratum Corneum Cell (SCC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (Ker)",
            "Epidermal cell",
            "Squamous cell",
            "Stratum corneum cell",
            "Stratum lucidum cell",
            "Stratum granulosum cell",
            "Stratum spinosum cell",
            "Stratum basale cell",
            "Corneum cell",
            "Lucidum cell",
            "Granulosum cell",
            "Spinosum cell",
            "Basale cell",
            "Epidermal keratinocyte",
            "Squamous epithelial cell",
            "Cutaneous epithelial cell",
            "Dermal-epidermal junction cell",
            "Skin surface cell",
            "Outermost skin cell",
            "Non-vascular skin cell",
            "Epidermal basal layer cell",
            "Epidermal spinous layer cell",
            "Epidermal granular layer cell",
            "Epidermal clear layer cell",
            "Cutaneous epithelial keratinocyte"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (Ker)",
                "Epidermal cell",
                "Squamous cell",
                "Stratum corneum cell",
                "Stratum lucidum cell",
                "Stratum granulosum cell",
                "Stratum spinosum cell",
                "Stratum basale cell",
                "Corneum cell",
                "Lucidum cell",
                "Granulosum cell",
                "Spinosum cell",
                "Basale cell",
                "Epidermal keratinocyte",
                "Squamous epithelial cell",
                "Cutaneous epithelial cell",
                "Dermal-epidermal junction cell",
                "Skin surface cell",
                "Outermost skin cell",
                "Non-vascular skin cell",
                "Epidermal basal layer cell",
                "Epidermal spinous layer cell",
                "Epidermal granular layer cell",
                "Epidermal clear layer cell"
            ],
            "mismatches": [
                "Cutaneous epithelial keratinocyte"
            ],
            "true_referents": [
                "Basale cell",
                "Corneum cell",
                "Cutaneous epithelial cell",
                "Dermal-epidermal junction cell",
                "Epidermal basal layer cell",
                "Epidermal cell",
                "Epidermal clear layer cell",
                "Epidermal granular layer cell",
                "Epidermal keratinocyte",
                "Epidermal spinous layer cell",
                "Granulosum cell",
                "Keratinocyte (Ker)",
                "Lucidum cell",
                "Non-vascular skin cell",
                "Outermost skin cell",
                "Skin surface cell",
                "Spinosum cell",
                "Squamous cell",
                "Squamous epithelial cell",
                "Stratum basale cell",
                "Stratum corneum cell",
                "Stratum granulosum cell",
                "Stratum lucidum cell",
                "Stratum spinosum cell"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            "Keratinocyte (KC)",
            "Epidermal cell",
            "Stratum corneum cell",
            "Stratum lucidum cell",
            "Stratum granulosum cell",
            "Stratum spinosum cell",
            "Stratum basale cell",
            "Melanocyte",
            "Langerhans cell",
            "Merkel cell",
            "Dendritic epidermal T cell",
            "Gamma delta T cell",
            "Epidermal stem cell",
            "Basal cell",
            "Principial cell",
            "Interfollicular epidermal cell",
            "Hair follicle stem cell",
            "Sebaceous gland stem cell",
            "Sweat gland stem cell",
            "Apical progenitor cell",
            "Basal progenitor cell",
            "Spinous layer cell",
            "Granular layer cell",
            "Corneocyte",
            "Epidermal progenitor cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Keratinocyte (KC)",
                "Epidermal cell",
                "Stratum corneum cell",
                "Stratum lucidum cell",
                "Stratum granulosum cell",
                "Stratum spinosum cell",
                "Stratum basale cell",
                "Melanocyte",
                "Langerhans cell",
                "Merkel cell",
                "Dendritic epidermal T cell",
                "Gamma delta T cell",
                "Epidermal stem cell",
                "Basal cell",
                "Principial cell",
                "Interfollicular epidermal cell",
                "Hair follicle stem cell",
                "Sebaceous gland stem cell",
                "Sweat gland stem cell",
                "Apical progenitor cell",
                "Basal progenitor cell",
                "Spinous layer cell",
                "Granular layer cell",
                "Corneocyte"
            ],
            "mismatches": [
                "Epidermal progenitor cell"
            ],
            "true_referents": [
                "Apical progenitor cell",
                "Basal cell",
                "Basal progenitor cell",
                "Corneocyte",
                "Dendritic epidermal T cell",
                "Epidermal cell",
                "Epidermal stem cell",
                "Gamma delta T cell",
                "Granular layer cell",
                "Hair follicle stem cell",
                "Interfollicular epidermal cell",
                "Keratinocyte (KC)",
                "Langerhans cell",
                "Melanocyte",
                "Merkel cell",
                "Principial cell",
                "Sebaceous gland stem cell",
                "Spinous layer cell",
                "Stratum basale cell",
                "Stratum corneum cell",
                "Stratum granulosum cell",
                "Stratum lucidum cell",
                "Stratum spinosum cell",
                "Sweat gland stem cell"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "epidermal cell",
        "domain": "biology",
        "response": [
            {
                "Referent": "epidermal cells",
                "Canonical name": "epidermal cells"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "epidermal cells"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"epidermal cells\", \"Canonical name\": \"epidermal cells\"}"
            ],
            "TP": 1,
            "FP": 0,
            "FN": 0
        }
    }
]