[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pituitary cell (PC)",
            "Thyroid follicular cell (TFC)",
            "Parathyroid cell (PCaT)",
            "Insulin-producing beta cell (\u03b2-cell)",
            "Glucagon-producing alpha cell (\u03b1-cell)",
            "Somatostatin-producing delta cell (\u03b4-cell)",
            "Pancreatic polypeptide-producing PP cell",
            "Cholecystokinin-producing I cell",
            "Gastrin-producing G cell",
            "Prolactin-producing lactotroph (LacT)",
            "Growth hormone-producing somatotroph (SomT)",
            "Thyrotropin-producing thyrotroph (ThyT)",
            "Adrenocorticotropic hormone-producing corticotroph (CorT)",
            "Melanocyte-stimulating hormone-producing melanotroph (MelT)",
            "Oxytocin-producing neurosecretory cell (NSC-O)",
            "Vasopressin-producing neurosecretory cell (NSC-V)",
            "Thymus epithelial cell (TEC)",
            "Thymic hormone-producing thymocyte",
            "Adrenal medulla cell (AMC)",
            "Adrenal cortex cell (ACC)",
            "Ovarian granulosa cell (OGC)",
            "Luteinizing cell (LC)",
            "Testicular Leydig cell (TL)",
            "Testicular Sertoli cell (TS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pituitary cell (PC)",
                "Thyroid follicular cell (TFC)",
                "Parathyroid cell (PCaT)",
                "Insulin-producing beta cell (\u03b2-cell)",
                "Glucagon-producing alpha cell (\u03b1-cell)",
                "Somatostatin-producing delta cell (\u03b4-cell)",
                "Pancreatic polypeptide-producing PP cell",
                "Cholecystokinin-producing I cell",
                "Gastrin-producing G cell",
                "Prolactin-producing lactotroph (LacT)",
                "Growth hormone-producing somatotroph (SomT)",
                "Thyrotropin-producing thyrotroph (ThyT)",
                "Adrenocorticotropic hormone-producing corticotroph (CorT)",
                "Melanocyte-stimulating hormone-producing melanotroph (MelT)",
                "Oxytocin-producing neurosecretory cell (NSC-O)",
                "Vasopressin-producing neurosecretory cell (NSC-V)",
                "Thymus epithelial cell (TEC)",
                "Thymic hormone-producing thymocyte",
                "Adrenal medulla cell (AMC)",
                "Adrenal cortex cell (ACC)",
                "Ovarian granulosa cell (OGC)",
                "Luteinizing cell (LC)",
                "Testicular Leydig cell (TL)",
                "Testicular Sertoli cell (TS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal cortex cell (ACC)",
                "Adrenal medulla cell (AMC)",
                "Adrenocorticotropic hormone-producing corticotroph (CorT)",
                "Cholecystokinin-producing I cell",
                "Gastrin-producing G cell",
                "Glucagon-producing alpha cell (\u03b1-cell)",
                "Growth hormone-producing somatotroph (SomT)",
                "Insulin-producing beta cell (\u03b2-cell)",
                "Luteinizing cell (LC)",
                "Melanocyte-stimulating hormone-producing melanotroph (MelT)",
                "Ovarian granulosa cell (OGC)",
                "Oxytocin-producing neurosecretory cell (NSC-O)",
                "Pancreatic polypeptide-producing PP cell",
                "Parathyroid cell (PCaT)",
                "Pituitary cell (PC)",
                "Prolactin-producing lactotroph (LacT)",
                "Somatostatin-producing delta cell (\u03b4-cell)",
                "Testicular Leydig cell (TL)",
                "Testicular Sertoli cell (TS)",
                "Thymic hormone-producing thymocyte",
                "Thymus epithelial cell (TEC)",
                "Thyroid follicular cell (TFC)",
                "Thyrotropin-producing thyrotroph (ThyT)",
                "Vasopressin-producing neurosecretory cell (NSC-V)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Alpha cell (\u03b1-cell)",
            "Beta cell (\u03b2-cell)",
            "Delta cell (\u03b4-cell)",
            "PP cell (PP-cell)",
            "Acinar cell (Pancreatic acinar cell)",
            "Pituitary somatotroph",
            "Pituitary lactotroph",
            "Pituitary thyrotroph",
            "Pituitary gonadotroph",
            "Pituitary corticotroph",
            "Pituitary melanotroph",
            "Parafollicular cell (C cell)",
            "Adrenal cortical cell",
            "Adrenal medullary cell",
            "Thymic epithelial cell",
            "Thymic nurse cell",
            "Thyroid follicular cell",
            "Thyroid parafollicular cell (C cell)",
            "Pinealocyte",
            "Melanocyte",
            "Enteroendocrine cell",
            "Enterochromaffin cell",
            "Enterochromaffin-like cell",
            "Kupffer cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Delta cell (\u03b4-cell)",
                "PP cell (PP-cell)",
                "Acinar cell (Pancreatic acinar cell)",
                "Pituitary somatotroph",
                "Pituitary lactotroph",
                "Pituitary thyrotroph",
                "Pituitary gonadotroph",
                "Pituitary corticotroph",
                "Pituitary melanotroph",
                "Parafollicular cell (C cell)",
                "Adrenal cortical cell",
                "Adrenal medullary cell",
                "Thymic epithelial cell",
                "Thymic nurse cell",
                "Thyroid follicular cell",
                "Thyroid parafollicular cell (C cell)",
                "Pinealocyte",
                "Melanocyte",
                "Enteroendocrine cell",
                "Enterochromaffin cell",
                "Enterochromaffin-like cell",
                "Kupffer cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Acinar cell (Pancreatic acinar cell)",
                "Adrenal cortical cell",
                "Adrenal medullary cell",
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Delta cell (\u03b4-cell)",
                "Enterochromaffin cell",
                "Enterochromaffin-like cell",
                "Enteroendocrine cell",
                "Kupffer cell",
                "Melanocyte",
                "PP cell (PP-cell)",
                "Parafollicular cell (C cell)",
                "Pinealocyte",
                "Pituitary corticotroph",
                "Pituitary gonadotroph",
                "Pituitary lactotroph",
                "Pituitary melanotroph",
                "Pituitary somatotroph",
                "Pituitary thyrotroph",
                "Thymic epithelial cell",
                "Thymic nurse cell",
                "Thyroid follicular cell",
                "Thyroid parafollicular cell (C cell)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Chief Cell (Parietal Cell)",
            "G Cell",
            "D Cell",
            "ECL Cell",
            "K Cell",
            "Pancreatic Alpha Cell",
            "Pancreatic Beta Cell",
            "Pancreatic Delta Cell",
            "Pancreatic PP Cell",
            "Pancreatic Epsilon Cell",
            "Anterior Pituitary Cell",
            "Posterior Pituitary Cell",
            "Thyrotroph",
            "Corticotroph",
            "Somatotroph",
            "Lactotroph",
            "Gonadotroph",
            "Parathyroid Chief Cell",
            "Oxyphilic Cell",
            "Clear Cell",
            "Chromaffin Cell",
            "Follicular Cell",
            "Parafollicular Cell",
            "Leydig Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Chief Cell (Parietal Cell)",
                "G Cell",
                "D Cell",
                "ECL Cell",
                "K Cell",
                "Pancreatic Alpha Cell",
                "Pancreatic Beta Cell",
                "Pancreatic Delta Cell",
                "Pancreatic PP Cell",
                "Pancreatic Epsilon Cell",
                "Anterior Pituitary Cell",
                "Posterior Pituitary Cell",
                "Thyrotroph",
                "Corticotroph",
                "Somatotroph",
                "Lactotroph",
                "Gonadotroph",
                "Parathyroid Chief Cell",
                "Oxyphilic Cell",
                "Clear Cell",
                "Chromaffin Cell",
                "Follicular Cell",
                "Parafollicular Cell",
                "Leydig Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Anterior Pituitary Cell",
                "Chief Cell (Parietal Cell)",
                "Chromaffin Cell",
                "Clear Cell",
                "Corticotroph",
                "D Cell",
                "ECL Cell",
                "Follicular Cell",
                "G Cell",
                "Gonadotroph",
                "K Cell",
                "Lactotroph",
                "Leydig Cell",
                "Oxyphilic Cell",
                "Pancreatic Alpha Cell",
                "Pancreatic Beta Cell",
                "Pancreatic Delta Cell",
                "Pancreatic Epsilon Cell",
                "Pancreatic PP Cell",
                "Parafollicular Cell",
                "Parathyroid Chief Cell",
                "Posterior Pituitary Cell",
                "Somatotroph",
                "Thyrotroph"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pituitary Somatotroph (PIT-SOM)",
            "Thyroid Follicular Cell (THY-FOL)",
            "Parathyroid Chief Cell (PTH-CHIEF)",
            "Adrenal Zona Glomerulosa Cell (ADR-ZGLOM)",
            "Adrenal Zona Fasciculata Cell (ADR-ZFAS)",
            "Adrenal Zona Reticularis Cell (ADR-ZRET)",
            "Pancreatic Beta Cell (PAN-B)",
            "Pancreatic Alpha Cell (PAN-A)",
            "Pancreatic Delta Cell (PAN-D)",
            "Ovarian Granulosa Cell (OVA-GRAN)",
            "Ovarian Theca Cell (OVA-THEC)",
            "Testicular Leydig Cell (TES-LEY)",
            "Pinealocyte (PIN)",
            "Hypothalamic Neurosecretory Cell (HYP-NS)",
            "Gastric G Cell (GAS-G)",
            "Intestinal Enteroendocrine Cell (INT-EE)",
            "Renal Juxtaglomerular Cell (REN-J)",
            "Cardiac Atrial Myocyte (CAR-ATM)",
            "Kidney Distal Convoluted Tubule Cell (KDT)",
            "Placental Syncytiotrophoblast (PLC-SYNC)",
            "Adipocyte (ADIP)",
            "Lung Clara Cell (LUN-CLARA)",
            "Neurohypophyseal Pituicyte (NHP)",
            "Calcitonin-secreting Parafollicular Cell (C-CELL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pituitary Somatotroph (PIT-SOM)",
                "Thyroid Follicular Cell (THY-FOL)",
                "Parathyroid Chief Cell (PTH-CHIEF)",
                "Adrenal Zona Glomerulosa Cell (ADR-ZGLOM)",
                "Adrenal Zona Fasciculata Cell (ADR-ZFAS)",
                "Adrenal Zona Reticularis Cell (ADR-ZRET)",
                "Pancreatic Beta Cell (PAN-B)",
                "Pancreatic Alpha Cell (PAN-A)",
                "Pancreatic Delta Cell (PAN-D)",
                "Ovarian Granulosa Cell (OVA-GRAN)",
                "Ovarian Theca Cell (OVA-THEC)",
                "Testicular Leydig Cell (TES-LEY)",
                "Pinealocyte (PIN)",
                "Hypothalamic Neurosecretory Cell (HYP-NS)",
                "Gastric G Cell (GAS-G)",
                "Intestinal Enteroendocrine Cell (INT-EE)",
                "Renal Juxtaglomerular Cell (REN-J)",
                "Cardiac Atrial Myocyte (CAR-ATM)",
                "Kidney Distal Convoluted Tubule Cell (KDT)",
                "Placental Syncytiotrophoblast (PLC-SYNC)",
                "Adipocyte (ADIP)",
                "Lung Clara Cell (LUN-CLARA)",
                "Neurohypophyseal Pituicyte (NHP)",
                "Calcitonin-secreting Parafollicular Cell (C-CELL)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (ADIP)",
                "Adrenal Zona Fasciculata Cell (ADR-ZFAS)",
                "Adrenal Zona Glomerulosa Cell (ADR-ZGLOM)",
                "Adrenal Zona Reticularis Cell (ADR-ZRET)",
                "Calcitonin-secreting Parafollicular Cell (C-CELL)",
                "Cardiac Atrial Myocyte (CAR-ATM)",
                "Gastric G Cell (GAS-G)",
                "Hypothalamic Neurosecretory Cell (HYP-NS)",
                "Intestinal Enteroendocrine Cell (INT-EE)",
                "Kidney Distal Convoluted Tubule Cell (KDT)",
                "Lung Clara Cell (LUN-CLARA)",
                "Neurohypophyseal Pituicyte (NHP)",
                "Ovarian Granulosa Cell (OVA-GRAN)",
                "Ovarian Theca Cell (OVA-THEC)",
                "Pancreatic Alpha Cell (PAN-A)",
                "Pancreatic Beta Cell (PAN-B)",
                "Pancreatic Delta Cell (PAN-D)",
                "Parathyroid Chief Cell (PTH-CHIEF)",
                "Pinealocyte (PIN)",
                "Pituitary Somatotroph (PIT-SOM)",
                "Placental Syncytiotrophoblast (PLC-SYNC)",
                "Renal Juxtaglomerular Cell (REN-J)",
                "Testicular Leydig Cell (TES-LEY)",
                "Thyroid Follicular Cell (THY-FOL)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Thyroid Follicular Cell (TFC)",
            "Parafollicular Cell (C Cell)",
            "Adrenal Cortex Cell",
            "Adrenal Medulla Cell",
            "Pituitary Somatotroph",
            "Pituitary Lactotroph",
            "Pituitary Gonadotroph",
            "Pituitary Thyrotroph",
            "Pituitary Corticotroph",
            "Pinealocyte",
            "Pancreatic Alpha Cell",
            "Pancreatic Beta Cell",
            "Pancreatic Delta Cell",
            "Pancreatic PP Cell",
            "Ovarian Theca Cell",
            "Ovarian Granulosa Cell",
            "Testicular Leydig Cell",
            "Testicular Sertoli Cell",
            "Parathyroid Chief Cell",
            "Parathyroid Oxyphil Cell",
            "Placental Syncytiotrophoblast",
            "Placental Cytotrophoblast",
            "Hypothalamic Neurosecretory Cell",
            "Enteroendocrine Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thyroid Follicular Cell (TFC)",
                "Parafollicular Cell (C Cell)",
                "Adrenal Cortex Cell",
                "Adrenal Medulla Cell",
                "Pituitary Somatotroph",
                "Pituitary Lactotroph",
                "Pituitary Gonadotroph",
                "Pituitary Thyrotroph",
                "Pituitary Corticotroph",
                "Pinealocyte",
                "Pancreatic Alpha Cell",
                "Pancreatic Beta Cell",
                "Pancreatic Delta Cell",
                "Pancreatic PP Cell",
                "Ovarian Theca Cell",
                "Ovarian Granulosa Cell",
                "Testicular Leydig Cell",
                "Testicular Sertoli Cell",
                "Parathyroid Chief Cell",
                "Parathyroid Oxyphil Cell",
                "Placental Syncytiotrophoblast",
                "Placental Cytotrophoblast",
                "Hypothalamic Neurosecretory Cell",
                "Enteroendocrine Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Cortex Cell",
                "Adrenal Medulla Cell",
                "Enteroendocrine Cell",
                "Hypothalamic Neurosecretory Cell",
                "Ovarian Granulosa Cell",
                "Ovarian Theca Cell",
                "Pancreatic Alpha Cell",
                "Pancreatic Beta Cell",
                "Pancreatic Delta Cell",
                "Pancreatic PP Cell",
                "Parafollicular Cell (C Cell)",
                "Parathyroid Chief Cell",
                "Parathyroid Oxyphil Cell",
                "Pinealocyte",
                "Pituitary Corticotroph",
                "Pituitary Gonadotroph",
                "Pituitary Lactotroph",
                "Pituitary Somatotroph",
                "Pituitary Thyrotroph",
                "Placental Cytotrophoblast",
                "Placental Syncytiotrophoblast",
                "Testicular Leydig Cell",
                "Testicular Sertoli Cell",
                "Thyroid Follicular Cell (TFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Thyroid follicular cell (TFC)",
            "Adrenal cortex cell (ACC)",
            "Pancreatic beta cell (PBC)",
            "Pituitary gland cell (PGC)",
            "Ovarian follicle cell (OFC)",
            "Testicular Leydig cell (TLC)",
            "Hypothalamic neurosecretory cell (HNC)",
            "Parathyroid chief cell (PCC)",
            "Pinealocyte (PC)",
            "Islet of Langerhans cell (ILC)",
            "Adrenal medulla chromaffin cell (AMCC)",
            "Gastric G cell (GGC)",
            "Intestinal enteroendocrine cell (IEC)",
            "Placental trophoblast cell (PTC)",
            "Kidney juxtaglomerular cell (KJC)",
            "Thymic epithelial cell (TEC)",
            "Adipose tissue adipocyte (ATA)",
            "Cardiac atrial myocyte (CAM)",
            "Skin keratinocyte (SKC)",
            "Bone osteoblast (BO)",
            "Liver hepatocyte (LH)",
            "Mast cell (MC)",
            "Neuroendocrine cell (NEC)",
            "Salivary gland acinar cell (SGAC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thyroid follicular cell (TFC)",
                "Adrenal cortex cell (ACC)",
                "Pancreatic beta cell (PBC)",
                "Pituitary gland cell (PGC)",
                "Ovarian follicle cell (OFC)",
                "Testicular Leydig cell (TLC)",
                "Hypothalamic neurosecretory cell (HNC)",
                "Parathyroid chief cell (PCC)",
                "Pinealocyte (PC)",
                "Islet of Langerhans cell (ILC)",
                "Adrenal medulla chromaffin cell (AMCC)",
                "Gastric G cell (GGC)",
                "Intestinal enteroendocrine cell (IEC)",
                "Placental trophoblast cell (PTC)",
                "Kidney juxtaglomerular cell (KJC)",
                "Thymic epithelial cell (TEC)",
                "Adipose tissue adipocyte (ATA)",
                "Cardiac atrial myocyte (CAM)",
                "Skin keratinocyte (SKC)",
                "Bone osteoblast (BO)",
                "Liver hepatocyte (LH)",
                "Mast cell (MC)",
                "Neuroendocrine cell (NEC)",
                "Salivary gland acinar cell (SGAC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipose tissue adipocyte (ATA)",
                "Adrenal cortex cell (ACC)",
                "Adrenal medulla chromaffin cell (AMCC)",
                "Bone osteoblast (BO)",
                "Cardiac atrial myocyte (CAM)",
                "Gastric G cell (GGC)",
                "Hypothalamic neurosecretory cell (HNC)",
                "Intestinal enteroendocrine cell (IEC)",
                "Islet of Langerhans cell (ILC)",
                "Kidney juxtaglomerular cell (KJC)",
                "Liver hepatocyte (LH)",
                "Mast cell (MC)",
                "Neuroendocrine cell (NEC)",
                "Ovarian follicle cell (OFC)",
                "Pancreatic beta cell (PBC)",
                "Parathyroid chief cell (PCC)",
                "Pinealocyte (PC)",
                "Pituitary gland cell (PGC)",
                "Placental trophoblast cell (PTC)",
                "Salivary gland acinar cell (SGAC)",
                "Skin keratinocyte (SKC)",
                "Testicular Leydig cell (TLC)",
                "Thymic epithelial cell (TEC)",
                "Thyroid follicular cell (TFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pituitary Gland Somatotrophs (PGS)",
            "Pituitary Gland Lactotrophs (PGL)",
            "Pituitary Gland Corticotrophs (PGC)",
            "Pituitary Gland Melanotrophs (PGM)",
            "Pituitary Gland Thyrotrophs (PGT)",
            "Pituitary Gland Gonadotrophs (PGG)",
            "Adrenal Gland Zona Glomerulosa Cells (AGZGC)",
            "Adrenal Gland Zona Fasciculata Cells (AGZFC)",
            "Adrenal Gland Zona Reticularis Cells (AGZRC)",
            "Adrenal Gland Medulla Chromaffin Cells (AGMCC)",
            "Thyroid Gland Follicular Cells (TGFC)",
            "Thyroid Gland Parafollicular Cells (TGPC)",
            "Parathyroid Gland Chief Cells (PGCC)",
            "Parathyroid Gland Oxyphil Cells (PGOC)",
            "Pineal Gland Pinealocytes (PGP)",
            "Pancreas Alpha Cells (PAC)",
            "Pancreas Beta Cells (PBC)",
            "Pancreas Delta Cells (PDC)",
            "Pancreas PP Cells (PPC)",
            "Pancreas Epsilon Cells (PEC)",
            "Ovaries Granulosa Cells (OGC)",
            "Ovaries Theca Cells (OTC)",
            "Testes Leydig Cells (TLC)",
            "Testes Sertoli Cells (TSC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pituitary Gland Somatotrophs (PGS)",
                "Pituitary Gland Lactotrophs (PGL)",
                "Pituitary Gland Corticotrophs (PGC)",
                "Pituitary Gland Melanotrophs (PGM)",
                "Pituitary Gland Thyrotrophs (PGT)",
                "Pituitary Gland Gonadotrophs (PGG)",
                "Adrenal Gland Zona Glomerulosa Cells (AGZGC)",
                "Adrenal Gland Zona Fasciculata Cells (AGZFC)",
                "Adrenal Gland Zona Reticularis Cells (AGZRC)",
                "Adrenal Gland Medulla Chromaffin Cells (AGMCC)",
                "Thyroid Gland Follicular Cells (TGFC)",
                "Thyroid Gland Parafollicular Cells (TGPC)",
                "Parathyroid Gland Chief Cells (PGCC)",
                "Parathyroid Gland Oxyphil Cells (PGOC)",
                "Pineal Gland Pinealocytes (PGP)",
                "Pancreas Alpha Cells (PAC)",
                "Pancreas Beta Cells (PBC)",
                "Pancreas Delta Cells (PDC)",
                "Pancreas PP Cells (PPC)",
                "Pancreas Epsilon Cells (PEC)",
                "Ovaries Granulosa Cells (OGC)",
                "Ovaries Theca Cells (OTC)",
                "Testes Leydig Cells (TLC)",
                "Testes Sertoli Cells (TSC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Gland Medulla Chromaffin Cells (AGMCC)",
                "Adrenal Gland Zona Fasciculata Cells (AGZFC)",
                "Adrenal Gland Zona Glomerulosa Cells (AGZGC)",
                "Adrenal Gland Zona Reticularis Cells (AGZRC)",
                "Ovaries Granulosa Cells (OGC)",
                "Ovaries Theca Cells (OTC)",
                "Pancreas Alpha Cells (PAC)",
                "Pancreas Beta Cells (PBC)",
                "Pancreas Delta Cells (PDC)",
                "Pancreas Epsilon Cells (PEC)",
                "Pancreas PP Cells (PPC)",
                "Parathyroid Gland Chief Cells (PGCC)",
                "Parathyroid Gland Oxyphil Cells (PGOC)",
                "Pineal Gland Pinealocytes (PGP)",
                "Pituitary Gland Corticotrophs (PGC)",
                "Pituitary Gland Gonadotrophs (PGG)",
                "Pituitary Gland Lactotrophs (PGL)",
                "Pituitary Gland Melanotrophs (PGM)",
                "Pituitary Gland Somatotrophs (PGS)",
                "Pituitary Gland Thyrotrophs (PGT)",
                "Testes Leydig Cells (TLC)",
                "Testes Sertoli Cells (TSC)",
                "Thyroid Gland Follicular Cells (TGFC)",
                "Thyroid Gland Parafollicular Cells (TGPC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Endocrine cell",
            "Thyroid follicular cell",
            "Pancreatic alpha cell",
            "Pancreatic beta cell",
            "Adrenal cortex cell",
            "Pituitary gland cell",
            "Parathyroid chief cell",
            "Ovarian granulosa cell",
            "Testicular Leydig cell",
            "Pineal gland cell",
            "Thymus gland cell",
            "Adipose tissue cell",
            "Gastric G cell",
            "Intestinal enteroendocrine cell",
            "Hypothalamic neurosecretory cell",
            "Adrenal medulla cell",
            "Pituitary somatotroph cell",
            "Pituitary corticotroph cell",
            "Pituitary thyrotroph cell",
            "Pituitary lactotroph cell",
            "Pituitary gonadotroph cell",
            "Pituitary melanotroph cell",
            "Parathyroid oxyphil cell",
            "Adrenal chromaffin cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Endocrine cell",
                "Thyroid follicular cell",
                "Pancreatic alpha cell",
                "Pancreatic beta cell",
                "Adrenal cortex cell",
                "Pituitary gland cell",
                "Parathyroid chief cell",
                "Ovarian granulosa cell",
                "Testicular Leydig cell",
                "Pineal gland cell",
                "Thymus gland cell",
                "Adipose tissue cell",
                "Gastric G cell",
                "Intestinal enteroendocrine cell",
                "Hypothalamic neurosecretory cell",
                "Adrenal medulla cell",
                "Pituitary somatotroph cell",
                "Pituitary corticotroph cell",
                "Pituitary thyrotroph cell",
                "Pituitary lactotroph cell",
                "Pituitary gonadotroph cell",
                "Pituitary melanotroph cell",
                "Parathyroid oxyphil cell",
                "Adrenal chromaffin cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipose tissue cell",
                "Adrenal chromaffin cell",
                "Adrenal cortex cell",
                "Adrenal medulla cell",
                "Endocrine cell",
                "Gastric G cell",
                "Hypothalamic neurosecretory cell",
                "Intestinal enteroendocrine cell",
                "Ovarian granulosa cell",
                "Pancreatic alpha cell",
                "Pancreatic beta cell",
                "Parathyroid chief cell",
                "Parathyroid oxyphil cell",
                "Pineal gland cell",
                "Pituitary corticotroph cell",
                "Pituitary gland cell",
                "Pituitary gonadotroph cell",
                "Pituitary lactotroph cell",
                "Pituitary melanotroph cell",
                "Pituitary somatotroph cell",
                "Pituitary thyrotroph cell",
                "Testicular Leydig cell",
                "Thymus gland cell",
                "Thyroid follicular cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Beta cells (\u03b2 cells)",
            "Alpha cells (\u03b1 cells)",
            "Delta cells (\u03b4 cells)",
            "PP cells (F cells)",
            "Somatotrophs",
            "Lactotrophs",
            "Corticotrophs",
            "Thyrotrophs",
            "Gonadotrophs",
            "Pinealocytes",
            "Thyrocytes (Follicular cells)",
            "Parafollicular cells (C cells)",
            "Chromaffin cells",
            "Zona glomerulosa cells",
            "Zona fasciculata cells",
            "Zona reticularis cells",
            "Leydig cells",
            "Granulosa cells",
            "Thymic epithelial cells",
            "Pituicytes",
            "Oxyphil cells",
            "Melanotrophs",
            "Magnocellular neurons",
            "Ovarian theca cells"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Beta cells (\u03b2 cells)",
                "Alpha cells (\u03b1 cells)",
                "Delta cells (\u03b4 cells)",
                "PP cells (F cells)",
                "Somatotrophs",
                "Lactotrophs",
                "Corticotrophs",
                "Thyrotrophs",
                "Gonadotrophs",
                "Pinealocytes",
                "Thyrocytes (Follicular cells)",
                "Parafollicular cells (C cells)",
                "Chromaffin cells",
                "Zona glomerulosa cells",
                "Zona fasciculata cells",
                "Zona reticularis cells",
                "Leydig cells",
                "Granulosa cells",
                "Thymic epithelial cells",
                "Pituicytes",
                "Oxyphil cells",
                "Melanotrophs",
                "Magnocellular neurons",
                "Ovarian theca cells"
            ],
            "mismatches": [],
            "true_referents": [
                "Alpha cells (\u03b1 cells)",
                "Beta cells (\u03b2 cells)",
                "Chromaffin cells",
                "Corticotrophs",
                "Delta cells (\u03b4 cells)",
                "Gonadotrophs",
                "Granulosa cells",
                "Lactotrophs",
                "Leydig cells",
                "Magnocellular neurons",
                "Melanotrophs",
                "Ovarian theca cells",
                "Oxyphil cells",
                "PP cells (F cells)",
                "Parafollicular cells (C cells)",
                "Pinealocytes",
                "Pituicytes",
                "Somatotrophs",
                "Thymic epithelial cells",
                "Thyrocytes (Follicular cells)",
                "Thyrotrophs",
                "Zona fasciculata cells",
                "Zona glomerulosa cells",
                "Zona reticularis cells"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Thyroid follicular cell",
            "Adrenal cortical cell",
            "Pancreatic islet alpha cell",
            "Pancreatic islet beta cell",
            "Pituitary somatotroph",
            "Pituitary lactotroph",
            "Pituitary thyrotroph",
            "Pituitary gonadotroph",
            "Pituitary corticotroph",
            "Parathyroid chief cell",
            "Pinealocyte",
            "Leydig cell",
            "Theca cell",
            "Granulosa cell",
            "Juxtaglomerular cell",
            "Enterochromaffin cell",
            "Enteroendocrine K cell",
            "Enteroendocrine L cell",
            "Enteroendocrine I cell",
            "Enteroendocrine S cell",
            "C cell (parafollicular cell)",
            "Chromaffin cell",
            "Oxyntic cell",
            "Renin-secreting cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thyroid follicular cell",
                "Adrenal cortical cell",
                "Pancreatic islet alpha cell",
                "Pancreatic islet beta cell",
                "Pituitary somatotroph",
                "Pituitary lactotroph",
                "Pituitary thyrotroph",
                "Pituitary gonadotroph",
                "Pituitary corticotroph",
                "Parathyroid chief cell",
                "Pinealocyte",
                "Leydig cell",
                "Theca cell",
                "Granulosa cell",
                "Juxtaglomerular cell",
                "Enterochromaffin cell",
                "Enteroendocrine K cell",
                "Enteroendocrine L cell",
                "Enteroendocrine I cell",
                "Enteroendocrine S cell",
                "C cell (parafollicular cell)",
                "Chromaffin cell",
                "Oxyntic cell",
                "Renin-secreting cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal cortical cell",
                "C cell (parafollicular cell)",
                "Chromaffin cell",
                "Enterochromaffin cell",
                "Enteroendocrine I cell",
                "Enteroendocrine K cell",
                "Enteroendocrine L cell",
                "Enteroendocrine S cell",
                "Granulosa cell",
                "Juxtaglomerular cell",
                "Leydig cell",
                "Oxyntic cell",
                "Pancreatic islet alpha cell",
                "Pancreatic islet beta cell",
                "Parathyroid chief cell",
                "Pinealocyte",
                "Pituitary corticotroph",
                "Pituitary gonadotroph",
                "Pituitary lactotroph",
                "Pituitary somatotroph",
                "Pituitary thyrotroph",
                "Renin-secreting cell",
                "Theca cell",
                "Thyroid follicular cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Thyroid follicular cell",
            "Adrenal chromaffin cell",
            "Anterior pituitary cell",
            "Posterior pituitary cell",
            "Pancreatic alpha cell",
            "Pancreatic beta cell",
            "Pancreatic delta cell",
            "Pancreatic PP cell",
            "Thyroid parafollicular cell (C cell)",
            "Parathyroid chief cell",
            "Adrenal cortical cell",
            "Leydig cell",
            "Theca interna cell",
            "Corpus luteum cell",
            "Juxtaglomerular cell (JG cell)",
            "Macula densa cell",
            "Pinealocyte",
            "Thymic epithelial cell",
            "Enteroendocrine cell",
            "Ovarian granulosa cell",
            "Sertoli cell",
            "Hepatic stellate cell (Ito cell)",
            "Adipocyte",
            "Osteoblast"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thyroid follicular cell",
                "Adrenal chromaffin cell",
                "Anterior pituitary cell",
                "Posterior pituitary cell",
                "Pancreatic alpha cell",
                "Pancreatic beta cell",
                "Pancreatic delta cell",
                "Pancreatic PP cell",
                "Thyroid parafollicular cell (C cell)",
                "Parathyroid chief cell",
                "Adrenal cortical cell",
                "Leydig cell",
                "Theca interna cell",
                "Corpus luteum cell",
                "Juxtaglomerular cell (JG cell)",
                "Macula densa cell",
                "Pinealocyte",
                "Thymic epithelial cell",
                "Enteroendocrine cell",
                "Ovarian granulosa cell",
                "Sertoli cell",
                "Hepatic stellate cell (Ito cell)",
                "Adipocyte",
                "Osteoblast"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Adrenal chromaffin cell",
                "Adrenal cortical cell",
                "Anterior pituitary cell",
                "Corpus luteum cell",
                "Enteroendocrine cell",
                "Hepatic stellate cell (Ito cell)",
                "Juxtaglomerular cell (JG cell)",
                "Leydig cell",
                "Macula densa cell",
                "Osteoblast",
                "Ovarian granulosa cell",
                "Pancreatic PP cell",
                "Pancreatic alpha cell",
                "Pancreatic beta cell",
                "Pancreatic delta cell",
                "Parathyroid chief cell",
                "Pinealocyte",
                "Posterior pituitary cell",
                "Sertoli cell",
                "Theca interna cell",
                "Thymic epithelial cell",
                "Thyroid follicular cell",
                "Thyroid parafollicular cell (C cell)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Thyroid follicular cell (TFC)",
            "Adrenal cortical cell (ACC)",
            "Pituitary cell (PC)",
            "Ovarian theca cell (OTC)",
            "Testicular Leydig cell (TLC)",
            "Pancreatic islet cell (PIC)",
            "Parathyroid cell (PTC)",
            "Pineal cell (PNC)",
            "Hypothalamic neurosecretory cell (HNC)",
            "Placental syncytiotrophoblast cell (PSTC)",
            "Adipocyte (AC)",
            "Gastric G cell (GGC)",
            "Intestinal enteroendocrine cell (IEC)",
            "Renal juxtaglomerular cell (RJC)",
            "Cardiac atrial natriuretic cell (CANC)",
            "Thymic epithelial cell (TEC)",
            "Skin melanocyte (SM)",
            "Liver hepatocyte (LH)",
            "Kidney mesangial cell (KMC)",
            "Bone osteoblast (BO)",
            "Cartilage chondrocyte (CC)",
            "Smooth muscle cell (SMC)",
            "Mast cell (MC)",
            "Macrophage (M)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thyroid follicular cell (TFC)",
                "Adrenal cortical cell (ACC)",
                "Pituitary cell (PC)",
                "Ovarian theca cell (OTC)",
                "Testicular Leydig cell (TLC)",
                "Pancreatic islet cell (PIC)",
                "Parathyroid cell (PTC)",
                "Pineal cell (PNC)",
                "Hypothalamic neurosecretory cell (HNC)",
                "Placental syncytiotrophoblast cell (PSTC)",
                "Adipocyte (AC)",
                "Gastric G cell (GGC)",
                "Intestinal enteroendocrine cell (IEC)",
                "Renal juxtaglomerular cell (RJC)",
                "Cardiac atrial natriuretic cell (CANC)",
                "Thymic epithelial cell (TEC)",
                "Skin melanocyte (SM)",
                "Liver hepatocyte (LH)",
                "Kidney mesangial cell (KMC)",
                "Bone osteoblast (BO)",
                "Cartilage chondrocyte (CC)",
                "Smooth muscle cell (SMC)",
                "Mast cell (MC)",
                "Macrophage (M)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte (AC)",
                "Adrenal cortical cell (ACC)",
                "Bone osteoblast (BO)",
                "Cardiac atrial natriuretic cell (CANC)",
                "Cartilage chondrocyte (CC)",
                "Gastric G cell (GGC)",
                "Hypothalamic neurosecretory cell (HNC)",
                "Intestinal enteroendocrine cell (IEC)",
                "Kidney mesangial cell (KMC)",
                "Liver hepatocyte (LH)",
                "Macrophage (M)",
                "Mast cell (MC)",
                "Ovarian theca cell (OTC)",
                "Pancreatic islet cell (PIC)",
                "Parathyroid cell (PTC)",
                "Pineal cell (PNC)",
                "Pituitary cell (PC)",
                "Placental syncytiotrophoblast cell (PSTC)",
                "Renal juxtaglomerular cell (RJC)",
                "Skin melanocyte (SM)",
                "Smooth muscle cell (SMC)",
                "Testicular Leydig cell (TLC)",
                "Thymic epithelial cell (TEC)",
                "Thyroid follicular cell (TFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Adrenal Gland Cell (AGC)",
            "Islet of Langerhans Cell (ILC)",
            "Pineal Gland Cell (PGC)",
            "Pituitary Gland Cell (PitGC)",
            "Thyroid Gland Cell (TGC)",
            "Parathyroid Gland Cell (ParGC)",
            "Pancreatic Islet Cell (PIC)",
            "Ovarian Follicular Cell (OFC)",
            "Testicular Leydig Cell (TLC)",
            "Hypothalamic Neurosecretory Cell (HNC)",
            "Posterior Pituitary Cell (PPC)",
            "Anterior Pituitary Cell (APC)",
            "Thyroid Parafollicular Cell (TPC)",
            "Parathyroid Chief Cell (PCC)",
            "Pancreatic Acinar Cell (PAC)",
            "Adrenal Medullary Cell (AMC)",
            "Pineal Gland Photoreceptor Cell (PGPC)",
            "Ovarian Theca Cell (OTC)",
            "Testicular Sertoli Cell (TSC)",
            "Hypothalamic Neurosecretory Magnocellular Cell (HNMC)",
            "Posterior Pituitary Neurosecretory Cell (PPNC)",
            "Anterior Pituitary Gonadotropic Cell (APGC)",
            "Thyroid Follicular Cell (TFC)",
            "Parathyroid Oxyphil Cell (POC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenal Gland Cell (AGC)",
                "Islet of Langerhans Cell (ILC)",
                "Pineal Gland Cell (PGC)",
                "Pituitary Gland Cell (PitGC)",
                "Thyroid Gland Cell (TGC)",
                "Parathyroid Gland Cell (ParGC)",
                "Pancreatic Islet Cell (PIC)",
                "Ovarian Follicular Cell (OFC)",
                "Testicular Leydig Cell (TLC)",
                "Hypothalamic Neurosecretory Cell (HNC)",
                "Posterior Pituitary Cell (PPC)",
                "Anterior Pituitary Cell (APC)",
                "Thyroid Parafollicular Cell (TPC)",
                "Parathyroid Chief Cell (PCC)",
                "Pancreatic Acinar Cell (PAC)",
                "Adrenal Medullary Cell (AMC)",
                "Pineal Gland Photoreceptor Cell (PGPC)",
                "Ovarian Theca Cell (OTC)",
                "Testicular Sertoli Cell (TSC)",
                "Hypothalamic Neurosecretory Magnocellular Cell (HNMC)",
                "Posterior Pituitary Neurosecretory Cell (PPNC)",
                "Anterior Pituitary Gonadotropic Cell (APGC)",
                "Thyroid Follicular Cell (TFC)",
                "Parathyroid Oxyphil Cell (POC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Gland Cell (AGC)",
                "Adrenal Medullary Cell (AMC)",
                "Anterior Pituitary Cell (APC)",
                "Anterior Pituitary Gonadotropic Cell (APGC)",
                "Hypothalamic Neurosecretory Cell (HNC)",
                "Hypothalamic Neurosecretory Magnocellular Cell (HNMC)",
                "Islet of Langerhans Cell (ILC)",
                "Ovarian Follicular Cell (OFC)",
                "Ovarian Theca Cell (OTC)",
                "Pancreatic Acinar Cell (PAC)",
                "Pancreatic Islet Cell (PIC)",
                "Parathyroid Chief Cell (PCC)",
                "Parathyroid Gland Cell (ParGC)",
                "Parathyroid Oxyphil Cell (POC)",
                "Pineal Gland Cell (PGC)",
                "Pineal Gland Photoreceptor Cell (PGPC)",
                "Pituitary Gland Cell (PitGC)",
                "Posterior Pituitary Cell (PPC)",
                "Posterior Pituitary Neurosecretory Cell (PPNC)",
                "Testicular Leydig Cell (TLC)",
                "Testicular Sertoli Cell (TSC)",
                "Thyroid Follicular Cell (TFC)",
                "Thyroid Gland Cell (TGC)",
                "Thyroid Parafollicular Cell (TPC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Adrenal Cortical Cell (AdCC)",
            "Anterior Pituitary Cell",
            "Corticotropin-Releasing Hormone (CRH) Cell",
            "Follicle-Stimulating Hormone (FSH) Cell",
            "Gonadotropin-Releasing Hormone (GnRH) Cell",
            "Insulinoma Cell",
            "Luteinizing Hormone (LH) Cell",
            "Melanotropin-Releasing Hormone (MHR) Cell",
            "Melatonin-Producing Cell",
            "Oxytocin-Producing Cell",
            "Prolactin-Producing Cell",
            "Prolactin-Releasing Hormone (PRH) Cell",
            "Somatostatin-Producing Cell",
            "Somatotropin-Releasing Hormone (SRH) Cell",
            "Thyroid-Stimulating Hormone (TSH) Cell",
            "Thyrotropin-Releasing Hormone (TRH) Cell",
            "Vasopressin-Producing Cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenal Cortical Cell (AdCC)",
                "Anterior Pituitary Cell",
                "Corticotropin-Releasing Hormone (CRH) Cell",
                "Follicle-Stimulating Hormone (FSH) Cell",
                "Gonadotropin-Releasing Hormone (GnRH) Cell",
                "Insulinoma Cell",
                "Luteinizing Hormone (LH) Cell",
                "Melanotropin-Releasing Hormone (MHR) Cell",
                "Melatonin-Producing Cell",
                "Oxytocin-Producing Cell",
                "Prolactin-Producing Cell",
                "Prolactin-Releasing Hormone (PRH) Cell",
                "Somatostatin-Producing Cell",
                "Somatotropin-Releasing Hormone (SRH) Cell",
                "Thyroid-Stimulating Hormone (TSH) Cell",
                "Thyrotropin-Releasing Hormone (TRH) Cell",
                "Vasopressin-Producing Cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Cortical Cell (AdCC)",
                "Anterior Pituitary Cell",
                "Corticotropin-Releasing Hormone (CRH) Cell",
                "Follicle-Stimulating Hormone (FSH) Cell",
                "Gonadotropin-Releasing Hormone (GnRH) Cell",
                "Insulinoma Cell",
                "Luteinizing Hormone (LH) Cell",
                "Melanotropin-Releasing Hormone (MHR) Cell",
                "Melatonin-Producing Cell",
                "Oxytocin-Producing Cell",
                "Prolactin-Producing Cell",
                "Prolactin-Releasing Hormone (PRH) Cell",
                "Somatostatin-Producing Cell",
                "Somatotropin-Releasing Hormone (SRH) Cell",
                "Thyroid-Stimulating Hormone (TSH) Cell",
                "Thyrotropin-Releasing Hormone (TRH) Cell",
                "Vasopressin-Producing Cell"
            ],
            "TP": 17,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Adrenocorticotropic cells (ACTH) in Pituitary gland",
            "Gonadotropes in Pituitary gland",
            "Thyrotropes in Pituitary gland",
            "Lactotropes in Pituitary gland",
            "Somatotropes in Pituitary gland",
            "Corticotropes in Pituitary gland",
            "Melanotropes in Pituitary gland",
            "Parathyroid cells in Parathyroid gland",
            "Thyroid epithelial cells in Thyroid gland",
            "Adrenal cortical cells in Adrenal gland",
            "Adrenal medullary cells in Adrenal gland",
            "Pancreatic beta cells in Pancreas",
            "Pancreatic alpha cells in Pancreas",
            "Pancreatic delta cells in Pancreas",
            "Pancreatic PP cells in Pancreas",
            "Oxytocinergic neurons in Hypothalamus",
            "Vasopressinergic neurons in Hypothalamus",
            "Gonadotropin-releasing hormone (GnRH) neurons in Hypothalamus",
            "Corticotropin-releasing hormone (CRH) neurons in Hypothalamus",
            "Thyrotropin-releasing hormone (TRH) neurons in Hypothalamus",
            "Growth hormone-releasing hormone (GHRH) neurons in Hypothalamus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenocorticotropic cells (ACTH) in Pituitary gland",
                "Gonadotropes in Pituitary gland",
                "Thyrotropes in Pituitary gland",
                "Lactotropes in Pituitary gland",
                "Somatotropes in Pituitary gland",
                "Corticotropes in Pituitary gland",
                "Melanotropes in Pituitary gland",
                "Parathyroid cells in Parathyroid gland",
                "Thyroid epithelial cells in Thyroid gland",
                "Adrenal cortical cells in Adrenal gland",
                "Adrenal medullary cells in Adrenal gland",
                "Pancreatic beta cells in Pancreas",
                "Pancreatic alpha cells in Pancreas",
                "Pancreatic delta cells in Pancreas",
                "Pancreatic PP cells in Pancreas",
                "Oxytocinergic neurons in Hypothalamus",
                "Vasopressinergic neurons in Hypothalamus",
                "Gonadotropin-releasing hormone (GnRH) neurons in Hypothalamus",
                "Corticotropin-releasing hormone (CRH) neurons in Hypothalamus",
                "Thyrotropin-releasing hormone (TRH) neurons in Hypothalamus",
                "Growth hormone-releasing hormone (GHRH) neurons in Hypothalamus"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal cortical cells in Adrenal gland",
                "Adrenal medullary cells in Adrenal gland",
                "Adrenocorticotropic cells (ACTH) in Pituitary gland",
                "Corticotropes in Pituitary gland",
                "Corticotropin-releasing hormone (CRH) neurons in Hypothalamus",
                "Gonadotropes in Pituitary gland",
                "Gonadotropin-releasing hormone (GnRH) neurons in Hypothalamus",
                "Growth hormone-releasing hormone (GHRH) neurons in Hypothalamus",
                "Lactotropes in Pituitary gland",
                "Melanotropes in Pituitary gland",
                "Oxytocinergic neurons in Hypothalamus",
                "Pancreatic PP cells in Pancreas",
                "Pancreatic alpha cells in Pancreas",
                "Pancreatic beta cells in Pancreas",
                "Pancreatic delta cells in Pancreas",
                "Parathyroid cells in Parathyroid gland",
                "Somatotropes in Pituitary gland",
                "Thyroid epithelial cells in Thyroid gland",
                "Thyrotropes in Pituitary gland",
                "Thyrotropin-releasing hormone (TRH) neurons in Hypothalamus",
                "Vasopressinergic neurons in Hypothalamus"
            ],
            "TP": 21,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            {
                "Referent": "pituitary gland",
                "Canonical name": "pituitary gland"
            },
            {
                "Referent": "thyroid gland",
                "Canonical name": "thyroid gland"
            },
            {
                "Referent": "adrenal gland",
                "Canonical name": "adrenal gland"
            },
            {
                "Referent": "parathyroid gland",
                "Canonical name": "parathyroid gland"
            },
            {
                "Referent": "pancreas",
                "Canonical name": "pancreas"
            },
            {
                "Referent": "gonads",
                "Canonical name": "gonads"
            },
            {
                "Referent": "thymus gland",
                "Canonical name": "thymus gland"
            },
            {
                "Referent": "spleen",
                "Canonical name": "spleen"
            },
            {
                "Referent": "lymph nodes",
                "Canonical name": "lymph nodes"
            },
            {
                "Referent": "testes",
                "Canonical name": "testes"
            },
            {
                "Referent": "ovaries",
                "Canonical name": "ovaries"
            },
            {
                "Referent": "prostate gland",
                "Canonical name": "prostate gland"
            },
            {
                "Referent": "uterus",
                "Canonical name": "uterus"
            },
            {
                "Referent": "fallopian tubes",
                "Canonical name": "fallopian tubes"
            },
            {
                "Referent": "cervix",
                "Canonical name": "cervix"
            },
            {
                "Referent": "vagina",
                "Canonical name": "vagina"
            },
            {
                "Referent": "kidneys",
                "Canonical name": "kidneys"
            },
            {
                "Referent": "adrenal medulla",
                "Canonical name": "adrenal medulla"
            },
            {
                "Referent": "pituitary gland",
                "Canonical name": "pituitary gland"
            },
            {
                "Referent": "thyroid gland",
                "Canonical name": "thyroid gland"
            },
            {
                "Referent": "adrenal gland",
                "Canonical name": "adrenal gland"
            },
            {
                "Referent": "parathyroid gland",
                "Canonical name": "parathyroid gland"
            },
            {
                "Referent": "pancreas",
                "Canonical name": "pancreas"
            },
            {
                "Referent": "gonads",
                "Canonical name": "gonads"
            },
            {
                "Referent": "thymus gland",
                "Canonical name": "thymus gland"
            },
            {
                "Referent": "spleen",
                "Canonical name": "spleen"
            },
            {
                "Referent": "lymph nodes",
                "Canonical name": "lymph nodes"
            },
            {
                "Referent": "testes",
                "Canonical name": "testes"
            },
            {
                "Referent": "ovaries",
                "Canonical name": "ovaries"
            },
            {
                "Referent": "prostate gland",
                "Canonical name": "prostate gland"
            },
            {
                "Referent": "uterus",
                "Canonical name": "uterus"
            },
            {
                "Referent": "fallopian tubes",
                "Canonical name": "fallopian tubes"
            },
            {
                "Referent": "cervix",
                "Canonical name": "cervix"
            },
            {
                "Referent": "vagina",
                "Canonical name": "vagina"
            },
            {
                "Referent": "kidneys",
                "Canonical name": "kidneys"
            },
            {
                "Referent": "adrenal medulla",
                "Canonical name": "adrenal medulla"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "pituitary gland",
                "thyroid gland",
                "adrenal gland",
                "parathyroid gland",
                "pancreas",
                "gonads",
                "thymus gland",
                "spleen",
                "lymph nodes",
                "testes",
                "ovaries",
                "prostate gland",
                "uterus",
                "fallopian tubes",
                "cervix",
                "vagina",
                "kidneys",
                "adrenal medulla"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"adrenal gland\", \"Canonical name\": \"adrenal gland\"}",
                "{\"Referent\": \"adrenal medulla\", \"Canonical name\": \"adrenal medulla\"}",
                "{\"Referent\": \"cervix\", \"Canonical name\": \"cervix\"}",
                "{\"Referent\": \"fallopian tubes\", \"Canonical name\": \"fallopian tubes\"}",
                "{\"Referent\": \"gonads\", \"Canonical name\": \"gonads\"}",
                "{\"Referent\": \"kidneys\", \"Canonical name\": \"kidneys\"}",
                "{\"Referent\": \"lymph nodes\", \"Canonical name\": \"lymph nodes\"}",
                "{\"Referent\": \"ovaries\", \"Canonical name\": \"ovaries\"}",
                "{\"Referent\": \"pancreas\", \"Canonical name\": \"pancreas\"}",
                "{\"Referent\": \"parathyroid gland\", \"Canonical name\": \"parathyroid gland\"}",
                "{\"Referent\": \"pituitary gland\", \"Canonical name\": \"pituitary gland\"}",
                "{\"Referent\": \"prostate gland\", \"Canonical name\": \"prostate gland\"}",
                "{\"Referent\": \"spleen\", \"Canonical name\": \"spleen\"}",
                "{\"Referent\": \"testes\", \"Canonical name\": \"testes\"}",
                "{\"Referent\": \"thymus gland\", \"Canonical name\": \"thymus gland\"}",
                "{\"Referent\": \"thyroid gland\", \"Canonical name\": \"thyroid gland\"}",
                "{\"Referent\": \"uterus\", \"Canonical name\": \"uterus\"}",
                "{\"Referent\": \"vagina\", \"Canonical name\": \"vagina\"}"
            ],
            "TP": 18,
            "FP": 0,
            "FN": 0
        }
    }
]