[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Adrenal medulla cell (APUD cell)",
            "Beta cell of the pancreas (B cell)",
            "Pituitary somatotroph cell (GH cell)",
            "Pituitary thyrotroph cell (TSH cell)",
            "Pituitary corticotroph cell (ACTH cell)",
            "Pituitary lactotroph cell (PRL cell)",
            "Pituitary gonadotroph cell (LH/FSH cell)",
            "Parathyroid cell (PTH cell)",
            "Thyroid follicular cell (T cell)",
            "Thyroid parafollicular cell (C cell)",
            "Ovarian granulosa cell (G cell)",
            "Ovarian theca cell (T cell)",
            "Testicular Leydig cell (L cell)",
            "Testicular Sertoli cell (S cell)",
            "Ovarian luteal cell (L cell)",
            "Gastric enterochromaffin-like cell (ECL cell)",
            "Intestinal enterochromaffin cell (EC cell)",
            "Small intestine D cell (D cell)",
            "Pancreatic alpha cell (A cell)",
            "Pancreatic delta cell (D cell)",
            "Colon C cell (C cell)",
            "Adrenal zona glomerulosa cell (ZG cell)",
            "Adrenal zona fasciculata cell (ZF cell)",
            "Adrenal zona reticularis cell (ZR cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenal medulla cell (APUD cell)",
                "Beta cell of the pancreas (B cell)",
                "Pituitary somatotroph cell (GH cell)",
                "Pituitary thyrotroph cell (TSH cell)",
                "Pituitary corticotroph cell (ACTH cell)",
                "Pituitary lactotroph cell (PRL cell)",
                "Pituitary gonadotroph cell (LH/FSH cell)",
                "Parathyroid cell (PTH cell)",
                "Thyroid follicular cell (T cell)",
                "Thyroid parafollicular cell (C cell)",
                "Ovarian granulosa cell (G cell)",
                "Ovarian theca cell (T cell)",
                "Testicular Leydig cell (L cell)",
                "Testicular Sertoli cell (S cell)",
                "Ovarian luteal cell (L cell)",
                "Gastric enterochromaffin-like cell (ECL cell)",
                "Intestinal enterochromaffin cell (EC cell)",
                "Small intestine D cell (D cell)",
                "Pancreatic alpha cell (A cell)",
                "Pancreatic delta cell (D cell)",
                "Colon C cell (C cell)",
                "Adrenal zona glomerulosa cell (ZG cell)",
                "Adrenal zona fasciculata cell (ZF cell)",
                "Adrenal zona reticularis cell (ZR cell)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal medulla cell (APUD cell)",
                "Adrenal zona fasciculata cell (ZF cell)",
                "Adrenal zona glomerulosa cell (ZG cell)",
                "Adrenal zona reticularis cell (ZR cell)",
                "Beta cell of the pancreas (B cell)",
                "Colon C cell (C cell)",
                "Gastric enterochromaffin-like cell (ECL cell)",
                "Intestinal enterochromaffin cell (EC cell)",
                "Ovarian granulosa cell (G cell)",
                "Ovarian luteal cell (L cell)",
                "Ovarian theca cell (T cell)",
                "Pancreatic alpha cell (A cell)",
                "Pancreatic delta cell (D cell)",
                "Parathyroid cell (PTH cell)",
                "Pituitary corticotroph cell (ACTH cell)",
                "Pituitary gonadotroph cell (LH/FSH cell)",
                "Pituitary lactotroph cell (PRL cell)",
                "Pituitary somatotroph cell (GH cell)",
                "Pituitary thyrotroph cell (TSH cell)",
                "Small intestine D cell (D cell)",
                "Testicular Leydig cell (L cell)",
                "Testicular Sertoli cell (S cell)",
                "Thyroid follicular cell (T cell)",
                "Thyroid parafollicular cell (C cell)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Alpha cell (\u03b1-cell)",
            "Beta cell (\u03b2-cell)",
            "Delta cell (\u03b4-cell)",
            "PP cell (PP-cell)",
            "Gamma cell (\u03b3-cell)",
            "G cell",
            "D cell",
            "Enterochromaffin-like cell (ECL cell)",
            "Somatostatin cell (SS cell)",
            "Thymic stromal lymphopoietin cell (TSLP cell)",
            "Insulin-producing cell",
            "Glucagon-producing cell",
            "Somatostatin-producing cell",
            "Pancreatic polypeptide-producing cell",
            "Gastrin cell",
            "Cholecystokinin cell",
            "Secretin cell",
            "Histamine cell",
            "Adrenocorticotropic hormone cell (ACTH cell)",
            "Melanocyte-stimulating hormone cell (MSH cell)",
            "Prolactin cell",
            "Growth hormone cell (GH cell)",
            "Thyroid-stimulating hormone cell (TSH cell)",
            "Luteinizing hormone cell (LH cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Delta cell (\u03b4-cell)",
                "PP cell (PP-cell)",
                "Gamma cell (\u03b3-cell)",
                "G cell",
                "D cell",
                "Enterochromaffin-like cell (ECL cell)",
                "Somatostatin cell (SS cell)",
                "Thymic stromal lymphopoietin cell (TSLP cell)",
                "Insulin-producing cell",
                "Glucagon-producing cell",
                "Somatostatin-producing cell",
                "Pancreatic polypeptide-producing cell",
                "Gastrin cell",
                "Cholecystokinin cell",
                "Secretin cell",
                "Histamine cell",
                "Adrenocorticotropic hormone cell (ACTH cell)",
                "Melanocyte-stimulating hormone cell (MSH cell)",
                "Prolactin cell",
                "Growth hormone cell (GH cell)",
                "Thyroid-stimulating hormone cell (TSH cell)",
                "Luteinizing hormone cell (LH cell)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocorticotropic hormone cell (ACTH cell)",
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Cholecystokinin cell",
                "D cell",
                "Delta cell (\u03b4-cell)",
                "Enterochromaffin-like cell (ECL cell)",
                "G cell",
                "Gamma cell (\u03b3-cell)",
                "Gastrin cell",
                "Glucagon-producing cell",
                "Growth hormone cell (GH cell)",
                "Histamine cell",
                "Insulin-producing cell",
                "Luteinizing hormone cell (LH cell)",
                "Melanocyte-stimulating hormone cell (MSH cell)",
                "PP cell (PP-cell)",
                "Pancreatic polypeptide-producing cell",
                "Prolactin cell",
                "Secretin cell",
                "Somatostatin cell (SS cell)",
                "Somatostatin-producing cell",
                "Thymic stromal lymphopoietin cell (TSLP cell)",
                "Thyroid-stimulating hormone cell (TSH cell)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Alpha cell (\u03b1-cell)",
            "Beta cell (\u03b2-cell)",
            "Delta cell (\u03b4-cell)",
            "Epsilon cell (\u03b5-cell)",
            "F cell",
            "G cell",
            "I cell",
            "K cell",
            "L cell",
            "M cell",
            "N cell",
            "P cell",
            "PP cell",
            "S cell",
            "T cell (Thyroid)",
            "C cell (Parathyroid)",
            "Chief cell",
            "Oxyphil cell",
            "Zymogen cell",
            "Parafollicular cell",
            "Marginal cell",
            "Interstitial cell of Leydig",
            "Theca cell",
            "Granulosa cell",
            "Pituicytes"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Delta cell (\u03b4-cell)",
                "Epsilon cell (\u03b5-cell)",
                "F cell",
                "G cell",
                "I cell",
                "K cell",
                "L cell",
                "M cell",
                "N cell",
                "P cell",
                "PP cell",
                "S cell",
                "T cell (Thyroid)",
                "C cell (Parathyroid)",
                "Chief cell",
                "Oxyphil cell",
                "Zymogen cell",
                "Parafollicular cell",
                "Marginal cell",
                "Interstitial cell of Leydig",
                "Theca cell",
                "Granulosa cell"
            ],
            "mismatches": [
                "Pituicytes"
            ],
            "true_referents": [
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "C cell (Parathyroid)",
                "Chief cell",
                "Delta cell (\u03b4-cell)",
                "Epsilon cell (\u03b5-cell)",
                "F cell",
                "G cell",
                "Granulosa cell",
                "I cell",
                "Interstitial cell of Leydig",
                "K cell",
                "L cell",
                "M cell",
                "Marginal cell",
                "N cell",
                "Oxyphil cell",
                "P cell",
                "PP cell",
                "Parafollicular cell",
                "S cell",
                "T cell (Thyroid)",
                "Theca cell",
                "Zymogen cell"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pancreatic Beta Cell (\u03b2-cell)",
            "Pancreatic Alpha Cell (\u03b1-cell)",
            "Thyroid Follicular Cell (TFC)",
            "Parathyroid Chief Cell (PTC)",
            "Adrenal Medullary Chromaffin Cell (AMC)",
            "Adrenal Cortical Zona Glomerulosa Cell (ZGC)",
            "Adrenal Cortical Zona Fasciculata Cell (ZFC)",
            "Adrenal Cortical Zona Reticularis Cell (ZRC)",
            "Hypothalamic Neurosecretory Cell (HNC)",
            "Pituitary Somatotroph (Som)",
            "Pituitary Lactotroph (Lac)",
            "Pituitary Corticotroph (Cort)",
            "Pituitary Thyrotroph (Thy)",
            "Pituitary Gonadotroph (Gon)",
            "Pinealocyte (Pineal cell)",
            "Gastric G Cell",
            "Intestinal Enteroendocrine K Cell",
            "Intestinal Enteroendocrine L Cell",
            "Renal Juxtaglomerular Cell (JGC)",
            "Ovarian Granulosa Cell (GC)",
            "Ovarian Theca Cell (TC)",
            "Testicular Leydig Cell (LC)",
            "Placental Syncytiotrophoblast (STB)",
            "C-Cell of the Thyroid (Parafollicular cell)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pancreatic Beta Cell (\u03b2-cell)",
                "Pancreatic Alpha Cell (\u03b1-cell)",
                "Thyroid Follicular Cell (TFC)",
                "Parathyroid Chief Cell (PTC)",
                "Adrenal Medullary Chromaffin Cell (AMC)",
                "Adrenal Cortical Zona Glomerulosa Cell (ZGC)",
                "Adrenal Cortical Zona Fasciculata Cell (ZFC)",
                "Adrenal Cortical Zona Reticularis Cell (ZRC)",
                "Hypothalamic Neurosecretory Cell (HNC)",
                "Pituitary Somatotroph (Som)",
                "Pituitary Lactotroph (Lac)",
                "Pituitary Corticotroph (Cort)",
                "Pituitary Thyrotroph (Thy)",
                "Pituitary Gonadotroph (Gon)",
                "Pinealocyte (Pineal cell)",
                "Gastric G Cell",
                "Intestinal Enteroendocrine K Cell",
                "Intestinal Enteroendocrine L Cell",
                "Renal Juxtaglomerular Cell (JGC)",
                "Ovarian Granulosa Cell (GC)",
                "Ovarian Theca Cell (TC)",
                "Testicular Leydig Cell (LC)",
                "Placental Syncytiotrophoblast (STB)",
                "C-Cell of the Thyroid (Parafollicular cell)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Cortical Zona Fasciculata Cell (ZFC)",
                "Adrenal Cortical Zona Glomerulosa Cell (ZGC)",
                "Adrenal Cortical Zona Reticularis Cell (ZRC)",
                "Adrenal Medullary Chromaffin Cell (AMC)",
                "C-Cell of the Thyroid (Parafollicular cell)",
                "Gastric G Cell",
                "Hypothalamic Neurosecretory Cell (HNC)",
                "Intestinal Enteroendocrine K Cell",
                "Intestinal Enteroendocrine L Cell",
                "Ovarian Granulosa Cell (GC)",
                "Ovarian Theca Cell (TC)",
                "Pancreatic Alpha Cell (\u03b1-cell)",
                "Pancreatic Beta Cell (\u03b2-cell)",
                "Parathyroid Chief Cell (PTC)",
                "Pinealocyte (Pineal cell)",
                "Pituitary Corticotroph (Cort)",
                "Pituitary Gonadotroph (Gon)",
                "Pituitary Lactotroph (Lac)",
                "Pituitary Somatotroph (Som)",
                "Pituitary Thyrotroph (Thy)",
                "Placental Syncytiotrophoblast (STB)",
                "Renal Juxtaglomerular Cell (JGC)",
                "Testicular Leydig Cell (LC)",
                "Thyroid Follicular Cell (TFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Thyroid follicular cell (TFC)",
            "Parathyroid chief cell (PCC)",
            "Adrenal cortex cell (ACC)",
            "Adrenal medulla chromaffin cell (AMCC)",
            "Pancreatic beta cell (PBC)",
            "Pancreatic alpha cell (PAC)",
            "Pancreatic delta cell (PDC)",
            "Anterior pituitary somatotroph (APS)",
            "Anterior pituitary lactotroph (APL)",
            "Anterior pituitary corticotroph (APC)",
            "Anterior pituitary thyrotroph (APT)",
            "Anterior pituitary gonadotroph (APG)",
            "Posterior pituitary pituicyte (PPP)",
            "Ovarian granulosa cell (OGC)",
            "Ovarian theca cell (OTC)",
            "Leydig cell (LC)",
            "Sertoli cell (SC)",
            "Pinealocyte (PC)",
            "Enteroendocrine cell (EEC)",
            "Gastric G cell (GGC)",
            "Gastric D cell (GDC)",
            "Gastric ECL cell (GECLC)",
            "Atrial myocyte (AM)",
            "Juxtaglomerular cell (JGC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thyroid follicular cell (TFC)",
                "Parathyroid chief cell (PCC)",
                "Adrenal cortex cell (ACC)",
                "Adrenal medulla chromaffin cell (AMCC)",
                "Pancreatic beta cell (PBC)",
                "Pancreatic alpha cell (PAC)",
                "Pancreatic delta cell (PDC)",
                "Anterior pituitary somatotroph (APS)",
                "Anterior pituitary lactotroph (APL)",
                "Anterior pituitary corticotroph (APC)",
                "Anterior pituitary thyrotroph (APT)",
                "Anterior pituitary gonadotroph (APG)",
                "Posterior pituitary pituicyte (PPP)",
                "Ovarian granulosa cell (OGC)",
                "Ovarian theca cell (OTC)",
                "Leydig cell (LC)",
                "Sertoli cell (SC)",
                "Pinealocyte (PC)",
                "Enteroendocrine cell (EEC)",
                "Gastric G cell (GGC)",
                "Gastric D cell (GDC)",
                "Gastric ECL cell (GECLC)",
                "Atrial myocyte (AM)",
                "Juxtaglomerular cell (JGC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal cortex cell (ACC)",
                "Adrenal medulla chromaffin cell (AMCC)",
                "Anterior pituitary corticotroph (APC)",
                "Anterior pituitary gonadotroph (APG)",
                "Anterior pituitary lactotroph (APL)",
                "Anterior pituitary somatotroph (APS)",
                "Anterior pituitary thyrotroph (APT)",
                "Atrial myocyte (AM)",
                "Enteroendocrine cell (EEC)",
                "Gastric D cell (GDC)",
                "Gastric ECL cell (GECLC)",
                "Gastric G cell (GGC)",
                "Juxtaglomerular cell (JGC)",
                "Leydig cell (LC)",
                "Ovarian granulosa cell (OGC)",
                "Ovarian theca cell (OTC)",
                "Pancreatic alpha cell (PAC)",
                "Pancreatic beta cell (PBC)",
                "Pancreatic delta cell (PDC)",
                "Parathyroid chief cell (PCC)",
                "Pinealocyte (PC)",
                "Posterior pituitary pituicyte (PPP)",
                "Sertoli cell (SC)",
                "Thyroid follicular cell (TFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Alpha cell (\u03b1-cell)",
            "Beta cell (\u03b2-cell)",
            "Delta cell (\u03b4-cell)",
            "Gamma cell (\u03b3-cell)",
            "PP cell (Pancreatic Polypeptide cell)",
            "Enteroendocrine cell",
            "Chromaffin cell",
            "Thyroid follicular cell",
            "Parafollicular cell (C cell)",
            "Adrenal cortex cell",
            "Leydig cell",
            "Sertoli cell",
            "Granulosa cell",
            "Theca cell",
            "Oxyphil cell",
            "Chief cell",
            "Pinealocyte",
            "Islet of Langerhans cell",
            "Neuroendocrine cell",
            "Adipocyte",
            "Gastric G cell",
            "Intestinal K cell",
            "Cardiac myocyte (endocrine function)",
            "Placental trophoblast cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Delta cell (\u03b4-cell)",
                "Gamma cell (\u03b3-cell)",
                "PP cell (Pancreatic Polypeptide cell)",
                "Enteroendocrine cell",
                "Chromaffin cell",
                "Thyroid follicular cell",
                "Parafollicular cell (C cell)",
                "Adrenal cortex cell",
                "Leydig cell",
                "Sertoli cell",
                "Granulosa cell",
                "Theca cell",
                "Oxyphil cell",
                "Chief cell",
                "Pinealocyte",
                "Islet of Langerhans cell",
                "Neuroendocrine cell",
                "Adipocyte",
                "Gastric G cell",
                "Intestinal K cell",
                "Cardiac myocyte (endocrine function)",
                "Placental trophoblast cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Adrenal cortex cell",
                "Alpha cell (\u03b1-cell)",
                "Beta cell (\u03b2-cell)",
                "Cardiac myocyte (endocrine function)",
                "Chief cell",
                "Chromaffin cell",
                "Delta cell (\u03b4-cell)",
                "Enteroendocrine cell",
                "Gamma cell (\u03b3-cell)",
                "Gastric G cell",
                "Granulosa cell",
                "Intestinal K cell",
                "Islet of Langerhans cell",
                "Leydig cell",
                "Neuroendocrine cell",
                "Oxyphil cell",
                "PP cell (Pancreatic Polypeptide cell)",
                "Parafollicular cell (C cell)",
                "Pinealocyte",
                "Placental trophoblast cell",
                "Sertoli cell",
                "Theca cell",
                "Thyroid follicular cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pancreatic Alpha Cell (\u03b1-cell)",
            "Pancreatic Beta Cell (\u03b2-cell)",
            "Pancreatic Delta Cell (\u03b4-cell)",
            "Pancreatic PP Cell (PP-cell)",
            "Pancreatic Epsilon Cell (\u03b5-cell)",
            "Thyroid Follicular Cell (TFC)",
            "Parathyroid Chief Cell (PCC)",
            "Adrenal Cortex Zona Glomerulosa Cell (ZGC)",
            "Adrenal Cortex Zona Fasciculata Cell (ZFC)",
            "Adrenal Cortex Zona Reticularis Cell (ZRC)",
            "Adrenal Medulla Chromaffin Cell (AMCC)",
            "Pituitary Anterior Lobe Somatotrope (PALS)",
            "Pituitary Anterior Lobe Lactotrope (PALL)",
            "Pituitary Anterior Lobe Corticotrope (PALC)",
            "Pituitary Anterior Lobe Thyrotrope (PALT)",
            "Pituitary Anterior Lobe Gonadotrope (PALG)",
            "Pituitary Posterior Lobe Magnocellular Neurosecretory Cell (PLMNC)",
            "Pituitary Posterior Lobe Parvocellular Neurosecretory Cell (PLPNC)",
            "Pineal Gland Pinealocyte (PGP)",
            "Hypothalamic Neuroendocrine Cell (HNC)",
            "Ovarian Granulosa Cell (OGC)",
            "Testicular Leydig Cell (TLC)",
            "Testicular Sertoli Cell (TSC)",
            "Placental Trophoblast Cell (PTC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pancreatic Alpha Cell (\u03b1-cell)",
                "Pancreatic Beta Cell (\u03b2-cell)",
                "Pancreatic Delta Cell (\u03b4-cell)",
                "Pancreatic PP Cell (PP-cell)",
                "Pancreatic Epsilon Cell (\u03b5-cell)",
                "Thyroid Follicular Cell (TFC)",
                "Parathyroid Chief Cell (PCC)",
                "Adrenal Cortex Zona Glomerulosa Cell (ZGC)",
                "Adrenal Cortex Zona Fasciculata Cell (ZFC)",
                "Adrenal Cortex Zona Reticularis Cell (ZRC)",
                "Adrenal Medulla Chromaffin Cell (AMCC)",
                "Pituitary Anterior Lobe Somatotrope (PALS)",
                "Pituitary Anterior Lobe Lactotrope (PALL)",
                "Pituitary Anterior Lobe Corticotrope (PALC)",
                "Pituitary Anterior Lobe Thyrotrope (PALT)",
                "Pituitary Anterior Lobe Gonadotrope (PALG)",
                "Pituitary Posterior Lobe Magnocellular Neurosecretory Cell (PLMNC)",
                "Pituitary Posterior Lobe Parvocellular Neurosecretory Cell (PLPNC)",
                "Pineal Gland Pinealocyte (PGP)",
                "Hypothalamic Neuroendocrine Cell (HNC)",
                "Ovarian Granulosa Cell (OGC)",
                "Testicular Leydig Cell (TLC)",
                "Testicular Sertoli Cell (TSC)",
                "Placental Trophoblast Cell (PTC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Cortex Zona Fasciculata Cell (ZFC)",
                "Adrenal Cortex Zona Glomerulosa Cell (ZGC)",
                "Adrenal Cortex Zona Reticularis Cell (ZRC)",
                "Adrenal Medulla Chromaffin Cell (AMCC)",
                "Hypothalamic Neuroendocrine Cell (HNC)",
                "Ovarian Granulosa Cell (OGC)",
                "Pancreatic Alpha Cell (\u03b1-cell)",
                "Pancreatic Beta Cell (\u03b2-cell)",
                "Pancreatic Delta Cell (\u03b4-cell)",
                "Pancreatic Epsilon Cell (\u03b5-cell)",
                "Pancreatic PP Cell (PP-cell)",
                "Parathyroid Chief Cell (PCC)",
                "Pineal Gland Pinealocyte (PGP)",
                "Pituitary Anterior Lobe Corticotrope (PALC)",
                "Pituitary Anterior Lobe Gonadotrope (PALG)",
                "Pituitary Anterior Lobe Lactotrope (PALL)",
                "Pituitary Anterior Lobe Somatotrope (PALS)",
                "Pituitary Anterior Lobe Thyrotrope (PALT)",
                "Pituitary Posterior Lobe Magnocellular Neurosecretory Cell (PLMNC)",
                "Pituitary Posterior Lobe Parvocellular Neurosecretory Cell (PLPNC)",
                "Placental Trophoblast Cell (PTC)",
                "Testicular Leydig Cell (TLC)",
                "Testicular Sertoli Cell (TSC)",
                "Thyroid Follicular Cell (TFC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pancreatic beta cell",
            "Thyroid follicular cell",
            "Adrenal cortex cell",
            "Pituitary gonadotroph cell",
            "Parathyroid chief cell",
            "Ovarian granulosa cell",
            "Testicular Leydig cell",
            "Adipocyte",
            "Hypothalamic neurosecretory cell",
            "Gastric G cell",
            "Intestinal enteroendocrine cell",
            "Pinealocyte",
            "Pituitary lactotroph cell",
            "Thymic epithelial cell",
            "Adrenal medulla chromaffin cell",
            "Pituitary corticotroph cell",
            "Adrenal zona reticularis cell",
            "Thyroid parafollicular cell",
            "Hepatocyte",
            "Renal juxtaglomerular cell",
            "Adrenal zona fasciculata cell",
            "Placental syncytiotrophoblast cell",
            "Pituitary somatotroph cell",
            "Adrenal zona glomerulosa cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pancreatic beta cell",
                "Thyroid follicular cell",
                "Adrenal cortex cell",
                "Pituitary gonadotroph cell",
                "Parathyroid chief cell",
                "Ovarian granulosa cell",
                "Testicular Leydig cell",
                "Adipocyte",
                "Hypothalamic neurosecretory cell",
                "Gastric G cell",
                "Intestinal enteroendocrine cell",
                "Pinealocyte",
                "Pituitary lactotroph cell",
                "Thymic epithelial cell",
                "Adrenal medulla chromaffin cell",
                "Pituitary corticotroph cell",
                "Adrenal zona reticularis cell",
                "Thyroid parafollicular cell",
                "Hepatocyte",
                "Renal juxtaglomerular cell",
                "Adrenal zona fasciculata cell",
                "Placental syncytiotrophoblast cell",
                "Pituitary somatotroph cell",
                "Adrenal zona glomerulosa cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Adrenal cortex cell",
                "Adrenal medulla chromaffin cell",
                "Adrenal zona fasciculata cell",
                "Adrenal zona glomerulosa cell",
                "Adrenal zona reticularis cell",
                "Gastric G cell",
                "Hepatocyte",
                "Hypothalamic neurosecretory cell",
                "Intestinal enteroendocrine cell",
                "Ovarian granulosa cell",
                "Pancreatic beta cell",
                "Parathyroid chief cell",
                "Pinealocyte",
                "Pituitary corticotroph cell",
                "Pituitary gonadotroph cell",
                "Pituitary lactotroph cell",
                "Pituitary somatotroph cell",
                "Placental syncytiotrophoblast cell",
                "Renal juxtaglomerular cell",
                "Testicular Leydig cell",
                "Thymic epithelial cell",
                "Thyroid follicular cell",
                "Thyroid parafollicular cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pancreatic beta cell (\u03b2 cell)",
            "Pancreatic alpha cell (\u03b1 cell)",
            "Pancreatic delta cell (\u03b4 cell)",
            "Pancreatic PP cell",
            "Parathyroid chief cell",
            "Thyroid follicular cell",
            "Thyroid parafollicular cell (C cell)",
            "Adrenal cortical cell",
            "Adrenal medullary chromaffin cell",
            "Pituitary somatotroph",
            "Pituitary lactotroph",
            "Pituitary corticotroph",
            "Pituitary thyrotroph",
            "Pituitary gonadotroph",
            "Pinealocyte",
            "Enteroendocrine L cell",
            "Enteroendocrine G cell",
            "Enteroendocrine S cell",
            "Enteroendocrine I cell",
            "Leydig cell",
            "Granulosa cell",
            "Renal EPO-producing interstitial cell",
            "Pulmonary neuroendocrine cell",
            "Neuroendocrine pancreatic epsilon cell",
            "Thymic endocrine cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pancreatic beta cell (\u03b2 cell)",
                "Pancreatic alpha cell (\u03b1 cell)",
                "Pancreatic delta cell (\u03b4 cell)",
                "Pancreatic PP cell",
                "Parathyroid chief cell",
                "Thyroid follicular cell",
                "Thyroid parafollicular cell (C cell)",
                "Adrenal cortical cell",
                "Adrenal medullary chromaffin cell",
                "Pituitary somatotroph",
                "Pituitary lactotroph",
                "Pituitary corticotroph",
                "Pituitary thyrotroph",
                "Pituitary gonadotroph",
                "Pinealocyte",
                "Enteroendocrine L cell",
                "Enteroendocrine G cell",
                "Enteroendocrine S cell",
                "Enteroendocrine I cell",
                "Leydig cell",
                "Granulosa cell",
                "Renal EPO-producing interstitial cell",
                "Pulmonary neuroendocrine cell",
                "Neuroendocrine pancreatic epsilon cell"
            ],
            "mismatches": [
                "Thymic endocrine cell"
            ],
            "true_referents": [
                "Adrenal cortical cell",
                "Adrenal medullary chromaffin cell",
                "Enteroendocrine G cell",
                "Enteroendocrine I cell",
                "Enteroendocrine L cell",
                "Enteroendocrine S cell",
                "Granulosa cell",
                "Leydig cell",
                "Neuroendocrine pancreatic epsilon cell",
                "Pancreatic PP cell",
                "Pancreatic alpha cell (\u03b1 cell)",
                "Pancreatic beta cell (\u03b2 cell)",
                "Pancreatic delta cell (\u03b4 cell)",
                "Parathyroid chief cell",
                "Pinealocyte",
                "Pituitary corticotroph",
                "Pituitary gonadotroph",
                "Pituitary lactotroph",
                "Pituitary somatotroph",
                "Pituitary thyrotroph",
                "Pulmonary neuroendocrine cell",
                "Renal EPO-producing interstitial cell",
                "Thyroid follicular cell",
                "Thyroid parafollicular cell (C cell)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pancreatic beta cell (\u03b2 cell)",
            "Thyroid follicular cell",
            "Adrenal cortical cell",
            "Pituitary somatotroph",
            "Leydig cell",
            "Ovarian granulosa cell",
            "Pinealocyte",
            "Parathyroid chief cell",
            "Gastric G cell",
            "Enteroendocrine K cell",
            "Juxtaglomerular cell",
            "Chromaffin cell",
            "Pancreatic alpha cell (\u03b1 cell)",
            "Thyroid C cell (parafollicular cell)",
            "Pituitary gonadotroph",
            "Sertoli cell",
            "Ovarian theca cell",
            "Enterochromaffin cell",
            "Pancreatic delta cell (\u03b4 cell)",
            "Pituitary corticotroph",
            "Pituitary lactotroph",
            "Pituitary thyrotroph",
            "Enteroendocrine L cell",
            "Renin-secreting cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pancreatic beta cell (\u03b2 cell)",
                "Thyroid follicular cell",
                "Adrenal cortical cell",
                "Pituitary somatotroph",
                "Leydig cell",
                "Ovarian granulosa cell",
                "Pinealocyte",
                "Parathyroid chief cell",
                "Gastric G cell",
                "Enteroendocrine K cell",
                "Juxtaglomerular cell",
                "Chromaffin cell",
                "Pancreatic alpha cell (\u03b1 cell)",
                "Thyroid C cell (parafollicular cell)",
                "Pituitary gonadotroph",
                "Sertoli cell",
                "Ovarian theca cell",
                "Enterochromaffin cell",
                "Pancreatic delta cell (\u03b4 cell)",
                "Pituitary corticotroph",
                "Pituitary lactotroph",
                "Pituitary thyrotroph",
                "Enteroendocrine L cell",
                "Renin-secreting cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal cortical cell",
                "Chromaffin cell",
                "Enterochromaffin cell",
                "Enteroendocrine K cell",
                "Enteroendocrine L cell",
                "Gastric G cell",
                "Juxtaglomerular cell",
                "Leydig cell",
                "Ovarian granulosa cell",
                "Ovarian theca cell",
                "Pancreatic alpha cell (\u03b1 cell)",
                "Pancreatic beta cell (\u03b2 cell)",
                "Pancreatic delta cell (\u03b4 cell)",
                "Parathyroid chief cell",
                "Pinealocyte",
                "Pituitary corticotroph",
                "Pituitary gonadotroph",
                "Pituitary lactotroph",
                "Pituitary somatotroph",
                "Pituitary thyrotroph",
                "Renin-secreting cell",
                "Sertoli cell",
                "Thyroid C cell (parafollicular cell)",
                "Thyroid follicular cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Alpha cells (\u03b1 cells)",
            "Beta cells (\u03b2 cells)",
            "Delta cells (\u03b4 cells)",
            "Gamma cells (\u03b3 cells)",
            "Epsilon cells (\u03b5 cells)",
            "PP cells",
            "D1 cells",
            "Enterochromaffin cells (EC cells)",
            "G cells",
            "I cells",
            "K cells",
            "L cells",
            "M cells",
            "N cells",
            "P cells",
            "S cells",
            "X cells",
            "Chief cells",
            "Oxyphil cells",
            "Pituitary acidophil cells",
            "Pituitary basophil cells",
            "Pituitary chromophobe cells",
            "Leydig cells",
            "Sertoli cells"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha cells (\u03b1 cells)",
                "Beta cells (\u03b2 cells)",
                "Delta cells (\u03b4 cells)",
                "Gamma cells (\u03b3 cells)",
                "Epsilon cells (\u03b5 cells)",
                "PP cells",
                "D1 cells",
                "Enterochromaffin cells (EC cells)",
                "G cells",
                "I cells",
                "K cells",
                "L cells",
                "M cells",
                "N cells",
                "P cells",
                "S cells",
                "X cells",
                "Chief cells",
                "Oxyphil cells",
                "Pituitary acidophil cells",
                "Pituitary basophil cells",
                "Pituitary chromophobe cells",
                "Leydig cells",
                "Sertoli cells"
            ],
            "mismatches": [],
            "true_referents": [
                "Alpha cells (\u03b1 cells)",
                "Beta cells (\u03b2 cells)",
                "Chief cells",
                "D1 cells",
                "Delta cells (\u03b4 cells)",
                "Enterochromaffin cells (EC cells)",
                "Epsilon cells (\u03b5 cells)",
                "G cells",
                "Gamma cells (\u03b3 cells)",
                "I cells",
                "K cells",
                "L cells",
                "Leydig cells",
                "M cells",
                "N cells",
                "Oxyphil cells",
                "P cells",
                "PP cells",
                "Pituitary acidophil cells",
                "Pituitary basophil cells",
                "Pituitary chromophobe cells",
                "S cells",
                "Sertoli cells",
                "X cells"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Alpha cell (\u03b1 cell)",
            "Beta cell (\u03b2 cell)",
            "Delta cell (\u03b4 cell)",
            "Epsilon cell (\u03b5 cell)",
            "Follicular cell",
            "Leydig cell",
            "Sertoli cell",
            "Theca cell",
            "Thyroid follicular cell",
            "Adrenal cortex cell",
            "Adrenal medulla cell",
            "Parathyroid cell",
            "Pituitary cell",
            "Pancreatic islet cell",
            "Adipocyte",
            "Ovarian cell",
            "Testicular cell",
            "Pinealocyte",
            "Enteroendocrine cell",
            "Hypothalamic neurosecretory cell",
            "Thymic epithelial cell",
            "Placental cell",
            "Kidney cell",
            "Liver cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alpha cell (\u03b1 cell)",
                "Beta cell (\u03b2 cell)",
                "Delta cell (\u03b4 cell)",
                "Epsilon cell (\u03b5 cell)",
                "Follicular cell",
                "Leydig cell",
                "Sertoli cell",
                "Theca cell",
                "Thyroid follicular cell",
                "Adrenal cortex cell",
                "Adrenal medulla cell",
                "Parathyroid cell",
                "Pituitary cell",
                "Pancreatic islet cell",
                "Adipocyte",
                "Ovarian cell",
                "Testicular cell",
                "Pinealocyte",
                "Enteroendocrine cell",
                "Hypothalamic neurosecretory cell",
                "Thymic epithelial cell",
                "Placental cell",
                "Kidney cell",
                "Liver cell"
            ],
            "mismatches": [],
            "true_referents": [
                "Adipocyte",
                "Adrenal cortex cell",
                "Adrenal medulla cell",
                "Alpha cell (\u03b1 cell)",
                "Beta cell (\u03b2 cell)",
                "Delta cell (\u03b4 cell)",
                "Enteroendocrine cell",
                "Epsilon cell (\u03b5 cell)",
                "Follicular cell",
                "Hypothalamic neurosecretory cell",
                "Kidney cell",
                "Leydig cell",
                "Liver cell",
                "Ovarian cell",
                "Pancreatic islet cell",
                "Parathyroid cell",
                "Pinealocyte",
                "Pituitary cell",
                "Placental cell",
                "Sertoli cell",
                "Testicular cell",
                "Theca cell",
                "Thymic epithelial cell",
                "Thyroid follicular cell"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Adrenal Cortical Cell (ACC)",
            "Adrenal Medullary Cell (AMC)",
            "Anterior Pituitary Cell (APC)",
            "Beta Cell (BC)",
            "Chief Cell (CC)",
            "Delta Cell (DC)",
            "Ectopic Hormone-Producing Cell (EHPC)",
            "Enterochromaffin Cell (EC)",
            "Folliculostellate Cell (FSC)",
            "Gonadotroph Cell (GC)",
            "Islet Cell (IC)",
            "Lactotroph Cell (LC)",
            "Melanotroph Cell (MC)",
            "Neuroendocrine Cell (NEC)",
            "Oxyphil Cell (OC)",
            "Parathyroid Cell (PC)",
            "Pinealocyte (PNC)",
            "Posterior Pituitary Cell (PPC)",
            "Principal Cell (PRC)",
            "Prolactin-Secreting Cell (PSC)",
            "Somatotroph Cell (SC)",
            "Thyrotroph Cell (TC)",
            "Thyroid Follicular Cell (TFC)",
            "Thyroid Parafollicular Cell (TPFC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenal Cortical Cell (ACC)",
                "Adrenal Medullary Cell (AMC)",
                "Anterior Pituitary Cell (APC)",
                "Beta Cell (BC)",
                "Chief Cell (CC)",
                "Delta Cell (DC)",
                "Ectopic Hormone-Producing Cell (EHPC)",
                "Enterochromaffin Cell (EC)",
                "Folliculostellate Cell (FSC)",
                "Gonadotroph Cell (GC)",
                "Islet Cell (IC)",
                "Lactotroph Cell (LC)",
                "Melanotroph Cell (MC)",
                "Neuroendocrine Cell (NEC)",
                "Oxyphil Cell (OC)",
                "Parathyroid Cell (PC)",
                "Pinealocyte (PNC)",
                "Posterior Pituitary Cell (PPC)",
                "Principal Cell (PRC)",
                "Prolactin-Secreting Cell (PSC)",
                "Somatotroph Cell (SC)",
                "Thyrotroph Cell (TC)",
                "Thyroid Follicular Cell (TFC)",
                "Thyroid Parafollicular Cell (TPFC)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenal Cortical Cell (ACC)",
                "Adrenal Medullary Cell (AMC)",
                "Anterior Pituitary Cell (APC)",
                "Beta Cell (BC)",
                "Chief Cell (CC)",
                "Delta Cell (DC)",
                "Ectopic Hormone-Producing Cell (EHPC)",
                "Enterochromaffin Cell (EC)",
                "Folliculostellate Cell (FSC)",
                "Gonadotroph Cell (GC)",
                "Islet Cell (IC)",
                "Lactotroph Cell (LC)",
                "Melanotroph Cell (MC)",
                "Neuroendocrine Cell (NEC)",
                "Oxyphil Cell (OC)",
                "Parathyroid Cell (PC)",
                "Pinealocyte (PNC)",
                "Posterior Pituitary Cell (PPC)",
                "Principal Cell (PRC)",
                "Prolactin-Secreting Cell (PSC)",
                "Somatotroph Cell (SC)",
                "Thyroid Follicular Cell (TFC)",
                "Thyroid Parafollicular Cell (TPFC)",
                "Thyrotroph Cell (TC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Pancreatic beta cells (\u03b2-cells) (INS-1 cells)",
            "Adrenal medullary chromaffin cells",
            "Thyroid follicular cells (T3/T4-producing cells)",
            "Pituitary gland cells (e.g. somatotropes, lactotropes)",
            "Anterior pituitary corticotropes (ACTH-producing cells)",
            "Posterior pituitary neurohypophysial cells (oxytocin/vasopressin-producing cells)",
            "Thyroid parafollicular cells (calcitonin-producing cells)",
            "Adrenal cortical cells (glucocorticoid-producing cells)",
            "Pancreatic alpha cells (\u03b1-cells) (glucagon-producing cells)",
            "Gonadotropes (FSH/LH-producing cells)",
            "Thyrotropes (TSH-producing cells)",
            "Adrenal medullary sympathetic neurons",
            "Islet cells (pancreatic islets of Langerhans)",
            "Pituitary gonadotropes (FSH/LH-producing cells)",
            "Thyroid C cells (calcitonin-producing cells)",
            "Adrenal cortical zona glomerulosa cells (aldosterone-producing cells)",
            "Pancreatic delta cells (\u03b4-cells) (somatostatin-producing cells)",
            "Thyroid follicular epithelial cells (T3/T4-producing cells)",
            "Pituitary somatotropes (growth hormone-producing cells)",
            "Adrenal cortical zona fasciculata cells (glucocorticoid-producing cells)",
            "Pancreatic PP cells (pancreatic polypeptide-producing cells)",
            "Gastric G cells (gastrin-producing cells)",
            "Adrenal cortical zona reticularis cells (androgens-producing cells)",
            "Thyroid parafollicular C cells (calcitonin-producing cells)",
            "Pituitary lactotropes (prolactin-producing cells)",
            "Adrenal medullary paraganglioma cells"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pancreatic beta cells (\u03b2-cells) (INS-1 cells)",
                "Adrenal medullary chromaffin cells",
                "Thyroid follicular cells (T3/T4-producing cells)",
                "Pituitary gland cells (e.g. somatotropes, lactotropes)",
                "Anterior pituitary corticotropes (ACTH-producing cells)",
                "Posterior pituitary neurohypophysial cells (oxytocin/vasopressin-producing cells)",
                "Thyroid parafollicular cells (calcitonin-producing cells)",
                "Adrenal cortical cells (glucocorticoid-producing cells)",
                "Pancreatic alpha cells (\u03b1-cells) (glucagon-producing cells)",
                "Gonadotropes (FSH/LH-producing cells)",
                "Thyrotropes (TSH-producing cells)",
                "Adrenal medullary sympathetic neurons",
                "Islet cells (pancreatic islets of Langerhans)",
                "Pituitary gonadotropes (FSH/LH-producing cells)",
                "Thyroid C cells (calcitonin-producing cells)",
                "Adrenal cortical zona glomerulosa cells (aldosterone-producing cells)",
                "Pancreatic delta cells (\u03b4-cells) (somatostatin-producing cells)",
                "Thyroid follicular epithelial cells (T3/T4-producing cells)",
                "Pituitary somatotropes (growth hormone-producing cells)",
                "Adrenal cortical zona fasciculata cells (glucocorticoid-producing cells)",
                "Pancreatic PP cells (pancreatic polypeptide-producing cells)",
                "Gastric G cells (gastrin-producing cells)",
                "Adrenal cortical zona reticularis cells (androgens-producing cells)",
                "Thyroid parafollicular C cells (calcitonin-producing cells)"
            ],
            "mismatches": [
                "Pituitary lactotropes (prolactin-producing cells)",
                "Adrenal medullary paraganglioma cells"
            ],
            "true_referents": [
                "Adrenal cortical cells (glucocorticoid-producing cells)",
                "Adrenal cortical zona fasciculata cells (glucocorticoid-producing cells)",
                "Adrenal cortical zona glomerulosa cells (aldosterone-producing cells)",
                "Adrenal cortical zona reticularis cells (androgens-producing cells)",
                "Adrenal medullary chromaffin cells",
                "Adrenal medullary sympathetic neurons",
                "Anterior pituitary corticotropes (ACTH-producing cells)",
                "Gastric G cells (gastrin-producing cells)",
                "Gonadotropes (FSH/LH-producing cells)",
                "Islet cells (pancreatic islets of Langerhans)",
                "Pancreatic PP cells (pancreatic polypeptide-producing cells)",
                "Pancreatic alpha cells (\u03b1-cells) (glucagon-producing cells)",
                "Pancreatic beta cells (\u03b2-cells) (INS-1 cells)",
                "Pancreatic delta cells (\u03b4-cells) (somatostatin-producing cells)",
                "Pituitary gland cells (e.g. somatotropes, lactotropes)",
                "Pituitary gonadotropes (FSH/LH-producing cells)",
                "Pituitary somatotropes (growth hormone-producing cells)",
                "Posterior pituitary neurohypophysial cells (oxytocin/vasopressin-producing cells)",
                "Thyroid C cells (calcitonin-producing cells)",
                "Thyroid follicular cells (T3/T4-producing cells)",
                "Thyroid follicular epithelial cells (T3/T4-producing cells)",
                "Thyroid parafollicular C cells (calcitonin-producing cells)",
                "Thyroid parafollicular cells (calcitonin-producing cells)",
                "Thyrotropes (TSH-producing cells)"
            ],
            "TP": 24,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            "Insulin-producing beta cell (\u03b2-cell)",
            "Glucagon-producing alpha cell (\u03b1-cell)",
            "Somatostatin-producing delta cell (\u03b4-cell)",
            "Pancreatic polypeptide-producing PP cell (PP-cell)",
            "Gastrin-producing G cell",
            "Cholecystokinin-producing I cell",
            "Secretin-producing S cell",
            "Motilin-producing M cell",
            "Ghrelin-producing P/D1 cell",
            "Corticotropic cell (corticotroph)",
            "Thyrotropic cell (thyrotroph)",
            "Gonadotropic cell (gonadotroph)",
            "Lactotropic cell (lactotroph)",
            "Somatotropic cell (somatotroph)",
            "Parathyroid chief cell",
            "Oxytocin-producing magnocellular neuron",
            "Vasopressin-producing magnocellular neuron",
            "Adrenocorticotropic hormone-producing cell (corticotroph)",
            "Follicle-stimulating hormone-producing cell (gonadotroph)",
            "Luteinizing hormone-producing cell (gonadotroph)",
            "Prolactin-producing lactotroph",
            "Thyroid-stimulating hormone-producing cell (thyrotroph)",
            "Growth hormone-producing cell (somatotroph)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin-producing beta cell (\u03b2-cell)",
                "Glucagon-producing alpha cell (\u03b1-cell)",
                "Somatostatin-producing delta cell (\u03b4-cell)",
                "Pancreatic polypeptide-producing PP cell (PP-cell)",
                "Gastrin-producing G cell",
                "Cholecystokinin-producing I cell",
                "Secretin-producing S cell",
                "Motilin-producing M cell",
                "Ghrelin-producing P/D1 cell",
                "Corticotropic cell (corticotroph)",
                "Thyrotropic cell (thyrotroph)",
                "Gonadotropic cell (gonadotroph)",
                "Lactotropic cell (lactotroph)",
                "Somatotropic cell (somatotroph)",
                "Parathyroid chief cell",
                "Oxytocin-producing magnocellular neuron",
                "Vasopressin-producing magnocellular neuron",
                "Adrenocorticotropic hormone-producing cell (corticotroph)",
                "Follicle-stimulating hormone-producing cell (gonadotroph)",
                "Luteinizing hormone-producing cell (gonadotroph)",
                "Prolactin-producing lactotroph",
                "Thyroid-stimulating hormone-producing cell (thyrotroph)",
                "Growth hormone-producing cell (somatotroph)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocorticotropic hormone-producing cell (corticotroph)",
                "Cholecystokinin-producing I cell",
                "Corticotropic cell (corticotroph)",
                "Follicle-stimulating hormone-producing cell (gonadotroph)",
                "Gastrin-producing G cell",
                "Ghrelin-producing P/D1 cell",
                "Glucagon-producing alpha cell (\u03b1-cell)",
                "Gonadotropic cell (gonadotroph)",
                "Growth hormone-producing cell (somatotroph)",
                "Insulin-producing beta cell (\u03b2-cell)",
                "Lactotropic cell (lactotroph)",
                "Luteinizing hormone-producing cell (gonadotroph)",
                "Motilin-producing M cell",
                "Oxytocin-producing magnocellular neuron",
                "Pancreatic polypeptide-producing PP cell (PP-cell)",
                "Parathyroid chief cell",
                "Prolactin-producing lactotroph",
                "Secretin-producing S cell",
                "Somatostatin-producing delta cell (\u03b4-cell)",
                "Somatotropic cell (somatotroph)",
                "Thyroid-stimulating hormone-producing cell (thyrotroph)",
                "Thyrotropic cell (thyrotroph)",
                "Vasopressin-producing magnocellular neuron"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "endocrine cell",
        "domain": "biology",
        "response": [
            {
                "Referent": "pituitary gland (PIT)",
                "Canonical name": "pituitary gland"
            },
            {
                "Referent": "thyroid gland (THY)",
                "Canonical name": "thyroid gland"
            },
            {
                "Referent": "parathyroid gland (PAR)",
                "Canonical name": "parathyroid gland"
            },
            {
                "Referent": "adrenal gland (ADR)",
                "Canonical name": "adrenal gland"
            },
            {
                "Referent": "pancreas (PAN)",
                "Canonical name": "pancreas"
            },
            {
                "Referent": "gonads (GON)",
                "Canonical name": "gonads"
            },
            {
                "Referent": "thymus gland (THY)",
                "Canonical name": "thymus gland"
            },
            {
                "Referent": "spleen (SPL)",
                "Canonical name": "spleen"
            },
            {
                "Referent": "lymph nodes (LYM)",
                "Canonical name": "lymph nodes"
            },
            {
                "Referent": "thymus gland (THY)",
                "Canonical name": "thymus gland"
            },
            {
                "Referent": "bone marrow (BMR)",
                "Canonical name": "bone marrow"
            },
            {
                "Referent": "testes (TES)",
                "Canonical name": "testes"
            },
            {
                "Referent": "ovaries (OVX)",
                "Canonical name": "ovaries"
            },
            {
                "Referent": "prostate gland (PRT)",
                "Canonical name": "prostate gland"
            },
            {
                "Referent": "uterus (UTE)",
                "Canonical name": "uterus"
            },
            {
                "Referent": "vagina (VAG)",
                "Canonical name": "vagina"
            },
            {
                "Referent": "corpus luteum (CLT)",
                "Canonical name": "corpus luteum"
            },
            {
                "Referent": "placenta (PLA)",
                "Canonical name": "placenta"
            },
            {
                "Referent": "menstrual cycle (MEN)",
                "Canonical name": "menstrual cycle"
            },
            {
                "Referent": "pregnancy (PREG)",
                "Canonical name": "pregnancy"
            },
            {
                "Referent": "lactation (LAC)",
                "Canonical name": "lactation"
            },
            {
                "Referent": "menopause (MENO)",
                "Canonical name": "menopause"
            },
            {
                "Referent": "pregnancy (PREG)",
                "Canonical name": "pregnancy"
            },
            {
                "Referent": "lactation (LAC)",
                "Canonical name": "lactation"
            },
            {
                "Referent": "menopause (MENO)",
                "Canonical name": "menopause"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "pituitary gland",
                "thyroid gland",
                "parathyroid gland",
                "adrenal gland",
                "pancreas",
                "gonads",
                "thymus gland",
                "spleen",
                "lymph nodes",
                "bone marrow",
                "testes",
                "ovaries",
                "prostate gland",
                "uterus",
                "vagina",
                "corpus luteum",
                "placenta",
                "menstrual cycle",
                "pregnancy",
                "lactation",
                "menopause"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"adrenal gland (ADR)\", \"Canonical name\": \"adrenal gland\"}",
                "{\"Referent\": \"bone marrow (BMR)\", \"Canonical name\": \"bone marrow\"}",
                "{\"Referent\": \"corpus luteum (CLT)\", \"Canonical name\": \"corpus luteum\"}",
                "{\"Referent\": \"gonads (GON)\", \"Canonical name\": \"gonads\"}",
                "{\"Referent\": \"lactation (LAC)\", \"Canonical name\": \"lactation\"}",
                "{\"Referent\": \"lymph nodes (LYM)\", \"Canonical name\": \"lymph nodes\"}",
                "{\"Referent\": \"menopause (MENO)\", \"Canonical name\": \"menopause\"}",
                "{\"Referent\": \"menstrual cycle (MEN)\", \"Canonical name\": \"menstrual cycle\"}",
                "{\"Referent\": \"ovaries (OVX)\", \"Canonical name\": \"ovaries\"}",
                "{\"Referent\": \"pancreas (PAN)\", \"Canonical name\": \"pancreas\"}",
                "{\"Referent\": \"parathyroid gland (PAR)\", \"Canonical name\": \"parathyroid gland\"}",
                "{\"Referent\": \"pituitary gland (PIT)\", \"Canonical name\": \"pituitary gland\"}",
                "{\"Referent\": \"placenta (PLA)\", \"Canonical name\": \"placenta\"}",
                "{\"Referent\": \"pregnancy (PREG)\", \"Canonical name\": \"pregnancy\"}",
                "{\"Referent\": \"prostate gland (PRT)\", \"Canonical name\": \"prostate gland\"}",
                "{\"Referent\": \"spleen (SPL)\", \"Canonical name\": \"spleen\"}",
                "{\"Referent\": \"testes (TES)\", \"Canonical name\": \"testes\"}",
                "{\"Referent\": \"thymus gland (THY)\", \"Canonical name\": \"thymus gland\"}",
                "{\"Referent\": \"thyroid gland (THY)\", \"Canonical name\": \"thyroid gland\"}",
                "{\"Referent\": \"uterus (UTE)\", \"Canonical name\": \"uterus\"}",
                "{\"Referent\": \"vagina (VAG)\", \"Canonical name\": \"vagina\"}"
            ],
            "TP": 21,
            "FP": 0,
            "FN": 0
        }
    }
]