[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Somatostatin (SST)",
            "Vasopressin (AVP)",
            "Oxytocin (OXT)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neuropeptide Y (NPY)",
            "Prolactin-Releasing Peptide (PrRP)",
            "Galanin (GAL)",
            "Neurotensin (NTS)",
            "Secretin (SCT)",
            "Cholecystokinin (CCK)",
            "Ghrelin (GHRL)",
            "Peptide YY (PYY)",
            "Pancreatic Polypeptide (PPY)",
            "Adrenocorticotropic Hormone (ACTH)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Luteinizing Hormone-Releasing Hormone (LHRH)",
            "Parathyroid Hormone (PTH)",
            "Adiponectin",
            "Angiotensin II",
            "Erythropoietin (EPO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "Glucagon (GCG)",
                "Growth Hormone-Releasing Hormone (GHRH)",
                "Somatostatin (SST)",
                "Vasopressin (AVP)",
                "Oxytocin (OXT)",
                "Secretin (SCT)",
                "Ghrelin (GHRL)",
                "Peptide YY (PYY)",
                "Pancreatic Polypeptide (PPY)",
                "Adrenocorticotropic Hormone (ACTH)",
                "Melanocyte-Stimulating Hormone (MSH)",
                "Thyrotropin-Releasing Hormone (TRH)",
                "Parathyroid Hormone (PTH)",
                "Adiponectin",
                "Angiotensin II"
            ],
            "mismatches": [
                "Gastrin-Releasing Peptide (GRP)",
                "Neuropeptide Y (NPY)",
                "Prolactin-Releasing Peptide (PrRP)",
                "Galanin (GAL)",
                "Neurotensin (NTS)",
                "Cholecystokinin (CCK)",
                "Luteinizing Hormone-Releasing Hormone (LHRH)",
                "Erythropoietin (EPO)"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "C-Peptide",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Islet Amyloid Polypeptide",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Oxytocin",
                "Pancreatic Polypeptide",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Peptide PHI",
                "Peptide YY",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta-Lipotropin",
                "beta-MSH"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Adrenocorticotropic hormone (ACTH)",
            "Antidiuretic hormone (ADH)",
            "Cholecystokinin (CCK)",
            "Gastrin",
            "Glucagon",
            "Gonadotropin-releasing hormone (GnRH)",
            "Growth hormone-releasing hormone (GHRH)",
            "Growth hormone (GH)",
            "Luteinizing hormone (LH)",
            "Melanocyte-stimulating hormone (MSH)",
            "Oxytocin",
            "Parathyroid hormone (PTH)",
            "Prolactin",
            "Secretin",
            "Somatostatin",
            "Somatotropin",
            "Thyroid-stimulating hormone (TSH)",
            "Vasoactive intestinal peptide (VIP)",
            "Vasopressin",
            "Corticotropin",
            "Thymosin",
            "Erythropoietin",
            "Calcitonin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenocorticotropic hormone (ACTH)",
                "Calcitonin",
                "Corticotropin",
                "Gastrin",
                "Glucagon",
                "Gonadotropin-releasing hormone (GnRH)",
                "Growth hormone-releasing hormone (GHRH)",
                "Growth hormone (GH)",
                "Luteinizing hormone (LH)",
                "Melanocyte-stimulating hormone (MSH)",
                "Oxytocin",
                "Parathyroid hormone (PTH)",
                "Prolactin",
                "Secretin",
                "Somatostatin",
                "Vasoactive intestinal peptide (VIP)",
                "Vasopressin",
                "Thymosin"
            ],
            "mismatches": [
                "Antidiuretic hormone (ADH)",
                "Cholecystokinin (CCK)",
                "Somatotropin",
                "Thyroid-stimulating hormone (TSH)",
                "Erythropoietin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Menotropins",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Procalcitonin",
                "Proglucagon",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Terlipressin",
                "Thymalfasin",
                "Thymosin",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-Lipotropin",
                "beta-MSH"
            ],
            "TP": 18,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Somatostatin (SST)",
            "Adrenocorticotropic Hormone (ACTH)",
            "Thyroid-Stimulating Hormone (TSH)",
            "Luteinizing Hormone-Releasing Hormone (LHRH)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Prolactin-Releasing Hormone (PRH)",
            "Gastrin",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Motilin (MLN)",
            "Neuropeptide Y (NPY)",
            "Substance P (SP)",
            "Angiotensin II (ANG II)",
            "Bradykinin (BK)",
            "Endothelin (ET)",
            "Neurotensin (NTS)",
            "Calcitonin (CT)",
            "Parathyroid Hormone (PTH)",
            "Ghrelin",
            "Orexin (OX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Growth Hormone-Releasing Hormone",
                "Somatostatin",
                "Adrenocorticotropic Hormone",
                "Oxytocin",
                "Vasopressin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Motilin",
                "Angiotensin II",
                "Calcitonin",
                "Parathyroid Hormone",
                "Ghrelin"
            ],
            "mismatches": [
                "Thyroid-Stimulating Hormone",
                "Luteinizing Hormone-Releasing Hormone",
                "Gastrin",
                "Cholecystokinin",
                "Neuropeptide Y",
                "Substance P",
                "Bradykinin",
                "Endothelin",
                "Neurotensin",
                "Orexin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bombesin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Motilin",
                "Nafarelin",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Peptide YY",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta-Endorphin",
                "gamma-Endorphin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Somatostatin (SST)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Prolactin-Releasing Hormone (PRH)",
            "Prolactin-Inhibiting Hormone (PIH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Luteinizing Hormone-Releasing Hormone (LHRH)",
            "Follicle-Stimulating Hormone-Releasing Hormone (FSHRH)",
            "Cholecystokinin (CCK)",
            "Gastrin (GAS)",
            "Secretin (SEC)",
            "Motilin (MTL)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Endorphins (END)",
            "Enkephalins (ENK)",
            "Dynorphins (DYN)",
            "Oxycontin (OXT)",
            "Vasopressin (AVP)",
            "Atrial Natriuretic Peptide (ANP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Growth Hormone-Releasing Hormone",
                "Somatostatin",
                "Thyrotropin-Releasing Hormone",
                "Corticotropin-Releasing Hormone",
                "Prolactin-Releasing Hormone",
                "Gonadotropin-Releasing Hormone",
                "Gastrin",
                "Secretin",
                "Motilin",
                "Vasoactive Intestinal Peptide",
                "Vasopressin"
            ],
            "mismatches": [
                "Prolactin-Inhibiting Hormone",
                "Luteinizing Hormone-Releasing Hormone",
                "Follicle-Stimulating Hormone-Releasing Hormone",
                "Cholecystokinin",
                "Substance P",
                "Neuropeptide Y",
                "Endorphins",
                "Enkephalins",
                "Dynorphins",
                "Oxycontin",
                "Atrial Natriuretic Peptide"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Arginine Vasopressin",
                "Atrial Natriuretic Factor",
                "Brain Natriuretic Peptide",
                "Buserelin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Luteinizing Hormone",
                "Lypressin",
                "Motilin",
                "Natriuretic Peptides",
                "Pancreatic Polypeptide",
                "Peptide YY",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "gamma-Endorphin"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Adrenocorticotropic hormone (ACTH)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Calcitonin (CALCA)",
            "Parathyroid hormone (PTH)",
            "Gastrin (GAST)",
            "Cholecystokinin (CCK)",
            "Somatostatin (SST)",
            "Ghrelin (GHRL)",
            "Thyrotropin-releasing hormone (TRH)",
            "Corticotropin-releasing hormone (CRH)",
            "Growth hormone-releasing hormone (GHRH)",
            "Gonadotropin-releasing hormone (GnRH)",
            "Melanocyte-stimulating hormone (MSH)",
            "Prolactin-releasing peptide (PrRP)",
            "Neuropeptide Y (NPY)",
            "Endothelin (EDN1)",
            "Angiotensin (AGT)",
            "Atrial natriuretic peptide (ANP)",
            "Brain natriuretic peptide (BNP)",
            "Kisspeptin (KISS1)",
            "Motilin (MLN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Adrenocorticotropic Hormone",
                "Oxytocin",
                "Vasopressin",
                "Calcitonin",
                "Parathyroid Hormone",
                "Gastrins",
                "Somatostatin",
                "Ghrelin",
                "Thyrotropin-Releasing Hormone",
                "Corticotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Gonadotropin-Releasing Hormone",
                "Melanocyte-Stimulating Hormones",
                "Motilin",
                "Brain Natriuretic Peptide"
            ],
            "mismatches": [
                "Cholecystokinin",
                "Prolactin-releasing peptide",
                "Neuropeptide Y",
                "Endothelin",
                "Angiotensin",
                "Atrial natriuretic peptide",
                "Kisspeptin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Atrial Natriuretic Factor",
                "Brain Natriuretic Peptide",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Motilin",
                "Nafarelin",
                "Natriuretic Peptides",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Peptide YY",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta-MSH"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Somatostatin (SST)",
            "Vasopressin (AVP)",
            "Oxytocin (OXT)",
            "Adrenocorticotropic hormone (ACTH)",
            "Thyroid-stimulating hormone (TSH)",
            "Luteinizing hormone (LH)",
            "Follicle-stimulating hormone (FSH)",
            "Parathyroid hormone (PTH)",
            "Calcitonin (CALC)",
            "Cholecystokinin (CCK)",
            "Gastrin (GAST)",
            "Secretin (SECR)",
            "Neuropeptide Y (NPY)",
            "Substance P (SP)",
            "Atrial natriuretic peptide (ANP)",
            "Brain natriuretic peptide (BNP)",
            "Erythropoietin (EPO)",
            "Prolactin (PRL)",
            "Growth hormone-releasing hormone (GHRH)",
            "Corticotropin-releasing hormone (CRH)",
            "Angiotensin II (ANG II)",
            "Melanocyte-stimulating hormone (MSH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Somatostatin",
                "Vasopressin",
                "Oxytocin",
                "Adrenocorticotropic Hormone",
                "Luteinizing Hormone",
                "Follicle Stimulating Hormone",
                "Parathyroid Hormone",
                "Calcitonin",
                "Gastrins",
                "Secretin",
                "Atrial Natriuretic Factor",
                "Brain Natriuretic Peptide",
                "Prolactin",
                "Growth Hormone-Releasing Hormone",
                "Corticotropin-Releasing Hormone",
                "Angiotensin II",
                "Melanocyte-Stimulating Hormones"
            ],
            "mismatches": [
                "Thyroid-stimulating hormone (TSH)",
                "Cholecystokinin (CCK)",
                "Neuropeptide Y (NPY)",
                "Substance P (SP)",
                "Erythropoietin (EPO)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Atrial Natriuretic Factor",
                "Brain Natriuretic Peptide",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Natriuretic Peptides",
                "Oxytocin",
                "Pancreatic Polypeptide",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Peptide YY",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-Endorphin",
                "beta-Lipotropin",
                "beta-MSH",
                "gamma-Endorphin"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Growth Hormone (GH)",
            "Adrenocorticotropic Hormone (ACTH)",
            "Antidiuretic Hormone (ADH)",
            "Oxytocin (OT)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Follicle-stimulating Hormone (FSH)",
            "Luteinizing Hormone (LH)",
            "Thyroid-Stimulating Hormone (TSH)",
            "Prolactin (PRL)",
            "Melanocyte-stimulating Hormone (MSH)",
            "Endorphins",
            "Enkephalins",
            "Somatostatin (SST)",
            "Vasopressin (VP)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Parathyroid Hormone (PTH)",
            "Calcitonin (CT)",
            "Secretin",
            "Gastrin",
            "Cholecystokinin (CCK)",
            "Ghrelin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Growth Hormone",
                "Adrenocorticotropic Hormone",
                "Oxytocin",
                "Thyrotropin-Releasing Hormone",
                "Gonadotropin-Releasing Hormone",
                "Follicle Stimulating Hormone",
                "Luteinizing Hormone",
                "Prolactin",
                "Melanocyte-Stimulating Hormones",
                "Somatostatin",
                "Vasopressin",
                "Corticotropin-Releasing Hormone",
                "Parathyroid Hormone",
                "Calcitonin",
                "Secretin",
                "Ghrelin"
            ],
            "mismatches": [
                "Antidiuretic Hormone",
                "Thyroid-Stimulating Hormone",
                "Endorphins",
                "Enkephalins",
                "Gastrin",
                "Cholecystokinin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Arginine Vasopressin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Terlipressin",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "alpha-Endorphin",
                "beta Subunit Luteinizing Hormone",
                "beta-Endorphin",
                "beta-MSH",
                "gamma-Endorphin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin",
            "Glucagon",
            "Growth hormone",
            "Oxytocin",
            "Vasopressin",
            "Adrenocorticotropic hormone",
            "Thyroid-stimulating hormone",
            "Follicle-stimulating hormone",
            "Luteinizing hormone",
            "Prolactin",
            "Melanocyte-stimulating hormone",
            "Calcitonin",
            "Parathyroid hormone",
            "Adrenomedullin",
            "Erythropoietin",
            "Corticotropin-releasing hormone",
            "Gastrin",
            "Secretin",
            "Cholecystokinin",
            "Leptin",
            "Ghrelin",
            "Motilin",
            "Somatostatin",
            "Substance P"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Growth hormone",
                "Oxytocin",
                "Adrenocorticotropic hormone",
                "Follicle-stimulating hormone",
                "Luteinizing hormone",
                "Prolactin",
                "Melanocyte-stimulating hormone",
                "Calcitonin",
                "Parathyroid hormone",
                "Adrenomedullin",
                "Corticotropin-releasing hormone",
                "Secretin",
                "Leptin",
                "Ghrelin",
                "Motilin",
                "Somatostatin"
            ],
            "mismatches": [
                "Vasopressin",
                "Thyroid-stimulating hormone",
                "Erythropoietin",
                "Gastrin",
                "Cholecystokinin",
                "Substance P"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Adrenomedullin",
                "Buserelin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulins",
                "Leptin",
                "Long-Acting Insulin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Menotropins",
                "Motilin",
                "Nafarelin",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Pro-Opiomelanocortin",
                "Procalcitonin",
                "Proglucagon",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Terlipressin",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-Endorphin",
                "beta-Lipotropin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Growth Hormone (GH)",
            "Adrenocorticotropic Hormone (ACTH)",
            "Thyroid-Stimulating Hormone (TSH)",
            "Luteinizing Hormone (LH)",
            "Follicle-Stimulating Hormone (FSH)",
            "Prolactin (PRL)",
            "Beta-endorphin (EDN)",
            "Neuropeptide Y (NPY)",
            "Erythropoietin (EPO)",
            "Calcitonin",
            "Gastrin",
            "Cholecystokinin (CCK)",
            "Glucose-dependent Insulinotropic Peptide (GIP)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon-like Peptide-2 (GLP-2)",
            "Somatostatin (SST)",
            "Leptin (LEP)",
            "Ghrelin (GHR)",
            "Secretin (SCT)",
            "Amylin (AMY)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Oxytocin",
                "Vasopressin",
                "Growth Hormone",
                "Adrenocorticotropic Hormone",
                "Luteinizing Hormone",
                "Follicle-Stimulating Hormone",
                "Prolactin",
                "Calcitonin",
                "Somatostatin",
                "Leptin",
                "Ghrelin",
                "Secretin"
            ],
            "mismatches": [
                "Thyroid-Stimulating Hormone",
                "Beta-endorphin",
                "Neuropeptide Y",
                "Erythropoietin",
                "Gastrin",
                "Cholecystokinin",
                "Glucose-dependent Insulinotropic Peptide",
                "Glucagon-like Peptide-1",
                "Glucagon-like Peptide-2",
                "Amylin"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Arginine Vasopressin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Islet Amyloid Polypeptide",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Oxytocin",
                "Parathyroid Hormone",
                "Peptide YY",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "alpha-Endorphin",
                "beta Subunit Luteinizing Hormone",
                "beta-Endorphin",
                "beta-Lipotropin",
                "gamma-Lipotropin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Somatostatin (SST)",
            "Ghrelin",
            "Leptin",
            "Calcitonin (CALC)",
            "Parathyroid hormone (PTH)",
            "Growth hormone-releasing hormone (GHRH)",
            "Gonadotropin-releasing hormone (GnRH)",
            "Corticotropin-releasing hormone (CRH)",
            "Thyrotropin-releasing hormone (TRH)",
            "Melanocyte-stimulating hormone (MSH)",
            "Adrenocorticotropic hormone (ACTH)",
            "Follicle-stimulating hormone (FSH)",
            "Luteinizing hormone (LH)",
            "Thyroid-stimulating hormone (TSH)",
            "Angiotensin II",
            "Bradykinin",
            "Cholecystokinin (CCK)",
            "Gastrin",
            "Secretin",
            "Motilin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "Glucagon (GCG)",
                "Oxytocin (OXT)",
                "Vasopressin (AVP)",
                "Somatostatin (SST)",
                "Ghrelin",
                "Leptin",
                "Calcitonin (CALC)",
                "Parathyroid hormone (PTH)",
                "Growth hormone-releasing hormone (GHRH)",
                "Gonadotropin-releasing hormone (GnRH)",
                "Corticotropin-releasing hormone (CRH)",
                "Thyrotropin-releasing hormone (TRH)",
                "Melanocyte-stimulating hormone (MSH)",
                "Adrenocorticotropic hormone (ACTH)",
                "Follicle-stimulating hormone (FSH)",
                "Luteinizing hormone (LH)",
                "Angiotensin II",
                "Gastrin",
                "Secretin",
                "Motilin"
            ],
            "mismatches": [
                "Bradykinin",
                "Cholecystokinin (CCK)",
                "Thyroid-stimulating hormone (TSH)"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Buserelin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Motilin",
                "Nafarelin",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-MSH"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Somatostatin (SST)",
            "Thyroid-stimulating hormone (TSH)",
            "Adrenocorticotropic hormone (ACTH)",
            "Growth hormone (GH)",
            "Prolactin (PRL)",
            "Follicle-stimulating hormone (FSH)",
            "Luteinizing hormone (LH)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Calcitonin (CT)",
            "Parathyroid hormone (PTH)",
            "Atrial natriuretic peptide (ANP)",
            "Brain natriuretic peptide (BNP)",
            "Gastrin (GAST)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Motilin (MLN)",
            "Ghrelin (GHRL)",
            "Leptin (LEP)",
            "Neuropeptide Y (NPY)",
            "Substance P (SP)",
            "Vasoactive intestinal peptide (VIP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "Glucagon (GCG)",
                "Somatostatin (SST)",
                "Adrenocorticotropic hormone (ACTH)",
                "Growth hormone (GH)",
                "Prolactin (PRL)",
                "Follicle-stimulating hormone (FSH)",
                "Luteinizing hormone (LH)",
                "Oxytocin (OXT)",
                "Vasopressin (AVP)",
                "Calcitonin (CT)",
                "Parathyroid hormone (PTH)",
                "Brain natriuretic peptide (BNP)",
                "Secretin (SCT)",
                "Motilin (MLN)",
                "Ghrelin (GHRL)",
                "Leptin (LEP)",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "mismatches": [
                "Thyroid-stimulating hormone (TSH)",
                "Atrial natriuretic peptide (ANP)",
                "Gastrin (GAST)",
                "Cholecystokinin (CCK)",
                "Neuropeptide Y (NPY)",
                "Substance P (SP)"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Arginine Vasopressin",
                "Atrial Natriuretic Factor",
                "Brain Natriuretic Peptide",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Motilin",
                "Nafarelin",
                "Natriuretic Peptides",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Peptide YY",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-Endorphin",
                "gamma-Endorphin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Somatostatin (SST)",
            "Ghrelin (GHRL)",
            "Leptin (LEP)",
            "Adiponectin (ADIPOQ)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Angiotensin II (AGT)",
            "Bradykinin (BK)",
            "Calcitonin (CALCA)",
            "Parathyroid Hormone (PTH)",
            "Thyroid-Stimulating Hormone (TSH)",
            "Follicle-Stimulating Hormone (FSH)",
            "Luteinizing Hormone (LH)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Prolactin-Releasing Hormone (PRH)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Gastrin (GAST)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin (INS)",
                "Glucagon (GCG)",
                "Somatostatin (SST)",
                "Ghrelin (GHRL)",
                "Leptin (LEP)",
                "Adiponectin (ADIPOQ)",
                "Oxytocin (OXT)",
                "Vasopressin (AVP)",
                "Angiotensin II (AGT)",
                "Calcitonin (CALCA)",
                "Parathyroid Hormone (PTH)",
                "Follicle-Stimulating Hormone (FSH)",
                "Luteinizing Hormone (LH)",
                "Growth Hormone-Releasing Hormone (GHRH)",
                "Corticotropin-Releasing Hormone (CRH)",
                "Gonadotropin-Releasing Hormone (GnRH)",
                "Thyrotropin-Releasing Hormone (TRH)",
                "Secretin (SCT)"
            ],
            "mismatches": [
                "Bradykinin (BK)",
                "Thyroid-Stimulating Hormone (TSH)",
                "Prolactin-Releasing Hormone (PRH)",
                "Melanocyte-Stimulating Hormone (MSH)",
                "Gastrin (GAST)",
                "Cholecystokinin (CCK)"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bombesin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-MSH"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Insulin (INS)",
            "Glucagon (GCG)",
            "Adrenocorticotropic hormone (ACTH)",
            "Thyroid-stimulating hormone (TSH)",
            "Follicle-stimulating hormone (FSH)",
            "Luteinizing hormone (LH)",
            "Growth hormone (GH)",
            "Prolactin (PRL)",
            "Antidiuretic hormone (ADH)",
            "Oxytocin (OXT)",
            "Parathyroid hormone (PTH)",
            "Calcitonin (CT)",
            "Ghrelin (GHRL)",
            "Leptin (LEP)",
            "Cholecystokinin (CCK)",
            "Gastrin (GAS)",
            "Secretin (SCT)",
            "Motilin (MOT)",
            "Vasoactive intestinal peptide (VIP)",
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Somatostatin (SST)",
            "Corticotropin-releasing hormone (CRH)",
            "Thyrotropin-releasing hormone (TRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Insulin",
                "Glucagon",
                "Adrenocorticotropic Hormone",
                "Follicle Stimulating Hormone",
                "Luteinizing Hormone",
                "Growth Hormone",
                "Prolactin",
                "Oxytocin",
                "Parathyroid Hormone",
                "Calcitonin",
                "Ghrelin",
                "Leptin",
                "Gastrins",
                "Secretin",
                "Motilin",
                "Vasoactive Intestinal Peptide",
                "Somatostatin",
                "Corticotropin-Releasing Hormone",
                "Thyrotropin-Releasing Hormone"
            ],
            "mismatches": [
                "Thyroid-stimulating hormone",
                "Antidiuretic hormone",
                "Cholecystokinin",
                "Substance P",
                "Neuropeptide Y"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Follicle Stimulating Hormone",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Glucagon",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Follicle Stimulating Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulin Glargine",
                "Insulins",
                "Leptin",
                "Luteinizing Hormone",
                "Lypressin",
                "Motilin",
                "Nafarelin",
                "Ornipressin",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Peptide YY",
                "Procalcitonin",
                "Proglucagon",
                "Proinsulin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Terlipressin",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta Subunit Luteinizing Hormone",
                "beta-Endorphin",
                "gamma-Endorphin"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Adrenocorticotropic hormone (ACTH)",
            "Angiotensin-converting enzyme inhibitor (ACEI)",
            "Antidiuretic hormone (ADH)",
            "Bombesin",
            "Calcitonin",
            "Cholecystokinin (CCK)",
            "Corticotropin-releasing factor (CRF)",
            "Endorphin",
            "Gastrin",
            "Growth hormone",
            "Insulin",
            "Leptin",
            "Melanocyte-stimulating hormone (MSH)",
            "Melatonin",
            "Oxytocin",
            "Parathyroid hormone (PTH)",
            "Prolactin",
            "Somatostatin",
            "Thyroid-stimulating hormone (TSH)",
            "Vasopressin",
            "Vasoactive intestinal peptide (VIP)",
            "Vitamin D-binding protein"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenocorticotropic hormone (ACTH)",
                "Bombesin",
                "Calcitonin",
                "Growth hormone",
                "Insulin",
                "Leptin",
                "Oxytocin",
                "Parathyroid hormone (PTH)",
                "Prolactin",
                "Somatostatin",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "mismatches": [
                "Angiotensin-converting enzyme inhibitor (ACEI)",
                "Antidiuretic hormone (ADH)",
                "Cholecystokinin (CCK)",
                "Corticotropin-releasing factor (CRF)",
                "Endorphin",
                "Gastrin",
                "Melanocyte-stimulating hormone (MSH)",
                "Melatonin",
                "Thyroid-stimulating hormone (TSH)",
                "Vasopressin",
                "Vitamin D-binding protein"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Gastric Inhibitory Polypeptide",
                "Gastrins",
                "Ghrelin",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulins",
                "Leptin",
                "Long-Acting Insulin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Oxytocin",
                "Parathyroid Hormone",
                "Parathyroid Hormone-Related Protein",
                "Procalcitonin",
                "Prolactin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Terlipressin",
                "Thyrotropin",
                "Thyrotropin Alfa",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 11,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            "Adiponectin (ADIPOQ)",
            "Angiotensinogen (AGT)",
            "Atrial natriuretic peptide (ANP)",
            "Brain natriuretic peptide (BNP)",
            "Calcitonin (CALCA)",
            "Cortistatin (CORT)",
            "Ghrelin (GHRL)",
            "Growth hormone-releasing hormone (GHRH)",
            "Insulin (INS)",
            "Motilin (MLN)",
            "Neuromedin U (NMU)",
            "Neuropeptide Y (NPY)",
            "Oxytocin (OXT)",
            "Pancreatic polypeptide (PP)",
            "Peptide YY (PYY)",
            "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
            "Secretin (SCT)",
            "Somatostatin (SST)",
            "Thyrotropin-releasing hormone (TRH)",
            "Vasoactive intestinal peptide (VIP)",
            "Vasopressin (AVP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adiponectin",
                "Brain natriuretic peptide",
                "Calcitonin",
                "Ghrelin",
                "Growth hormone-releasing hormone",
                "Insulin",
                "Motilin",
                "Oxytocin",
                "Pancreatic polypeptide",
                "Peptide YY",
                "Secretin",
                "Somatostatin",
                "Thyrotropin-releasing hormone",
                "Vasoactive intestinal peptide"
            ],
            "mismatches": [
                "Angiotensinogen (AGT)",
                "Atrial natriuretic peptide (ANP)",
                "Cortistatin (CORT)",
                "Neuromedin U (NMU)",
                "Neuropeptide Y (NPY)",
                "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
                "Vasopressin (AVP)"
            ],
            "true_referents": [
                "Adipokines",
                "Adiponectin",
                "Angiotensin I",
                "Angiotensin III",
                "Angiotensins",
                "Arginine Vasopressin",
                "Atrial Natriuretic Factor",
                "Brain Natriuretic Peptide",
                "C-Peptide",
                "Calcitonin",
                "Cosyntropin",
                "Gastric Inhibitory Polypeptide",
                "Ghrelin",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone",
                "Growth Hormone-Releasing Hormone",
                "Human Growth Hormone",
                "Insulin",
                "Insulins",
                "Islet Amyloid Polypeptide",
                "Leptin",
                "Lypressin",
                "Motilin",
                "Nafarelin",
                "Natriuretic Peptides",
                "Oxytocin",
                "Pancreatic Polypeptide",
                "Parathyroid Hormone",
                "Peptide PHI",
                "Peptide YY",
                "Pituitary Gonadotropins",
                "Pituitary Hormones",
                "Procalcitonin",
                "Proinsulin",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Thyrotropin",
                "Thyrotropin-Releasing Hormone",
                "Urofollitropin",
                "Urotensins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins"
            ],
            "TP": 14,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "peptide hormone",
        "domain": "biology",
        "response": [
            [
                "Referent",
                "Angiotensin II"
            ],
            [
                "Referent",
                "Calcitonin"
            ],
            [
                "Referent",
                "Insulin"
            ],
            [
                "Referent",
                "Oxytocin"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Angiotensin II",
                "Calcitonin",
                "Insulin",
                "Oxytocin"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Calcitonin",
                "Cosyntropin",
                "Human Regular Insulin",
                "Insulin",
                "Insulins",
                "Oxytocin",
                "Parathyroid Hormone",
                "Procalcitonin"
            ],
            "TP": 4,
            "FP": 0,
            "FN": 0
        }
    }
]