[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Neuropeptide Y (NPY)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Somatostatin (SST)",
            "Enkephalin",
            "Substance P",
            "Dynorphin",
            "Galanin",
            "Neurotensin",
            "Cholecystokinin (CCK)",
            "Orexin (Hypocretin)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neurotrophins",
            "Corticotropin-Releasing Factor (CRF)",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide Y Receptor Agonists",
            "Tachykinins",
            "Angiotensin II",
            "Galanin-like Peptide (GALP)",
            "Neuropeptide W (NPW)",
            "Neuropeptide S (NPS)",
            "Opioid Peptides",
            "Tachykinin Peptides",
            "Tachykinin Receptor Antagonists",
            "Galanin Peptides"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuropeptide Y (NPY)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Somatostatin (SST)",
                "Substance P",
                "Dynorphin",
                "Galanin",
                "Neurotensin",
                "Gastrin-Releasing Peptide (GRP)",
                "Tachykinins",
                "Angiotensin II",
                "Galanin-like Peptide (GALP)",
                "Opioid Peptides"
            ],
            "mismatches": [
                "Enkephalin",
                "Cholecystokinin (CCK)",
                "Orexin (Hypocretin)",
                "Neurotrophins",
                "Corticotropin-Releasing Factor (CRF)",
                "Neuropeptide FF (NPFF)",
                "Neuropeptide Y Receptor Agonists",
                "Neuropeptide W (NPW)",
                "Neuropeptide S (NPS)",
                "Tachykinin Peptides",
                "Tachykinin Receptor Antagonists",
                "Galanin Peptides"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bombesin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Opioid Peptides",
                "Orexins",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "alpha-Endorphin"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Vasopressin (AVP)",
            "Oxytocin (OXT)",
            "Neurotensin (NT)",
            "Galanin (GAL)",
            "Bombesin (BBS)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Cholecystokinin (CCK)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neuropeptide Y (NPY)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Somatostatin (SST)",
            "Angiotensin II (Ang II)",
            "Dynorphin (DYN)",
            "Enkephalin (ENK)",
            "Endorphin (END)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Gastrin (GAS)",
            "Motilin (MTL)",
            "Pituitary Adenylate Cyclase-Activating Peptide (PACAP)",
            "Urocortin (Ucn)",
            "Islet-1 Neuronal Differentiation Factor (ISL1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Vasopressin",
                "Neurotensin",
                "Galanin",
                "Bombesin",
                "Neurokinin A",
                "Neurokinin B",
                "Vasoactive Intestinal Peptide",
                "Gastrin-Releasing Peptide",
                "Neuropeptide Y",
                "Corticotropin-Releasing Hormone",
                "Somatostatin",
                "Angiotensin II",
                "Dynorphins",
                "Endorphins",
                "Calcitonin Gene-Related Peptide",
                "Gastrins",
                "Motilin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Urocortins"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Islet-1 Neuronal Differentiation Factor"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Methionine Enkephalin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Urocortins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Endorphin"
            ],
            "TP": 20,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neurotensin (NT)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Bradykinin (BK)",
            "Cholecystokinin (CCK)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neuropeptide Y (NPY)",
            "Somatostatin (SST)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Insulin-like Growth Factor I (IGF-I)",
            "Insulin-like Growth Factor II (IGF-II)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Proopiomelanocortin (POMC)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Vasoactive Intestinal Polypeptide (VIP)",
            "Endothelin-1 (ET-1)",
            "Endothelin-2 (ET-2)",
            "Endothelin-3 (ET-3)",
            "Neuropeptide FF (NPFF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neurotensin",
                "Vasopressin",
                "Bradykinin",
                "Gastrin-Releasing Peptide",
                "Neuropeptide Y",
                "Somatostatin",
                "Corticotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Melanocyte-Stimulating Hormone",
                "Neurokinin A",
                "Neurokinin B",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pro-Opiomelanocortin",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Insulin-like Growth Factor I",
                "Insulin-like Growth Factor II",
                "Endothelin-1",
                "Endothelin-2",
                "Endothelin-3",
                "Neuropeptide FF"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensin III",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Lypressin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Pro-Opiomelanocortin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Lipotropin",
                "beta-MSH"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Somatostatin (SST)",
            "Vasopressin (AVP)",
            "Oxytocin (OT)",
            "Endorphins (END)",
            "Enkephalins (ENK)",
            "Dynorphins (DYN)",
            "Cholecystokinin (CCK)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neurotensin (NT)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Corticotropin-Releasing Factor (CRF)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Prolactin-Releasing Hormone (PRH)",
            "Melanin-Concentrating Hormone (MCH)",
            "Orexin A (ORX-A)",
            "Orexin B (ORX-B)",
            "Neuropeptide FF (NPFF)",
            "Seminal Plasma Protein 1 (SPP1)",
            "Pituitary Adenylate-Cyclizing Polypeptide (PACAP)",
            "Motilin (MTL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Somatostatin",
                "Vasopressin",
                "Endorphins",
                "Enkephalins",
                "Dynorphins",
                "Gastrin-Releasing Peptide",
                "Neurotensin",
                "Vasoactive Intestinal Peptide",
                "Thyrotropin-Releasing Hormone",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Prolactin-Releasing Hormone",
                "Orexins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Motilin"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Corticotropin-Releasing Factor",
                "Melanin-Concentrating Hormone",
                "Neuropeptide FF",
                "Seminal Plasma Protein 1"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Arginine Vasopressin",
                "Buserelin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Ornipressin",
                "Pancreatic Polypeptide",
                "Peptide PHI",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Sermorelin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Neuropeptide Y (NPY)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Galanin",
            "Endorphins",
            "Enkephalins",
            "Dynorphins",
            "Somatostatin",
            "Neurotensin",
            "Oxytocin",
            "Vasopressin",
            "Cholecystokinin (CCK)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neuropeptide FF (NPFF)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Melanin-Concentrating Hormone (MCH)",
            "Orexin (Hypocretin)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Bombesin",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Prolactin-Releasing Peptide (PrRP)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Vasoactive Intestinal Peptide",
                "Neuropeptide Y",
                "Calcitonin Gene-Related Peptide",
                "Galanin",
                "Endorphins",
                "Enkephalins",
                "Dynorphins",
                "Somatostatin",
                "Neurotensin",
                "Gastrin-Releasing Peptide",
                "Corticotropin-Releasing Hormone",
                "Orexins",
                "Neurokinin A",
                "Neurokinin B",
                "Bombesin",
                "Thyrotropin-Releasing Hormone",
                "Pituitary Adenylate Cyclase-Activating Polypeptide"
            ],
            "mismatches": [
                "Oxytocin",
                "Vasopressin",
                "Cholecystokinin (CCK)",
                "Neuropeptide FF (NPFF)",
                "Melanin-Concentrating Hormone (MCH)",
                "Prolactin-Releasing Peptide (PrRP)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Terlipressin",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-MSH"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Somatostatin (SST)",
            "Cholecystokinin (CCK)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Enkephalins (ENK)",
            "Endorphins (END)",
            "Neurotensin (NT)",
            "Galanin (GAL)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Brain-Derived Neurotrophic Factor (BDNF)",
            "Glucagon-Like Peptide-1 (GLP-1)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Angiotensin II (Ang II)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Prolactin-Releasing Peptide (PrRP)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Insulin (INS)",
            "Adrenocorticotropic Hormone (ACTH)",
            "Ghrelin (GHRL)",
            "Nerve Growth Factor (NGF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Vasoactive Intestinal Peptide",
                "Calcitonin Gene-Related Peptide",
                "Somatostatin",
                "Vasopressin",
                "Enkephalins",
                "Endorphins",
                "Neurotensin",
                "Galanin",
                "Corticotropin-Releasing Hormone",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Angiotensin II",
                "Neurokinin A",
                "Neurokinin B",
                "Thyrotropin-Releasing Hormone",
                "Adrenocorticotropic Hormone"
            ],
            "mismatches": [
                "Cholecystokinin",
                "Oxytocin",
                "Brain-Derived Neurotrophic Factor",
                "Glucagon-Like Peptide-1",
                "Prolactin-Releasing Peptide",
                "Insulin",
                "Ghrelin",
                "Nerve Growth Factor"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocortins",
                "Methionine Enkephalin",
                "Motilin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Pancreatic Polypeptide",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Endorphin",
                "gamma-Lipotropin"
            ],
            "TP": 17,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Endorphins (END)",
            "Enkephalins (ENK)",
            "Dynorphins (DYN)",
            "Substance P (SP)",
            "Neurotensin (NT)",
            "Cholecystokinin (CCK)",
            "Vasopressin (VP)",
            "Oxytocin (OT)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Somatostatin (SST)",
            "Vasoactive Intestinal Polypeptide (VIP)",
            "Neuropeptide Y (NPY)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Melanocyte Stimulating Hormone (MSH)",
            "Adrenocorticotropic Hormone (ACTH)",
            "Bradykinin (BK)",
            "Angiotensin II (ANG II)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Neuromedin U (NMU)",
            "Neuromedin B (NMB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Endorphins",
                "Enkephalins",
                "Dynorphins",
                "Substance P",
                "Neurotensin",
                "Vasopressin",
                "Corticotropin-Releasing Hormone",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Thyrotropin-Releasing Hormone",
                "Somatostatin",
                "Vasoactive Intestinal Peptide",
                "Neuropeptide Y",
                "Neurokinin A",
                "Neurokinin B",
                "Melanocyte-Stimulating Hormones",
                "Adrenocorticotropic Hormone",
                "Bradykinin",
                "Angiotensin II",
                "Calcitonin Gene-Related Peptide"
            ],
            "mismatches": [
                "Cholecystokinin",
                "Oxytocin",
                "Neuromedin U",
                "Neuromedin B"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurophysins",
                "Neurotensin",
                "Nociceptin",
                "Pro-Opiomelanocortin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Endorphin",
            "Oxytocin",
            "Vasopressin",
            "Insulin",
            "Glucagon",
            "Ghrelin",
            "Leptin",
            "Neuropeptide Y",
            "Substance P",
            "Enkephalin",
            "Dynorphin",
            "Cholecystokinin",
            "Neurotensin",
            "Corticotropin-releasing hormone",
            "Angiotensin",
            "Gastrin",
            "Motilin",
            "Bombesin",
            "Neurokinin A",
            "Neurokinin B",
            "Neurotensin",
            "Somatostatin",
            "Thyrotropin-releasing hormone",
            "Vasoactive intestinal peptide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuropeptide Y",
                "Substance P",
                "Neurotensin",
                "Corticotropin-releasing hormone",
                "Gastrin",
                "Motilin",
                "Bombesin",
                "Neurokinin A",
                "Neurokinin B",
                "Somatostatin",
                "Thyrotropin-releasing hormone",
                "Vasoactive intestinal peptide"
            ],
            "mismatches": [
                "Endorphin",
                "Oxytocin",
                "Vasopressin",
                "Insulin",
                "Glucagon",
                "Ghrelin",
                "Leptin",
                "Enkephalin",
                "Dynorphin",
                "Cholecystokinin",
                "Angiotensin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bombesin",
                "Buserelin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Methionine Enkephalin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Terlipressin",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Lipotropin",
                "gamma-Lipotropin"
            ],
            "TP": 12,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Vasopressin (AVP)",
            "Oxytocin (OXT)",
            "Enkephalin",
            "Endorphin",
            "Galanin",
            "Somatostatin",
            "Cholecystokinin (CCK)",
            "Neurotensin",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Dynorphin",
            "Corticotropin-Releasing Factor (CRF)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Bombesin",
            "Kisspeptin",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Nociceptin",
            "Bradykinin",
            "FMRFamide",
            "Substance K"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Vasopressin",
                "Enkephalin",
                "Endorphin",
                "Galanin",
                "Somatostatin",
                "Neurotensin",
                "Calcitonin Gene-Related Peptide",
                "Dynorphin",
                "Neurokinin A",
                "Neurokinin B",
                "Bombesin",
                "Kisspeptin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Vasoactive Intestinal Peptide",
                "Nociceptin",
                "Bradykinin",
                "FMRFamide"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Corticotropin-Releasing Factor",
                "Substance K"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bombesin",
                "Bradykinin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "FMRFamide",
                "Felypressin",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Lypressin",
                "Methionine Enkephalin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Nociceptin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin"
            ],
            "TP": 19,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Neuropeptide Y (NPY)",
            "Somatostatin (SST)",
            "Cholecystokinin (CCK)",
            "Enkephalin",
            "Dynorphin",
            "Beta-Endorphin",
            "Oxytocin",
            "Vasopressin",
            "Corticotropin-Releasing Hormone (CRH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Neurotensin",
            "Galanin",
            "Bradykinin",
            "Neurokinin A",
            "Neurokinin B",
            "Orexin",
            "Melanin-Concentrating Hormone (MCH)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Cocaine and Amphetamine Regulated Transcript (CART)",
            "Kisspeptin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P (SP)",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Neuropeptide Y (NPY)",
                "Somatostatin (SST)",
                "Dynorphin",
                "Corticotropin-Releasing Hormone (CRH)",
                "Thyrotropin-Releasing Hormone (TRH)",
                "Gonadotropin-Releasing Hormone (GnRH)",
                "Neurotensin",
                "Galanin",
                "Bradykinin",
                "Neurokinin A",
                "Neurokinin B",
                "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
                "Kisspeptin"
            ],
            "mismatches": [
                "Cholecystokinin (CCK)",
                "Enkephalin",
                "Beta-Endorphin",
                "Oxytocin",
                "Vasopressin",
                "Orexin",
                "Melanin-Concentrating Hormone (MCH)",
                "Cocaine and Amphetamine Regulated Transcript (CART)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Bombesin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Hypothalamic Hormones",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin-Releasing Hormone",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Terlipressin",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Somatostatin (SST)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Galanin (GAL)",
            "Cholecystokinin (CCK)",
            "Neurotensin (NT)",
            "Corticotropin-Releasing Factor (CRF)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Enkephalins",
            "Endorphins",
            "Dynorphins",
            "Orexins (Hypocretins)",
            "Melanin-Concentrating Hormone (MCH)",
            "Cocaine- and Amphetamine-Regulated Transcript (CART)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Neuropeptide S (NPS)",
            "Kisspeptin (KP)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Vasoactive Intestinal Peptide",
                "Somatostatin",
                "Calcitonin Gene-Related Peptide",
                "Galanin",
                "Neurotensin",
                "Thyrotropin-Releasing Hormone",
                "Gonadotropin-Releasing Hormone",
                "Vasopressin",
                "Enkephalins",
                "Endorphins",
                "Dynorphins",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Kisspeptins",
                "Neurokinin A",
                "Neurokinin B"
            ],
            "mismatches": [
                "Cholecystokinin (CCK)",
                "Corticotropin-Releasing Factor (CRF)",
                "Oxytocin (OXT)",
                "Orexins (Hypocretins)",
                "Melanin-Concentrating Hormone (MCH)",
                "Neuropeptide S (NPS)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Hypothalamic Hormones",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin-Releasing Hormone",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-MSH"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Endorphin (e.g. \u03b2-endorphin)",
            "Enkephalin (e.g. Met-enkephalin, Leu-enkephalin)",
            "Dynorphin (e.g. Dynorphin A, Dynorphin B)",
            "Substance P",
            "Neurotensin",
            "Somatostatin",
            "Cholecystokinin (CCK)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Neuropeptide Y (NPY)",
            "Galanin",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Oxytocin",
            "Vasopressin",
            "Angiotensin",
            "Bradykinin",
            "Glucagon",
            "Insulin",
            "Leptin",
            "Ghrelin",
            "Orexin (Hypocretin)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Gonadotropin-Releasing Hormone (GnRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neurotensin",
                "Somatostatin",
                "Vasoactive Intestinal Peptide",
                "Neuropeptide Y",
                "Galanin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Bradykinin",
                "Orexin",
                "Melanocyte-Stimulating Hormone",
                "Gonadotropin-Releasing Hormone"
            ],
            "mismatches": [
                "Endorphin (e.g. \u03b2-endorphin)",
                "Enkephalin (e.g. Met-enkephalin, Leu-enkephalin)",
                "Dynorphin (e.g. Dynorphin A, Dynorphin B)",
                "Cholecystokinin (CCK)",
                "Oxytocin",
                "Vasopressin",
                "Angiotensin",
                "Glucagon",
                "Insulin",
                "Leptin",
                "Ghrelin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Ala(2)-MePhe(4)-Gly(5)- Enkephalin",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bombesin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "D-Ala(2),MePhe(4),Met(0)-ol-enkephalin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Terlipressin",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-Lipotropin",
                "beta-MSH",
                "gamma-Lipotropin"
            ],
            "TP": 12,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Acetylcholine (ACh)",
            "Adenosine",
            "Adrenaline (Epinephrine)",
            "Angiotensin II",
            "Arginine Vasopressin (AVP)",
            "Cholecystokinin (CCK)",
            "Dopamine",
            "Endorphins",
            "Gamma-Aminobutyric Acid (GABA)",
            "Gastrin",
            "Ghrelin",
            "Glutamate",
            "Glycine",
            "Histamine",
            "Insulin",
            "Melatonin",
            "Noradrenaline (Norepinephrine)",
            "Neuropeptide Y (NPY)",
            "Nitric Oxide (NO)",
            "Oxytocin",
            "Serotonin (5-Hydroxytryptamine, 5-HT)",
            "Substance P",
            "Thyroid-Stimulating Hormone (TSH)",
            "Vasoactive Intestinal Peptide (VIP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Angiotensin II",
                "Arginine Vasopressin",
                "Endorphins",
                "Gastrin",
                "Neuropeptide Y",
                "Substance P",
                "Vasoactive Intestinal Peptide"
            ],
            "mismatches": [
                "Acetylcholine (ACh)",
                "Adenosine",
                "Adrenaline (Epinephrine)",
                "Cholecystokinin (CCK)",
                "Dopamine",
                "Gamma-Aminobutyric Acid (GABA)",
                "Ghrelin",
                "Glutamate",
                "Glycine",
                "Histamine",
                "Insulin",
                "Melatonin",
                "Noradrenaline (Norepinephrine)",
                "Nitric Oxide (NO)",
                "Oxytocin",
                "Serotonin (5-Hydroxytryptamine, 5-HT)",
                "Thyroid-Stimulating Hormone (TSH)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Ala(2)-MePhe(4)-Gly(5)- Enkephalin",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Carnosine",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "D-Penicillamine (2,5)- Enkephalin",
                "Deamino Arginine Vasopressin",
                "Dynorphins",
                "Endorphins",
                "Galanin",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Growth Hormone-Releasing Hormone",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-Lipotropin",
                "gamma-Endorphin"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Neurotransmitter (NT)",
            "Acetylcholine (ACh)",
            "Dopamine",
            "Serotonin",
            "Norepinephrine",
            "GABA (Gamma-Aminobutyric Acid)",
            "Glutamate",
            "Aspartate",
            "Enkephalin",
            "Endorphin",
            "Substance P",
            "Vasoactive Intestinal Peptide (VIP)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Neuromedin U",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Neuropeptide Y (NPY)",
            "Cholecystokinin (CCK)",
            "Somatostatin",
            "Insulin",
            "Glucagon",
            "Adrenocorticotropic Hormone (ACTH)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Growth Hormone-Releasing Hormone (GHRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Enkephalin",
                "Endorphin",
                "Substance P",
                "Vasoactive Intestinal Peptide",
                "Calcitonin Gene-Related Peptide",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Neuropeptide Y",
                "Somatostatin",
                "Adrenocorticotropic Hormone",
                "Melanocyte-Stimulating Hormone",
                "Thyrotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone"
            ],
            "mismatches": [
                "Neurotransmitter (NT)",
                "Acetylcholine (ACh)",
                "Dopamine",
                "Serotonin",
                "Norepinephrine",
                "GABA (Gamma-Aminobutyric Acid)",
                "Glutamate",
                "Aspartate",
                "Neuromedin U",
                "Cholecystokinin (CCK)",
                "Insulin",
                "Glucagon"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Carnosine",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "D-Penicillamine (2,5)- Enkephalin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurophysins",
                "Neurotensin",
                "Peptide PHI",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-Lipotropin",
                "beta-MSH",
                "gamma-Endorphin"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Neuropeptide Y (NPY)",
            "Substance P",
            "Vasoactive intestinal peptide (VIP)",
            "Calcitonin gene-related peptide (CGRP)",
            "Neuromedin U",
            "Gastrin-releasing peptide (GRP)",
            "Somatostatin",
            "Motilin",
            "Secretin",
            "Gastrin",
            "Cholecystokinin (CCK)",
            "Ghrelin",
            "Oxytocin",
            "Vasopressin",
            "Neurotensin",
            "Angiotensin",
            "Bradykinin",
            "Kisspeptin",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide VF (NPVF)",
            "Hemokinin-1",
            "Neuromedin S",
            "Neuromedin K"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuropeptide Y (NPY)",
                "Substance P",
                "Vasoactive intestinal peptide (VIP)",
                "Calcitonin gene-related peptide (CGRP)",
                "Gastrin-releasing peptide (GRP)",
                "Somatostatin",
                "Motilin",
                "Secretin",
                "Gastrin",
                "Vasopressin",
                "Neurotensin",
                "Bradykinin",
                "Kisspeptin"
            ],
            "mismatches": [
                "Neuromedin U",
                "Cholecystokinin (CCK)",
                "Ghrelin",
                "Oxytocin",
                "Neuropeptide FF (NPFF)",
                "Neuropeptide VF (NPVF)",
                "Hemokinin-1",
                "Neuromedin S",
                "Neuromedin K"
            ],
            "true_referents": [
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bradykinin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cosyntropin",
                "Dynorphins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Lypressin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurophysins",
                "Neurotensin",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Terlipressin",
                "Vasoactive Intestinal Peptide",
                "Vasopressins"
            ],
            "TP": 13,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Acetylcholine",
            "Adrenocorticotropic hormone",
            "Angiotensin II",
            "Arginine vasopressin",
            "Corticotropin-releasing hormone",
            "Endorphin",
            "Epinephrine",
            "Glucagon",
            "Growth hormone-releasing hormone",
            "Insulin",
            "Leptin",
            "Oxytocin",
            "Parathyroid hormone",
            "Prolactin",
            "Prostaglandin",
            "Prostaglandin E2",
            "Serotonin",
            "Thyrotropin-releasing hormone",
            "Thyroxine",
            "Vasopressin",
            "Vasopressin",
            "Vasopressin",
            "Vasopressin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenocorticotropic hormone",
                "Angiotensin II",
                "Arginine vasopressin",
                "Corticotropin-releasing hormone",
                "Growth hormone-releasing hormone",
                "Thyrotropin-releasing hormone",
                "Vasopressin"
            ],
            "mismatches": [
                "Acetylcholine",
                "Endorphin",
                "Epinephrine",
                "Glucagon",
                "Insulin",
                "Leptin",
                "Oxytocin",
                "Parathyroid hormone",
                "Prolactin",
                "Prostaglandin",
                "Prostaglandin E2",
                "Serotonin",
                "Thyroxine"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Deamino Arginine Vasopressin",
                "Endorphins",
                "Galanin",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Hypothalamic Hormones",
                "Lypressin",
                "Melanocortins",
                "Neurokinin A",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Substance P",
                "Terlipressin",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Lipotropin",
                "gamma-Lipotropin"
            ],
            "TP": 7,
            "FP": 13,
            "FN": 0
        }
    }
]