[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Vasoactive Intestinal Peptide (VIP)",
            "Somatostatin (SS)",
            "Neuropeptide Y (NPY)",
            "Opioid Peptides (Endorphins)",
            "Prolactin-Releasing Peptide (PrRP)",
            "Galanin (GAL)",
            "Cholecystokinin (CCK)",
            "Neuropeptide W (NPW)",
            "Neuropeptide FF (NPFF)",
            "Neurotensin (NT)",
            "Tachykinins (Substance P)",
            "Dynorphin",
            "Satiety Peptide (Peptide YY, PYY)",
            "Hunger Peptide (Ghrelin)",
            "Melanin-Concentrating Hormone (MCH)",
            "Corticotropin-Releasing Factor (CRF)",
            "Tachykinin-Related Peptide (TRP)",
            "Neuropeptide S (NPS)",
            "Cocaine- and Amphetamine-Regulated Transcript (CART)",
            "Galanin-like Peptide (GALP)",
            "Neuropeptide B (NPB)",
            "Neuropeptide K (NPK)",
            "Neuropeptide W (NPW)",
            "Tachykinin (Neurokinin A)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Vasoactive Intestinal Peptide",
                "Somatostatin",
                "Neuropeptide Y",
                "Opioid Peptides",
                "Galanin",
                "Neurotensin",
                "Tachykinins",
                "Dynorphins",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Galanin-Like Peptide"
            ],
            "mismatches": [
                "Prolactin-Releasing Peptide (PrRP)",
                "Cholecystokinin (CCK)",
                "Neuropeptide W (NPW)",
                "Neuropeptide FF (NPFF)",
                "Satiety Peptide (Peptide YY, PYY)",
                "Hunger Peptide (Ghrelin)",
                "Melanin-Concentrating Hormone (MCH)",
                "Corticotropin-Releasing Factor (CRF)",
                "Tachykinin-Related Peptide (TRP)",
                "Neuropeptide S (NPS)",
                "Neuropeptide B (NPB)",
                "Neuropeptide K (NPK)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Bradykinin",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Melanocyte-Stimulating Hormones",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Opioid Peptides",
                "Pancreatic Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Vasoactive Intestinal Peptide",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 10,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Vasopressin (AVP)",
            "Oxytocin (OXT)",
            "Neurotensin (NT)",
            "Cholecystokinin (CCK)",
            "Galanin (GAL)",
            "Neuromedin U (NMU)",
            "Neuromedin S (NMS)",
            "Corticotropin-releasing hormone (CRH)",
            "Vasoactive intestinal peptide (VIP)",
            "Calcitonin gene-related peptide (CGRP)",
            "Galanin (GAL)",
            "Angiotensin II (Ang II)",
            "Endorphin (ENK)",
            "Dynorphin (DYN)",
            "Enkephalin (ENK)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Substance K (NK1)",
            "Gastrin-releasing peptide (GRP)",
            "Pituitary adenylate cyclase-activating peptide (PACAP)",
            "Neuropeptide Y (NPY)",
            "Atrial natriuretic peptide (ANP)",
            "Bradykinin (BK)",
            "Adrenomedullin (AM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Vasopressin",
                "Neurotensin",
                "Galanin",
                "Corticotropin-releasing hormone",
                "Vasoactive intestinal peptide",
                "Calcitonin gene-related peptide",
                "Angiotensin II",
                "Dynorphin",
                "Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Gastrin-releasing peptide",
                "Pituitary adenylate cyclase-activating polypeptide",
                "Neuropeptide Y",
                "Bradykinin"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Neuromedin U",
                "Neuromedin S",
                "Endorphin",
                "Substance K",
                "Atrial natriuretic peptide",
                "Adrenomedullin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurophysins",
                "Neurotensin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Pro-Opiomelanocortin",
                "Secretin",
                "Somatostatin",
                "Substance P",
                "Tachykinins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Adrenomedullin (ADM)",
            "Angiotensin II",
            "Atrial Natriuretic Peptide (ANP)",
            "Beta-Endorphin",
            "Bradykinin",
            "Calcitonin",
            "Cholecystokinin (CCK)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Dynorphin",
            "Endothelin",
            "Enkephalins",
            "Gastrin",
            "Glucagon",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Insulin",
            "Leptin",
            "Melatonin",
            "Neurotensin",
            "Orexin",
            "Oxytocin",
            "Proopiomelanocortin (POMC)",
            "Secretin",
            "Somatostatin",
            "Substance P"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Angiotensin II",
                "Beta-Endorphin",
                "Bradykinin",
                "Calcitonin",
                "Corticotropin-Releasing Hormone",
                "Enkephalins",
                "Gastrin",
                "Gonadotropin-Releasing Hormone",
                "Neurotensin",
                "Orexins",
                "Pro-Opiomelanocortin",
                "Secretin",
                "Somatostatin",
                "Substance P"
            ],
            "mismatches": [
                "Adrenomedullin (ADM)",
                "Atrial Natriuretic Peptide (ANP)",
                "Cholecystokinin (CCK)",
                "Dynorphin",
                "Endothelin",
                "Glucagon",
                "Insulin",
                "Leptin",
                "Melatonin",
                "Oxytocin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Hypothalamic Hormones",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocortins",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neurotensin",
                "Orexins",
                "Pro-Opiomelanocortin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Thyrotropin-Releasing Hormone",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-Lipotropin",
                "gamma-Lipotropin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Vasopressin (AVP)",
            "Oxytocin (OT)",
            "Somatostatin (SST)",
            "Cholecystokinin (CCK)",
            "Gastrin-Releasing Peptide (GRP)",
            "Neurotensin (NT)",
            "Luteinizing Hormone-Releasing Hormone (LHRH)",
            "Gonadotropin-Inhibiting Hormone (GnIH)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Prolactin-Releasing Hormone (PRH)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Endorphins (\u03b2-EP)",
            "Dynorphins (Dyn)",
            "Enkephalins (ENK)",
            "Motilin (MTL)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Secretin (SCR)",
            "Glucagon-Like Peptide-1 (GLP-1)",
            "Ghrelin (GHRL)",
            "Neuromedin U (NMU)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Somatostatin",
                "Gastrin-Releasing Peptide",
                "Neurotensin",
                "Corticotropin-Releasing Hormone",
                "Thyrotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Prolactin-Releasing Hormone",
                "Melanocyte-Stimulating Hormones",
                "Dynorphins",
                "Enkephalins",
                "Motilin",
                "Vasoactive Intestinal Peptide",
                "Secretin"
            ],
            "mismatches": [
                "Vasopressin (AVP)",
                "Oxytocin (OT)",
                "Cholecystokinin (CCK)",
                "Luteinizing Hormone-Releasing Hormone (LHRH)",
                "Gonadotropin-Inhibiting Hormone (GnIH)",
                "Endorphins (\u03b2-EP)",
                "Glucagon-Like Peptide-1 (GLP-1)",
                "Ghrelin (GHRL)",
                "Neuromedin U (NMU)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Arginine Vasopressin",
                "Buserelin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Enkephalins",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "MSH Release-Inhibiting Hormone",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurophysins",
                "Neurotensin",
                "Pancreatic Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Pro-Opiomelanocortin",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-MSH",
                "gamma-Lipotropin"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Endorphins",
            "Enkephalins",
            "Dynorphins",
            "Corticotropin-Releasing Hormone (CRH)",
            "Galanin (GAL)",
            "Somatostatin (SST)",
            "Cholecystokinin (CCK)",
            "Neurotensin (NT)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Melanin-Concentrating Hormone (MCH)",
            "Bombesin",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide S (NPS)",
            "Prolactin-Releasing Peptide (PrRP)",
            "Pituitary Adenylate Cyclase-Activating Peptide (PACAP)",
            "Kisspeptin",
            "Orexin (Hypocretin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Vasoactive Intestinal Peptide",
                "Vasopressin",
                "Endorphins",
                "Enkephalins",
                "Dynorphins",
                "Corticotropin-Releasing Hormone",
                "Galanin",
                "Somatostatin",
                "Neurotensin",
                "Gonadotropin-Releasing Hormone",
                "Thyrotropin-Releasing Hormone",
                "Bombesin",
                "Calcitonin Gene-Related Peptide",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Kisspeptins",
                "Orexins"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Melanin-Concentrating Hormone",
                "Neuropeptide FF",
                "Neuropeptide S",
                "Prolactin-Releasing Peptide"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-MSH"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Somatostatin (SST)",
            "Enkephalins (ENK)",
            "Endorphins (END)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Cholecystokinin (CCK)",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide B (NPB)",
            "Neuropeptide W (NPW)",
            "Agouti-Related Peptide (AgRP)",
            "Melanin-Concentrating Hormone (MCH)",
            "Dynorphins (DYN)",
            "Galanin (GAL)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Bombesin (BN)",
            "Urocortin (UCN)",
            "Nociceptin (NOP)",
            "Neuropeptide S (NPS)",
            "Corticotropin-Releasing Factor (CRF)",
            "Thyrotropin-Releasing Hormone (TRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P (SP)",
                "Neuropeptide Y (NPY)",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Somatostatin (SST)",
                "Corticotropin-Releasing Hormone (CRH)",
                "Dynorphins (DYN)",
                "Galanin (GAL)",
                "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
                "Bombesin (BN)",
                "Urocortin (UCN)",
                "Nociceptin (NOP)"
            ],
            "mismatches": [
                "Enkephalins (ENK)",
                "Endorphins (END)",
                "Oxytocin (OXT)",
                "Vasopressin (AVP)",
                "Cholecystokinin (CCK)",
                "Neuropeptide FF (NPFF)",
                "Neuropeptide B (NPB)",
                "Neuropeptide W (NPW)",
                "Agouti-Related Peptide (AgRP)",
                "Melanin-Concentrating Hormone (MCH)",
                "Neuropeptide S (NPS)",
                "Corticotropin-Releasing Factor (CRF)",
                "Thyrotropin-Releasing Hormone (TRH)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Arginine Vasopressin",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Nociceptin",
                "Peptide PHI",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Urocortins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 12,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Oxytocin (OT)",
            "Vasopressin (AVP)",
            "Neuropeptide Y (NPY)",
            "Substance P (SP)",
            "Corticotropin-releasing hormone (CRH)",
            "Somatostatin (SST)",
            "Gonadotropin-releasing hormone (GnRH)",
            "Thyrotropin-releasing hormone (TRH)",
            "Neurotensin (NT)",
            "Endorphins (END)",
            "Enkephalins (ENK)",
            "Cholecystokinin (CCK)",
            "Vasoactive intestinal peptide (VIP)",
            "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
            "Neuropeptide S (NPS)",
            "Neuropeptide B (NPB)",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide VF (NPVF)",
            "Orexin (ORX)",
            "Melanocyte-stimulating hormone (MSH)",
            "Adrenocorticotropic hormone (ACTH)",
            "Delta sleep-inducing peptide (DSIP)",
            "Angiotensin II (ANG II)",
            "Motilin (MTL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Vasopressin (AVP)",
                "Neuropeptide Y (NPY)",
                "Substance P (SP)",
                "Corticotropin-releasing hormone (CRH)",
                "Somatostatin (SST)",
                "Gonadotropin-releasing hormone (GnRH)",
                "Thyrotropin-releasing hormone (TRH)",
                "Neurotensin (NT)",
                "Endorphins (END)",
                "Enkephalins (ENK)",
                "Vasoactive intestinal peptide (VIP)",
                "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
                "Orexin (ORX)",
                "Melanocyte-stimulating hormone (MSH)",
                "Adrenocorticotropic hormone (ACTH)",
                "Delta sleep-inducing peptide (DSIP)",
                "Angiotensin II (ANG II)",
                "Motilin (MTL)"
            ],
            "mismatches": [
                "Oxytocin (OT)",
                "Cholecystokinin (CCK)",
                "Neuropeptide S (NPS)",
                "Neuropeptide B (NPB)",
                "Neuropeptide FF (NPFF)",
                "Neuropeptide VF (NPVF)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Buserelin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Ornipressin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P",
            "Oxytocin",
            "Vasopressin",
            "Endorphins",
            "Enkephalins",
            "Neurokinin A",
            "Neurokinin B",
            "Galanin",
            "Neuropeptide Y",
            "Somatostatin",
            "Corticotropin-releasing hormone (CRH)",
            "Cholecystokinin (CCK)",
            "Gastrin-releasing peptide (GRP)",
            "Neurotensin",
            "Bombesin",
            "Dynorphin",
            "Met-enkephalin",
            "Leu-enkephalin",
            "Ghrelin",
            "Angiotensin",
            "Neurokinin-1 (NK-1)",
            "Neurokinin-2 (NK-2)",
            "Neurokinin-3 (NK-3)",
            "Neurokinin-4 (NK-4)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Endorphins",
                "Enkephalins",
                "Neurokinin A",
                "Neurokinin B",
                "Galanin",
                "Neuropeptide Y",
                "Somatostatin",
                "Neurotensin",
                "Bombesin",
                "Gastrin-releasing peptide (GRP)"
            ],
            "mismatches": [
                "Oxytocin",
                "Vasopressin",
                "Corticotropin-releasing hormone (CRH)",
                "Cholecystokinin (CCK)",
                "Dynorphin",
                "Met-enkephalin",
                "Leu-enkephalin",
                "Ghrelin",
                "Angiotensin",
                "Neurokinin-1 (NK-1)",
                "Neurokinin-2 (NK-2)",
                "Neurokinin-3 (NK-3)",
                "Neurokinin-4 (NK-4)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bombesin",
                "Buserelin",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "D-Ala(2),MePhe(4),Met(0)-ol-enkephalin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Leucine-2-Alanine Enkephalin",
                "Lypressin",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Terlipressin",
                "Vasopressins",
                "alpha-Endorphin"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Oxytocin",
            "Vasopressin",
            "Enkephalin (Enk)",
            "Endorphin",
            "Somatostatin (SST)",
            "Galanin",
            "Corticotropin-releasing hormone (CRH)",
            "Vasoactive intestinal peptide (VIP)",
            "Nociceptin (Orphanin FQ)",
            "Calcitonin gene-related peptide (CGRP)",
            "Dynorphin",
            "Cholecystokinin (CCK)",
            "Bombesin",
            "Kisspeptin",
            "Prolactin-releasing peptide (PrRP)",
            "Tachykinin",
            "Adrenomedullin",
            "Pituitary adenylate cyclase-activating peptide (PACAP)",
            "Secretin",
            "Neurotensin",
            "Cocaine- and amphetamine-regulated transcript (CART)",
            "Relaxin-3"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Vasopressin",
                "Enkephalins",
                "Endorphins",
                "Somatostatin",
                "Galanin",
                "Corticotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Nociceptin",
                "Calcitonin Gene-Related Peptide",
                "Dynorphins",
                "Bombesin",
                "Kisspeptins",
                "Tachykinins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Secretin",
                "Neurotensin",
                "Cocaine- and Amphetamine-Regulated Transcript Protein"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Prolactin-releasing peptide",
                "Adrenomedullin",
                "Relaxin-3"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin III",
                "Angiotensins",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Lypressin",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Nociceptin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Pro-Opiomelanocortin",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Terlipressin",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Cholecystokinin (CCK)",
            "Somatostatin (SST)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Enkephalin",
            "Beta-Endorphin",
            "Galanin (GAL)",
            "Neurotensin (NT)",
            "Melanin-Concentrating Hormone (MCH)",
            "Orexin (Hypocretin)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Thyrotropin-Releasing Hormone (TRH)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Neuropeptide FF (NPFF)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Cocaine and Amphetamine Regulated Transcript (CART)",
            "Prolactin-Releasing Peptide (PrRP)",
            "Kisspeptin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Neuropeptide Y",
                "Vasoactive Intestinal Peptide",
                "Calcitonin Gene-Related Peptide",
                "Somatostatin",
                "Corticotropin-Releasing Hormone",
                "Vasopressin",
                "beta-Endorphin",
                "Galanin",
                "Neurotensin",
                "Orexins",
                "Gonadotropin-Releasing Hormone",
                "Thyrotropin-Releasing Hormone",
                "Neurokinin A",
                "Neurokinin B",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Kisspeptins"
            ],
            "mismatches": [
                "Cholecystokinin (CCK)",
                "Oxytocin (OXT)",
                "Enkephalin",
                "Melanin-Concentrating Hormone (MCH)",
                "Neuropeptide FF (NPFF)",
                "Cocaine and Amphetamine Regulated Transcript (CART)",
                "Prolactin-Releasing Peptide (PrRP)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Arginine Vasopressin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Orexins",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-Endorphin",
                "beta-MSH"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Adrenocorticotropic hormone (ACTH)",
            "Agouti-related peptide (AgRP)",
            "Calcitonin gene-related peptide (CGRP)",
            "Cholecystokinin (CCK)",
            "Corticotropin-releasing factor (CRF)",
            "Dynorphin",
            "Endorphins",
            "Galanin",
            "Gastrin-releasing peptide (GRP)",
            "Ghrelin",
            "Glucagon-like peptide-1 (GLP-1)",
            "Gonadotropin-releasing hormone (GnRH)",
            "Growth hormone-releasing hormone (GHRH)",
            "Kisspeptin",
            "Melanin-concentrating hormone (MCH)",
            "Melanocyte-stimulating hormone (MSH)",
            "Neuropeptide Y (NPY)",
            "Neurotensin",
            "Oxytocin",
            "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
            "Prolactin-releasing peptide (PrRP)",
            "Somatostatin",
            "Substance P",
            "Vasoactive intestinal peptide (VIP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenocorticotropic hormone (ACTH)",
                "Calcitonin gene-related peptide (CGRP)",
                "Dynorphin",
                "Endorphins",
                "Galanin",
                "Gastrin-releasing peptide (GRP)",
                "Gonadotropin-releasing hormone (GnRH)",
                "Growth hormone-releasing hormone (GHRH)",
                "Kisspeptin",
                "Melanocyte-stimulating hormone (MSH)",
                "Neuropeptide Y (NPY)",
                "Neurotensin",
                "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
                "Somatostatin",
                "Substance P",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "mismatches": [
                "Agouti-related peptide (AgRP)",
                "Cholecystokinin (CCK)",
                "Corticotropin-releasing factor (CRF)",
                "Ghrelin",
                "Glucagon-like peptide-1 (GLP-1)",
                "Melanin-concentrating hormone (MCH)",
                "Oxytocin",
                "Prolactin-releasing peptide (PrRP)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensins",
                "Bombesin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Endorphins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Kisspeptins",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Pancreatic Polypeptide",
                "Peptide PHI",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin Release-Inhibiting Factors",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Thyrotropin-Releasing Hormone",
                "Vasoactive Intestinal Peptide",
                "alpha-Endorphin",
                "beta-MSH"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Oxytocin (OXT)",
            "Vasopressin (AVP)",
            "Substance P (SP)",
            "Neuropeptide Y (NPY)",
            "Somatostatin (SST)",
            "Cholecystokinin (CCK)",
            "Neurotensin (NT)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Galanin (GAL)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Melanocortins (\u03b1-MSH, \u03b2-MSH, \u03b3-MSH)",
            "Orexins (Orexin-A, Orexin-B)",
            "Opioid Peptides (Enkephalins, Endorphins, Dynorphins)",
            "Tachykinins (Substance P, Neurokinin A, Neurokinin B)",
            "Bradykinin (BK)",
            "Angiotensin (Ang II)",
            "Glucagon-Like Peptide-1 (GLP-1)",
            "Gastrin-Releasing Peptide (GRP)",
            "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
            "Cocaine- and Amphetamine-Regulated Transcript (CART)",
            "Neuropeptide S (NPS)",
            "Neuropeptide FF (NPFF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Vasopressin (AVP)",
                "Substance P (SP)",
                "Neuropeptide Y (NPY)",
                "Somatostatin (SST)",
                "Neurotensin (NT)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Galanin (GAL)",
                "Corticotropin-Releasing Hormone (CRH)",
                "Melanocortins (\u03b1-MSH, \u03b2-MSH, \u03b3-MSH)",
                "Orexins (Orexin-A, Orexin-B)",
                "Opioid Peptides (Enkephalins, Endorphins, Dynorphins)",
                "Tachykinins (Substance P, Neurokinin A, Neurokinin B)",
                "Bradykinin (BK)",
                "Gastrin-Releasing Peptide (GRP)",
                "Pituitary Adenylate Cyclase-Activating Polypeptide (PACAP)",
                "Cocaine- and Amphetamine-Regulated Transcript (CART)"
            ],
            "mismatches": [
                "Oxytocin (OXT)",
                "Cholecystokinin (CCK)",
                "Angiotensin (Ang II)",
                "Glucagon-Like Peptide-1 (GLP-1)",
                "Neuropeptide S (NPS)",
                "Neuropeptide FF (NPFF)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Hypothalamic Hormones",
                "Lypressin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Opioid Peptides",
                "Orexins",
                "Pancreatic Polypeptide",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Adrenocorticotropic Hormone (ACTH)",
            "Antidiuretic Hormone (ADH)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Cholecystokinin (CCK)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Dynorphin",
            "Endorphin",
            "Enkephalin",
            "Galanin",
            "Ghrelin",
            "Glucagon-Like Peptide-1 (GLP-1)",
            "Gonadotropin-Releasing Hormone (GnRH)",
            "Growth Hormone-Releasing Hormone (GHRH)",
            "Histamine",
            "Melanin-Concentrating Hormone (MCH)",
            "Melanocyte-Stimulating Hormone (MSH)",
            "Neuropeptide Y (NPY)",
            "Orexin",
            "Oxytocin",
            "Parathyroid Hormone-Related Protein (PTHrP)",
            "Prolactin-Releasing Hormone (PRH)",
            "Somatostatin",
            "Substance P",
            "Thyrotropin-Releasing Hormone (TRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adrenocorticotropic Hormone (ACTH)",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Corticotropin-Releasing Hormone (CRH)",
                "Dynorphin",
                "Endorphin",
                "Enkephalin",
                "Galanin",
                "Gonadotropin-Releasing Hormone (GnRH)",
                "Growth Hormone-Releasing Hormone (GHRH)",
                "Melanocyte-Stimulating Hormone (MSH)",
                "Neuropeptide Y (NPY)",
                "Orexin",
                "Prolactin-Releasing Hormone (PRH)",
                "Somatostatin",
                "Substance P",
                "Thyrotropin-Releasing Hormone (TRH)"
            ],
            "mismatches": [
                "Antidiuretic Hormone (ADH)",
                "Cholecystokinin (CCK)",
                "Ghrelin",
                "Glucagon-Like Peptide-1 (GLP-1)",
                "Histamine",
                "Melanin-Concentrating Hormone (MCH)",
                "Oxytocin",
                "Parathyroid Hormone-Related Protein (PTHrP)"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Bombesin",
                "Bradykinin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Delta Sleep-Inducing Peptide",
                "Dynorphins",
                "Endorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Hypothalamic Hormones",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocortins",
                "Melanocyte-Stimulating Hormones",
                "Methionine Enkephalin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Orexins",
                "Pancreatic Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Prolactin-Releasing Hormone",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Tachykinins",
                "Terlipressin",
                "Thyrotropin-Releasing Hormone",
                "Vasopressins",
                "alpha-Endorphin",
                "beta-MSH"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Substance P (SP)",
            "Vasopressin (AVP)",
            "Oxytocin (OT)",
            "Cholecystokinin (CCK)",
            "Gastrin-releasing peptide (GRP)",
            "Neurotensin (NT)",
            "Bombesin (BN)",
            "Neuromedin B (NMB)",
            "Neuromedin U (NMU)",
            "Neuropeptide Y (NPY)",
            "Pituitary adenylate cyclase-activating polypeptide (PACAP)",
            "Vasoactive intestinal peptide (VIP)",
            "Secretin",
            "Calcitonin gene-related peptide (CGRP)",
            "Adrenomedullin (ADM)",
            "Cortistatin",
            "Galanin (GAL)",
            "Motilin",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Tachykinin-1 (TAC1)",
            "Tachykinin-3 (TAC3)",
            "Neuropeptide AF (NP-AF)",
            "Neuropeptide FF (NP-FF)",
            "Neuropeptide SF (NP-SF)",
            "Neuropeptide EF (NP-EF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Substance P",
                "Vasopressin",
                "Gastrin-Releasing Peptide",
                "Neurotensin",
                "Bombesin",
                "Neuropeptide Y",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Vasoactive Intestinal Peptide",
                "Secretin",
                "Calcitonin Gene-Related Peptide",
                "Galanin",
                "Motilin",
                "Neurokinin A",
                "Neurokinin B"
            ],
            "mismatches": [
                "Oxytocin",
                "Cholecystokinin",
                "Neuromedin B",
                "Neuromedin U",
                "Adrenomedullin",
                "Cortistatin",
                "Tachykinin-1",
                "Tachykinin-3",
                "Neuropeptide AF",
                "Neuropeptide FF",
                "Neuropeptide SF",
                "Neuropeptide EF"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Arginine Vasopressin",
                "Bombesin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cosyntropin",
                "Dynorphins",
                "FMRFamide",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Lypressin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurophysins",
                "Neurotensin",
                "Nociceptin",
                "Pituitary Adenylate Cyclase-Activating Polypeptide",
                "Pituitary Hormone-Releasing Hormones",
                "Pro-Opiomelanocortin",
                "Secretin",
                "Somatostatin",
                "Substance P",
                "Tachykinins",
                "Vasoactive Intestinal Peptide",
                "Vasopressins"
            ],
            "TP": 14,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Adrenocorticotropic hormone (ACTH)",
            "Angiotensin",
            "Antidiuretic hormone (ADH)",
            "Atrial natriuretic peptide (ANP)",
            "Bradykinin",
            "Calcitonin",
            "Cocaine- and amphetamine-regulated transcript (CART)",
            "Cholecystokinin (CCK)",
            "Corticotropin-releasing hormone (CRH)",
            "Endothelin",
            "Enkephalin",
            "Galanin",
            "Gastrin",
            "Ghrelin",
            "Glucagon-like peptide-1 (GLP-1)",
            "Growth hormone-releasing hormone (GHRH)",
            "Motilin",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide Y (NPY)",
            "Neurotensin",
            "Oxytocin",
            "Secretin",
            "Somatostatin",
            "Substance P",
            "Vasopressin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bradykinin",
                "Calcitonin",
                "Corticotropin-releasing hormone (CRH)",
                "Enkephalin",
                "Galanin",
                "Gastrin",
                "Growth hormone-releasing hormone (GHRH)",
                "Motilin",
                "Neuropeptide Y (NPY)",
                "Neurotensin",
                "Secretin",
                "Somatostatin",
                "Substance P",
                "Vasopressin"
            ],
            "mismatches": [
                "Adrenocorticotropic hormone (ACTH)",
                "Angiotensin",
                "Antidiuretic hormone (ADH)",
                "Atrial natriuretic peptide (ANP)",
                "Cocaine- and amphetamine-regulated transcript (CART)",
                "Cholecystokinin (CCK)",
                "Endothelin",
                "Ghrelin",
                "Glucagon-like peptide-1 (GLP-1)",
                "Neuropeptide FF (NPFF)",
                "Oxytocin"
            ],
            "true_referents": [
                "Adrenocorticotropic Hormone",
                "Angiotensin I",
                "Angiotensin II",
                "Angiotensins",
                "Bombesin",
                "Bradykinin",
                "Buserelin",
                "Calcitonin",
                "Calcitonin Gene-Related Peptide",
                "Cocaine- and Amphetamine-Regulated Transcript Protein",
                "Corticotropin-Releasing Hormone",
                "Cosyntropin",
                "Dynorphins",
                "Enkephalins",
                "Galanin",
                "Galanin-Like Peptide",
                "Gastric Inhibitory Polypeptide",
                "Gastrin-Releasing Peptide",
                "Gastrins",
                "Gonadotropin-Releasing Hormone",
                "Growth Hormone-Releasing Hormone",
                "Leucine Enkephalin",
                "Lypressin",
                "Melanocortins",
                "Methionine Enkephalin",
                "Motilin",
                "Nafarelin",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Neurotensin",
                "Pancreatic Polypeptide",
                "Prolactin-Releasing Hormone",
                "Ras Homolog Enriched in Brain Protein",
                "Secretin",
                "Somatostatin",
                "Somatostatin-28",
                "Substance P",
                "Terlipressin",
                "Vasopressins"
            ],
            "TP": 14,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "neuropeptide",
        "domain": "biology",
        "response": [
            "Neuropeptide Y",
            "Neuropeptide S",
            "Neuropeptide FF",
            "Neuropeptide K",
            "Neuropeptide W",
            "Neuropeptide V",
            "Neuropeptide A",
            "Neuropeptide B",
            "Neuropeptide C",
            "Neuropeptide D",
            "Neuropeptide E",
            "Neuropeptide F",
            "Neuropeptide G",
            "Neuropeptide H",
            "Neuropeptide I",
            "Neuropeptide J",
            "Neuropeptide K",
            "Neuropeptide L",
            "Neuropeptide M",
            "Neuropeptide N",
            "Neuropeptide O",
            "Neuropeptide P",
            "Neuropeptide Q",
            "Neuropeptide R",
            "Neuropeptide S",
            "Neuropeptide T",
            "Neuropeptide U",
            "Neuropeptide V",
            "Neuropeptide W",
            "Neuropeptide X",
            "Neuropeptide Y",
            "Neuropeptide Z"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neuropeptide Y"
            ],
            "mismatches": [
                "Neuropeptide S",
                "Neuropeptide FF",
                "Neuropeptide K",
                "Neuropeptide W",
                "Neuropeptide V",
                "Neuropeptide A",
                "Neuropeptide B",
                "Neuropeptide C",
                "Neuropeptide D",
                "Neuropeptide E",
                "Neuropeptide F",
                "Neuropeptide G",
                "Neuropeptide H",
                "Neuropeptide I",
                "Neuropeptide J",
                "Neuropeptide K",
                "Neuropeptide L",
                "Neuropeptide M",
                "Neuropeptide N",
                "Neuropeptide O",
                "Neuropeptide P",
                "Neuropeptide Q",
                "Neuropeptide R",
                "Neuropeptide S",
                "Neuropeptide T",
                "Neuropeptide U",
                "Neuropeptide V",
                "Neuropeptide W",
                "Neuropeptide X",
                "Neuropeptide Z"
            ],
            "true_referents": [
                "Dynorphins",
                "Kisspeptins",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide Y",
                "Substance P",
                "Tachykinins"
            ],
            "TP": 1,
            "FP": 26,
            "FN": 0
        }
    }
]