[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Cholecystokinin (CCK)",
            "Gastrin",
            "Secretin",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon-like Peptide-2 (GLP-2)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Motilin",
            "Peptide YY (PYY)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Somatostatin",
            "Ghrelin",
            "Neuropeptide Y (NPY)",
            "Pancreatic Polypeptide",
            "Enteroglucagon",
            "Orexin (Hypocretin)",
            "Chromogranin A",
            "Chromogranin B",
            "Enterostatin",
            "Substance P",
            "Enkephalin",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Corticotropin-Releasing Hormone (CRH)",
            "Leptin",
            "Oxyntomodulin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholecystokinin (CCK)",
                "Gastrin",
                "Secretin",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Motilin",
                "Peptide YY (PYY)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Somatostatin",
                "Ghrelin",
                "Neuropeptide Y (NPY)",
                "Pancreatic Polypeptide",
                "Enteroglucagon",
                "Orexin (Hypocretin)",
                "Chromogranin A",
                "Chromogranin B",
                "Enterostatin",
                "Substance P",
                "Enkephalin",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Corticotropin-Releasing Hormone (CRH)",
                "Leptin",
                "Oxyntomodulin"
            ],
            "mismatches": [],
            "true_referents": [
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Chromogranin A",
                "Chromogranin B",
                "Corticotropin-Releasing Hormone (CRH)",
                "Enkephalin",
                "Enteroglucagon",
                "Enterostatin",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin",
                "Ghrelin",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Leptin",
                "Motilin",
                "Neuropeptide Y (NPY)",
                "Orexin (Hypocretin)",
                "Oxyntomodulin",
                "Pancreatic Polypeptide",
                "Peptide YY (PYY)",
                "Secretin",
                "Somatostatin",
                "Substance P",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Glucose-dependent insulinotropic polypeptide (GIP)",
            "Glucagon-like peptide-1 (GLP-1)",
            "Glucagon-like peptide-2 (GLP-2)",
            "Motilin (MTL)",
            "Gastric inhibitory polypeptide (GIP)",
            "Somatostatin (SST)",
            "Vasoactive intestinal peptide (VIP)",
            "Peptide YY (PYY)",
            "Oxyntomodulin (OXM)",
            "Neurotensin (NTS)",
            "Enteroglucagon (EG)",
            "Gastric inhibitory peptide (GIP)",
            "Ghrelin (GRL)",
            "Ghrelin-acyl (Ghrelin-O-acyl)",
            "Pancreatic polypeptide (PP)",
            "Cholecystokinin-A (CCK-A)",
            "Cholecystokinin-B (CCK-B)",
            "Gastric inhibitory polypeptide-1 (GIP-1)",
            "Gastric inhibitory polypeptide-2 (GIP-2)",
            "Neurotensin receptor 1 (NTSR1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Glucose-dependent insulinotropic polypeptide (GIP)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Motilin (MTL)",
                "Gastric inhibitory polypeptide (GIP)",
                "Somatostatin (SST)",
                "Vasoactive intestinal peptide (VIP)",
                "Peptide YY (PYY)",
                "Oxyntomodulin (OXM)",
                "Neurotensin (NTS)",
                "Enteroglucagon (EG)",
                "Gastric inhibitory peptide (GIP)",
                "Ghrelin (GRL)",
                "Ghrelin-acyl (Ghrelin-O-acyl)",
                "Pancreatic polypeptide (PP)",
                "Cholecystokinin-A (CCK-A)",
                "Cholecystokinin-B (CCK-B)",
                "Gastric inhibitory polypeptide-1 (GIP-1)",
                "Gastric inhibitory polypeptide-2 (GIP-2)",
                "Neurotensin receptor 1 (NTSR1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cholecystokinin (CCK)",
                "Cholecystokinin-A (CCK-A)",
                "Cholecystokinin-B (CCK-B)",
                "Enteroglucagon (EG)",
                "Gastric inhibitory peptide (GIP)",
                "Gastric inhibitory polypeptide (GIP)",
                "Gastric inhibitory polypeptide-1 (GIP-1)",
                "Gastric inhibitory polypeptide-2 (GIP-2)",
                "Gastrin (GAS)",
                "Ghrelin (GRL)",
                "Ghrelin-acyl (Ghrelin-O-acyl)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Glucose-dependent insulinotropic polypeptide (GIP)",
                "Motilin (MTL)",
                "Neurotensin (NTS)",
                "Neurotensin receptor 1 (NTSR1)",
                "Oxyntomodulin (OXM)",
                "Pancreatic polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (SCT)",
                "Somatostatin (SST)",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (G)",
            "Cholecystokinin (CCK)",
            "Secretin (S)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Motilin (MOT)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Somatostatin (SST)",
            "Neurotensin (NT)",
            "Peptide YY (PYY)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon-like Peptide-2 (GLP-2)",
            "Ghrelin (GHR)",
            "Oxyntomodulin (OXM)",
            "Enterostatin",
            "Pancreatic Polypeptide (PP)",
            "Apo A-IV",
            "Apo B-48",
            "Apo E",
            "Enteroglucagon",
            "Neuropeptide W",
            "Neuropeptide B",
            "Gastrointestinal Inhibitory Peptide (GIP)",
            "Neurokinin A",
            "Neurokinin B"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (G)",
                "Cholecystokinin (CCK)",
                "Secretin (S)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Motilin (MOT)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Somatostatin (SST)",
                "Neurotensin (NT)",
                "Peptide YY (PYY)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Ghrelin (GHR)",
                "Oxyntomodulin (OXM)",
                "Enterostatin",
                "Pancreatic Polypeptide (PP)",
                "Apo A-IV",
                "Apo B-48",
                "Apo E",
                "Enteroglucagon",
                "Neuropeptide W",
                "Neuropeptide B",
                "Neurokinin A",
                "Neurokinin B"
            ],
            "mismatches": [
                "Gastrointestinal Inhibitory Peptide (GIP)"
            ],
            "true_referents": [
                "Apo A-IV",
                "Apo B-48",
                "Apo E",
                "Cholecystokinin (CCK)",
                "Enteroglucagon",
                "Enterostatin",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin (G)",
                "Gastrointestinal Inhibitory Peptide (GIP)",
                "Ghrelin (GHR)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Motilin (MOT)",
                "Neurokinin A",
                "Neurokinin B",
                "Neuropeptide B",
                "Neuropeptide W",
                "Neurotensin (NT)",
                "Oxyntomodulin (OXM)",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (S)",
                "Somatostatin (SST)",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (Gast)",
            "Cholecystokinin (CCK)",
            "Secretin (Sec)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Glucose-dependent Insulinotropic Polypeptide (GIP)",
            "Motilin (Mot)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Enteroglucagon (Glu)",
            "Somatostatin (SST)",
            "Ghrelin (Ghr)",
            "Peptide YY (PYY)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon-like Peptide-2 (GLP-2)",
            "Oxyntomodulin (OXM)",
            "Pancreatic Polypeptide (PP)",
            "Urotensin II (URI)",
            "Neurotensin (NT)",
            "Bombesin (Bbn)",
            "Gastrin-Releasing Peptide (GRP)",
            "Cerebrocortical peptide (CCCP)",
            "Apela (APL)",
            "Gonadotropin-releasing hormone (GnRH)",
            "Growth hormone-releasing hormone (GHRH)",
            "Thyrotropin-releasing hormone (TRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (Gast)",
                "Cholecystokinin (CCK)",
                "Secretin (Sec)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Glucose-dependent Insulinotropic Polypeptide (GIP)",
                "Motilin (Mot)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Enteroglucagon (Glu)",
                "Somatostatin (SST)",
                "Ghrelin (Ghr)",
                "Peptide YY (PYY)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Oxyntomodulin (OXM)",
                "Pancreatic Polypeptide (PP)",
                "Urotensin II (URI)",
                "Neurotensin (NT)",
                "Bombesin (Bbn)",
                "Gastrin-Releasing Peptide (GRP)",
                "Cerebrocortical peptide (CCCP)",
                "Apela (APL)",
                "Gonadotropin-releasing hormone (GnRH)",
                "Growth hormone-releasing hormone (GHRH)",
                "Thyrotropin-releasing hormone (TRH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Apela (APL)",
                "Bombesin (Bbn)",
                "Cerebrocortical peptide (CCCP)",
                "Cholecystokinin (CCK)",
                "Enteroglucagon (Glu)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin (Gast)",
                "Gastrin-Releasing Peptide (GRP)",
                "Ghrelin (Ghr)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Glucose-dependent Insulinotropic Polypeptide (GIP)",
                "Gonadotropin-releasing hormone (GnRH)",
                "Growth hormone-releasing hormone (GHRH)",
                "Motilin (Mot)",
                "Neurotensin (NT)",
                "Oxyntomodulin (OXM)",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (Sec)",
                "Somatostatin (SST)",
                "Thyrotropin-releasing hormone (TRH)",
                "Urotensin II (URI)",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAST)",
            "Cholecystokinin (CCK)",
            "Secretin",
            "Gastric Inhibitory Peptide (GIP)",
            "Motilin",
            "Ghrelin",
            "Somatostatin (SST)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Peptide YY (PYY)",
            "Neuropeptide Y (NPY)",
            "Substance P",
            "Neurotensin",
            "Enteroglucagon",
            "Bombesin",
            "Pancreatic Polypeptide (PP)",
            "Oxyntomodulin",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon-like Peptide-2 (GLP-2)",
            "Insulin-like Peptide 5 (INSL5)",
            "Amylin",
            "Leptin",
            "Adiponectin",
            "Fibroblast Growth Factor 19 (FGF19)",
            "Fibroblast Growth Factor 21 (FGF21)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAST)",
                "Cholecystokinin (CCK)",
                "Secretin",
                "Gastric Inhibitory Peptide (GIP)",
                "Motilin",
                "Ghrelin",
                "Somatostatin (SST)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Peptide YY (PYY)",
                "Neuropeptide Y (NPY)",
                "Substance P",
                "Neurotensin",
                "Enteroglucagon",
                "Bombesin",
                "Pancreatic Polypeptide (PP)",
                "Oxyntomodulin",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Insulin-like Peptide 5 (INSL5)",
                "Amylin",
                "Leptin",
                "Adiponectin",
                "Fibroblast Growth Factor 19 (FGF19)",
                "Fibroblast Growth Factor 21 (FGF21)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adiponectin",
                "Amylin",
                "Bombesin",
                "Cholecystokinin (CCK)",
                "Enteroglucagon",
                "Fibroblast Growth Factor 19 (FGF19)",
                "Fibroblast Growth Factor 21 (FGF21)",
                "Gastric Inhibitory Peptide (GIP)",
                "Gastrin (GAST)",
                "Ghrelin",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Insulin-like Peptide 5 (INSL5)",
                "Leptin",
                "Motilin",
                "Neuropeptide Y (NPY)",
                "Neurotensin",
                "Oxyntomodulin",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin",
                "Somatostatin (SST)",
                "Substance P",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Ghrelin (GHRL)",
            "Peptide YY (PYY)",
            "Glucagon-like peptide-1 (GLP-1)",
            "Glucagon (GCG)",
            "Somatostatin (SST)",
            "Insulin (INS)",
            "Vasoactive intestinal peptide (VIP)",
            "Motilin (MOT)",
            "Enterogastrone (EG)",
            "Pancreatic polypeptide (PP)",
            "Neuropeptide Y (NPY)",
            "Serotonin (5-HT)",
            "Calcitonin gene-related peptide (CGRP)",
            "Enteropeptidase (EP)",
            "Amylin (AMY)",
            "Dipeptidyl peptidase-4 (DPP-4)",
            "Histamine (HIS)",
            "Apolipoprotein A-IV (ApoA-IV)",
            "Cholecystokinin-octapeptide (CCK-8)",
            "Prostaglandin E2 (PGE2)",
            "Gastric inhibitory polypeptide (GIP)",
            "Neurotensin (NT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Ghrelin (GHRL)",
                "Peptide YY (PYY)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon (GCG)",
                "Somatostatin (SST)",
                "Insulin (INS)",
                "Vasoactive intestinal peptide (VIP)",
                "Motilin (MOT)",
                "Enterogastrone (EG)",
                "Pancreatic polypeptide (PP)",
                "Neuropeptide Y (NPY)",
                "Serotonin (5-HT)",
                "Calcitonin gene-related peptide (CGRP)",
                "Enteropeptidase (EP)",
                "Amylin (AMY)",
                "Dipeptidyl peptidase-4 (DPP-4)",
                "Histamine (HIS)",
                "Apolipoprotein A-IV (ApoA-IV)",
                "Cholecystokinin-octapeptide (CCK-8)",
                "Prostaglandin E2 (PGE2)",
                "Gastric inhibitory polypeptide (GIP)"
            ],
            "mismatches": [
                "Neurotensin (NT)"
            ],
            "true_referents": [
                "Amylin (AMY)",
                "Apolipoprotein A-IV (ApoA-IV)",
                "Calcitonin gene-related peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Cholecystokinin-octapeptide (CCK-8)",
                "Dipeptidyl peptidase-4 (DPP-4)",
                "Enterogastrone (EG)",
                "Enteropeptidase (EP)",
                "Gastric inhibitory polypeptide (GIP)",
                "Gastrin (GAS)",
                "Ghrelin (GHRL)",
                "Glucagon (GCG)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Histamine (HIS)",
                "Insulin (INS)",
                "Motilin (MOT)",
                "Neuropeptide Y (NPY)",
                "Pancreatic polypeptide (PP)",
                "Peptide YY (PYY)",
                "Prostaglandin E2 (PGE2)",
                "Secretin (SCT)",
                "Serotonin (5-HT)",
                "Somatostatin (SST)",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Motilin (MTL)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon-like Peptide-2 (GLP-2)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Neurotensin (NTS)",
            "Peptide YY (PYY)",
            "Pancreatic Polypeptide (PP)",
            "Somatostatin (SST)",
            "Substance P (SP)",
            "Enteroglucagon (EG)",
            "Motilin (MLN)",
            "Pancreatic Peptide YY (PYY-P)",
            "Enterostatin (ES)",
            "Chromogranin A (CgA)",
            "Neuropeptide Y (NPY)",
            "Oxyntomodulin (OXM)",
            "Ghrelin (GHRL)",
            "Leptin (LEP)",
            "Insulin-like Growth Factor-1 (IGF-1)",
            "Corticotropin-Releasing Hormone (CRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Motilin (MTL)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Neurotensin (NTS)",
                "Peptide YY (PYY)",
                "Pancreatic Polypeptide (PP)",
                "Somatostatin (SST)",
                "Substance P (SP)",
                "Enteroglucagon (EG)",
                "Motilin (MLN)",
                "Pancreatic Peptide YY (PYY-P)",
                "Enterostatin (ES)",
                "Chromogranin A (CgA)",
                "Neuropeptide Y (NPY)",
                "Oxyntomodulin (OXM)",
                "Ghrelin (GHRL)",
                "Leptin (LEP)",
                "Insulin-like Growth Factor-1 (IGF-1)",
                "Corticotropin-Releasing Hormone (CRH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cholecystokinin (CCK)",
                "Chromogranin A (CgA)",
                "Corticotropin-Releasing Hormone (CRH)",
                "Enteroglucagon (EG)",
                "Enterostatin (ES)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin (GAS)",
                "Ghrelin (GHRL)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-2 (GLP-2)",
                "Insulin-like Growth Factor-1 (IGF-1)",
                "Leptin (LEP)",
                "Motilin (MLN)",
                "Motilin (MTL)",
                "Neuropeptide Y (NPY)",
                "Neurotensin (NTS)",
                "Oxyntomodulin (OXM)",
                "Pancreatic Peptide YY (PYY-P)",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (SCT)",
                "Somatostatin (SST)",
                "Substance P (SP)",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin",
            "Cholecystokinin (CCK)",
            "Secretin",
            "Ghrelin",
            "Motilin",
            "Somatostatin",
            "Neurotensin",
            "Vasoactive intestinal peptide (VIP)",
            "Peptide YY (PYY)",
            "Glucagon-like peptide 1 (GLP-1)",
            "Gastric inhibitory polypeptide (GIP)",
            "Pancreatic polypeptide (PP)",
            "Enteroglucagon",
            "Bombesin",
            "Calcitonin gene-related peptide (CGRP)",
            "Substance P",
            "Neuropeptide Y (NPY)",
            "Oxyntomodulin",
            "Growth hormone-releasing peptide (GHRP)",
            "Motilin receptor agonist",
            "Ghrelin receptor agonist",
            "Cholecystokinin receptor antagonist",
            "Somatostatin receptor agonist",
            "Gastrin receptor antagonist"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin",
                "Cholecystokinin (CCK)",
                "Secretin",
                "Ghrelin",
                "Motilin",
                "Somatostatin",
                "Neurotensin",
                "Vasoactive intestinal peptide (VIP)",
                "Peptide YY (PYY)",
                "Glucagon-like peptide 1 (GLP-1)",
                "Gastric inhibitory polypeptide (GIP)",
                "Pancreatic polypeptide (PP)",
                "Enteroglucagon",
                "Bombesin",
                "Calcitonin gene-related peptide (CGRP)",
                "Substance P",
                "Neuropeptide Y (NPY)",
                "Oxyntomodulin",
                "Growth hormone-releasing peptide (GHRP)",
                "Motilin receptor agonist",
                "Ghrelin receptor agonist",
                "Cholecystokinin receptor antagonist",
                "Somatostatin receptor agonist",
                "Gastrin receptor antagonist"
            ],
            "mismatches": [],
            "true_referents": [
                "Bombesin",
                "Calcitonin gene-related peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Cholecystokinin receptor antagonist",
                "Enteroglucagon",
                "Gastric inhibitory polypeptide (GIP)",
                "Gastrin",
                "Gastrin receptor antagonist",
                "Ghrelin",
                "Ghrelin receptor agonist",
                "Glucagon-like peptide 1 (GLP-1)",
                "Growth hormone-releasing peptide (GHRP)",
                "Motilin",
                "Motilin receptor agonist",
                "Neuropeptide Y (NPY)",
                "Neurotensin",
                "Oxyntomodulin",
                "Pancreatic polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin",
                "Somatostatin",
                "Somatostatin receptor agonist",
                "Substance P",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAST)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Motilin",
            "Ghrelin",
            "Glucose-dependent Insulinotropic Peptide (GIP)",
            "Peptide YY (PYY)",
            "Neurotensin",
            "Somatostatin (SST)",
            "Enteroglucagon",
            "Pancreatic Polypeptide (PP)",
            "Amylin",
            "Uroguanylin",
            "Guanylin",
            "Bombesin",
            "Obestatin",
            "Insulin-like Peptide 5 (INSL5)",
            "Fibroblast Growth Factor 19 (FGF19)",
            "Glucagon-like Peptide 1 (GLP-1)",
            "Glucagon-like Peptide 2 (GLP-2)",
            "Nesfatin-1",
            "Oxyntomodulin",
            "Enterostatin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAST)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Motilin",
                "Ghrelin",
                "Glucose-dependent Insulinotropic Peptide (GIP)",
                "Peptide YY (PYY)",
                "Neurotensin",
                "Somatostatin (SST)",
                "Enteroglucagon",
                "Pancreatic Polypeptide (PP)",
                "Amylin",
                "Uroguanylin",
                "Guanylin",
                "Bombesin",
                "Obestatin",
                "Insulin-like Peptide 5 (INSL5)",
                "Fibroblast Growth Factor 19 (FGF19)",
                "Glucagon-like Peptide 1 (GLP-1)",
                "Glucagon-like Peptide 2 (GLP-2)",
                "Nesfatin-1",
                "Oxyntomodulin",
                "Enterostatin"
            ],
            "mismatches": [],
            "true_referents": [
                "Amylin",
                "Bombesin",
                "Cholecystokinin (CCK)",
                "Enteroglucagon",
                "Enterostatin",
                "Fibroblast Growth Factor 19 (FGF19)",
                "Gastrin (GAST)",
                "Ghrelin",
                "Glucagon-like Peptide 1 (GLP-1)",
                "Glucagon-like Peptide 2 (GLP-2)",
                "Glucose-dependent Insulinotropic Peptide (GIP)",
                "Guanylin",
                "Insulin-like Peptide 5 (INSL5)",
                "Motilin",
                "Nesfatin-1",
                "Neurotensin",
                "Obestatin",
                "Oxyntomodulin",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (SCT)",
                "Somatostatin (SST)",
                "Uroguanylin",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Motilin (MLN)",
            "Ghrelin (GHRL)",
            "Gastric inhibitory polypeptide (GIP)",
            "Glucagon-like peptide-1 (GLP-1)",
            "Glucagon-like peptide-2 (GLP-2)",
            "Peptide YY (PYY)",
            "Somatostatin (SST)",
            "Vasoactive intestinal peptide (VIP)",
            "Pancreatic polypeptide (PP)",
            "Oxyntomodulin (OXM)",
            "Neurotensin (NTS)",
            "Gastrin-releasing peptide (GRP)",
            "Enteroglucagon",
            "Guanylin",
            "Uroguanylin",
            "Obestatin",
            "Xenin",
            "Glucose-dependent insulinotropic polypeptide (GIP)",
            "Pancreatic peptide YY (PYY)",
            "Substance P",
            "Bombesin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Motilin (MLN)",
                "Ghrelin (GHRL)",
                "Gastric inhibitory polypeptide (GIP)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Peptide YY (PYY)",
                "Somatostatin (SST)",
                "Vasoactive intestinal peptide (VIP)",
                "Pancreatic polypeptide (PP)",
                "Oxyntomodulin (OXM)",
                "Neurotensin (NTS)",
                "Gastrin-releasing peptide (GRP)",
                "Enteroglucagon",
                "Guanylin",
                "Uroguanylin",
                "Obestatin",
                "Xenin",
                "Glucose-dependent insulinotropic polypeptide (GIP)",
                "Pancreatic peptide YY (PYY)",
                "Substance P",
                "Bombesin"
            ],
            "mismatches": [],
            "true_referents": [
                "Bombesin",
                "Cholecystokinin (CCK)",
                "Enteroglucagon",
                "Gastric inhibitory polypeptide (GIP)",
                "Gastrin (GAS)",
                "Gastrin-releasing peptide (GRP)",
                "Ghrelin (GHRL)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Glucose-dependent insulinotropic polypeptide (GIP)",
                "Guanylin",
                "Motilin (MLN)",
                "Neurotensin (NTS)",
                "Obestatin",
                "Oxyntomodulin (OXM)",
                "Pancreatic peptide YY (PYY)",
                "Pancreatic polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (SCT)",
                "Somatostatin (SST)",
                "Substance P",
                "Uroguanylin",
                "Vasoactive intestinal peptide (VIP)",
                "Xenin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Glucose-dependent insulinotropic polypeptide (GIP)",
            "Vasoactive intestinal peptide (VIP)",
            "Somatostatin (SST)",
            "Motilin (MLN)",
            "Ghrelin (GHRL)",
            "Glucagon-like peptide-1 (GLP-1)",
            "Glucagon-like peptide-2 (GLP-2)",
            "Peptide YY (PYY)",
            "Pancreatic polypeptide (PPY)",
            "Oxyntomodulin (OXM)",
            "Neurotensin (NTS)",
            "Substance P (SP)",
            "Galanin (GAL)",
            "Gastric inhibitory polypeptide (GIP)",
            "Enteroglucagon",
            "Guanylin",
            "Uroguanylin",
            "Neuromedin U (NMU)",
            "Adrenomedullin (ADM)",
            "Calcitonin gene-related peptide (CGRP)",
            "Obestatin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Glucose-dependent insulinotropic polypeptide (GIP)",
                "Vasoactive intestinal peptide (VIP)",
                "Somatostatin (SST)",
                "Motilin (MLN)",
                "Ghrelin (GHRL)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Peptide YY (PYY)",
                "Pancreatic polypeptide (PPY)",
                "Oxyntomodulin (OXM)",
                "Neurotensin (NTS)",
                "Substance P (SP)",
                "Galanin (GAL)",
                "Gastric inhibitory polypeptide (GIP)",
                "Enteroglucagon",
                "Guanylin",
                "Uroguanylin",
                "Neuromedin U (NMU)",
                "Adrenomedullin (ADM)",
                "Calcitonin gene-related peptide (CGRP)",
                "Obestatin"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenomedullin (ADM)",
                "Calcitonin gene-related peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Enteroglucagon",
                "Galanin (GAL)",
                "Gastric inhibitory polypeptide (GIP)",
                "Gastrin (GAS)",
                "Ghrelin (GHRL)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Glucose-dependent insulinotropic polypeptide (GIP)",
                "Guanylin",
                "Motilin (MLN)",
                "Neuromedin U (NMU)",
                "Neurotensin (NTS)",
                "Obestatin",
                "Oxyntomodulin (OXM)",
                "Pancreatic polypeptide (PPY)",
                "Peptide YY (PYY)",
                "Secretin (SCT)",
                "Somatostatin (SST)",
                "Substance P (SP)",
                "Uroguanylin",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SEC)",
            "Glucose-dependent Insulinotropic Polypeptide (GIP)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Motilin (MOT)",
            "Ghrelin (GHRL)",
            "Peptide YY (PYY)",
            "Pancreatic Polypeptide (PP)",
            "Somatostatin (SST)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Neurotensin (NT)",
            "Substance P (SP)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Enteroglucagon",
            "Oxyntomodulin",
            "Uroguanylin",
            "Guanylin",
            "Xenin",
            "Nesfatin-1",
            "Apelin",
            "Obestatin",
            "Amylin",
            "Cholecystokinin-58 (CCK-58)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SEC)",
                "Glucose-dependent Insulinotropic Polypeptide (GIP)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Motilin (MOT)",
                "Ghrelin (GHRL)",
                "Peptide YY (PYY)",
                "Pancreatic Polypeptide (PP)",
                "Somatostatin (SST)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Neurotensin (NT)",
                "Substance P (SP)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Enteroglucagon",
                "Oxyntomodulin",
                "Uroguanylin",
                "Guanylin",
                "Xenin",
                "Nesfatin-1",
                "Apelin",
                "Obestatin",
                "Amylin",
                "Cholecystokinin-58 (CCK-58)"
            ],
            "mismatches": [],
            "true_referents": [
                "Amylin",
                "Apelin",
                "Cholecystokinin (CCK)",
                "Cholecystokinin-58 (CCK-58)",
                "Enteroglucagon",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin (GAS)",
                "Ghrelin (GHRL)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucose-dependent Insulinotropic Polypeptide (GIP)",
                "Guanylin",
                "Motilin (MOT)",
                "Nesfatin-1",
                "Neurotensin (NT)",
                "Obestatin",
                "Oxyntomodulin",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (SEC)",
                "Somatostatin (SST)",
                "Substance P (SP)",
                "Uroguanylin",
                "Vasoactive Intestinal Peptide (VIP)",
                "Xenin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Gastrin (GAS)",
            "Cholecystokinin (CCK)",
            "Secretin (SEC)",
            "Motilin (MOT)",
            "Vasoactive Intestinal Peptide (VIP)",
            "Ghrelin (GHR)",
            "Somatostatin (SST)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Peptide YY (PYY)",
            "Neurotensin (NT)",
            "Substance P (SP)",
            "Calcitonin Gene-related Peptide (CGRP)",
            "Pancreatic Polypeptide (PP)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Enteroglucagon (EG)",
            "Enterochromaffin Cell Serotonin (5-HT)",
            "Histamine (HIS)",
            "Prostaglandins (PGs)",
            "Leukotrienes (LTs)",
            "Nitric Oxide (NO)",
            "Endothelin (ET)",
            "Adenosine (ADO)",
            "Bradykinin (BK)",
            "Substance K (SK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin (GAS)",
                "Cholecystokinin (CCK)",
                "Secretin (SEC)",
                "Motilin (MOT)",
                "Vasoactive Intestinal Peptide (VIP)",
                "Ghrelin (GHR)",
                "Somatostatin (SST)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Peptide YY (PYY)",
                "Neurotensin (NT)",
                "Substance P (SP)",
                "Calcitonin Gene-related Peptide (CGRP)",
                "Pancreatic Polypeptide (PP)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Enteroglucagon (EG)",
                "Enterochromaffin Cell Serotonin (5-HT)",
                "Histamine (HIS)",
                "Prostaglandins (PGs)",
                "Leukotrienes (LTs)",
                "Nitric Oxide (NO)",
                "Endothelin (ET)",
                "Adenosine (ADO)",
                "Bradykinin (BK)",
                "Substance K (SK)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adenosine (ADO)",
                "Bradykinin (BK)",
                "Calcitonin Gene-related Peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Endothelin (ET)",
                "Enterochromaffin Cell Serotonin (5-HT)",
                "Enteroglucagon (EG)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin (GAS)",
                "Ghrelin (GHR)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Histamine (HIS)",
                "Leukotrienes (LTs)",
                "Motilin (MOT)",
                "Neurotensin (NT)",
                "Nitric Oxide (NO)",
                "Pancreatic Polypeptide (PP)",
                "Peptide YY (PYY)",
                "Prostaglandins (PGs)",
                "Secretin (SEC)",
                "Somatostatin (SST)",
                "Substance K (SK)",
                "Substance P (SP)",
                "Vasoactive Intestinal Peptide (VIP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Cholecystokinin (CCK)",
            "Gastrin",
            "Secretin",
            "Motilin",
            "Vasoactive Intestinal Polypeptide (VIP)",
            "Peptide YY (PYY)",
            "Glucagon-like Peptide-1 (GLP-1)",
            "Glucagon",
            "Pancreatic Polypeptide (PP)",
            "Somatostatin",
            "Ghrelin",
            "Insulin-like Peptide (ILP)",
            "Neuropeptide Y (NPY)",
            "Pancreatic Stone Protein (PSP)",
            "Motilin-like Peptide (MLP)",
            "Gastric Inhibitory Polypeptide (GIP)",
            "Enterogastrone",
            "Pancreatic Polypeptide-like Peptide (PPLP)",
            "Cholecystokinin-pancreozymin (CCK-PZ)",
            "Motilin-like Peptide-1 (MLP-1)",
            "Vasoactive Intestinal Polypeptide-like Peptide (VIP-1)",
            "Peptide YY-like Peptide (PYY-1)",
            "Glucagon-like Peptide-1-like Peptide (GLP-1-1)",
            "Neuropeptide Y-like Peptide (NPY-1)",
            "Ghrelin-like Peptide (GHR-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cholecystokinin (CCK)",
                "Gastrin",
                "Secretin",
                "Motilin",
                "Vasoactive Intestinal Polypeptide (VIP)",
                "Peptide YY (PYY)",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon",
                "Pancreatic Polypeptide (PP)",
                "Somatostatin",
                "Ghrelin",
                "Insulin-like Peptide (ILP)",
                "Neuropeptide Y (NPY)",
                "Pancreatic Stone Protein (PSP)",
                "Motilin-like Peptide (MLP)",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Enterogastrone",
                "Pancreatic Polypeptide-like Peptide (PPLP)",
                "Cholecystokinin-pancreozymin (CCK-PZ)",
                "Motilin-like Peptide-1 (MLP-1)",
                "Vasoactive Intestinal Polypeptide-like Peptide (VIP-1)",
                "Peptide YY-like Peptide (PYY-1)",
                "Glucagon-like Peptide-1-like Peptide (GLP-1-1)",
                "Neuropeptide Y-like Peptide (NPY-1)"
            ],
            "mismatches": [
                "Ghrelin-like Peptide (GHR-1)"
            ],
            "true_referents": [
                "Cholecystokinin (CCK)",
                "Cholecystokinin-pancreozymin (CCK-PZ)",
                "Enterogastrone",
                "Gastric Inhibitory Polypeptide (GIP)",
                "Gastrin",
                "Ghrelin",
                "Glucagon",
                "Glucagon-like Peptide-1 (GLP-1)",
                "Glucagon-like Peptide-1-like Peptide (GLP-1-1)",
                "Insulin-like Peptide (ILP)",
                "Motilin",
                "Motilin-like Peptide (MLP)",
                "Motilin-like Peptide-1 (MLP-1)",
                "Neuropeptide Y (NPY)",
                "Neuropeptide Y-like Peptide (NPY-1)",
                "Pancreatic Polypeptide (PP)",
                "Pancreatic Polypeptide-like Peptide (PPLP)",
                "Pancreatic Stone Protein (PSP)",
                "Peptide YY (PYY)",
                "Peptide YY-like Peptide (PYY-1)",
                "Secretin",
                "Somatostatin",
                "Vasoactive Intestinal Polypeptide (VIP)",
                "Vasoactive Intestinal Polypeptide-like Peptide (VIP-1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            "Motilin (MOT)",
            "Galectin-3 (LGALS3)",
            "Gastrin (GAST)",
            "Cholecystokinin (CCK)",
            "Secretin (SCT)",
            "Vasoactive intestinal peptide (VIP)",
            "Neuromedin U (NMU)",
            "Ghrelin (GHRL)",
            "Obestatin (OBEST)",
            "Motilin-related peptide (MLRP)",
            "Pancreatic polypeptide (PP)",
            "Peptide YY (PYY)",
            "Pancreatic peptide YY (PYY3-36)",
            "Glucagon-like peptide-1 (GLP-1)",
            "Glucagon-like peptide-2 (GLP-2)",
            "Gastric inhibitory peptide (GIP)",
            "Somatostatin (SST)",
            "Cortistatin (CST)",
            "Neurotensin (NTS)",
            "Chromogranin A (CHGA)",
            "Pancreastatin (PST)",
            "Adrenomedullin (ADM)",
            "Bombesin (BBS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Motilin (MOT)",
                "Galectin-3 (LGALS3)",
                "Gastrin (GAST)",
                "Cholecystokinin (CCK)",
                "Secretin (SCT)",
                "Vasoactive intestinal peptide (VIP)",
                "Neuromedin U (NMU)",
                "Ghrelin (GHRL)",
                "Obestatin (OBEST)",
                "Motilin-related peptide (MLRP)",
                "Pancreatic polypeptide (PP)",
                "Peptide YY (PYY)",
                "Pancreatic peptide YY (PYY3-36)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Gastric inhibitory peptide (GIP)",
                "Somatostatin (SST)",
                "Cortistatin (CST)",
                "Neurotensin (NTS)",
                "Chromogranin A (CHGA)",
                "Pancreastatin (PST)",
                "Adrenomedullin (ADM)",
                "Bombesin (BBS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenomedullin (ADM)",
                "Bombesin (BBS)",
                "Cholecystokinin (CCK)",
                "Chromogranin A (CHGA)",
                "Cortistatin (CST)",
                "Galectin-3 (LGALS3)",
                "Gastric inhibitory peptide (GIP)",
                "Gastrin (GAST)",
                "Ghrelin (GHRL)",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Motilin (MOT)",
                "Motilin-related peptide (MLRP)",
                "Neuromedin U (NMU)",
                "Neurotensin (NTS)",
                "Obestatin (OBEST)",
                "Pancreastatin (PST)",
                "Pancreatic peptide YY (PYY3-36)",
                "Pancreatic polypeptide (PP)",
                "Peptide YY (PYY)",
                "Secretin (SCT)",
                "Somatostatin (SST)",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "gastrointestinal hormone",
        "domain": "biology",
        "response": [
            {
                "Referent": "Gastrin-releasing peptide (GRP)",
                "Canonical name": "GRP"
            },
            {
                "Referent": "Ghrelin",
                "Canonical name": "GHRL"
            },
            {
                "Referent": "Glucagon-like peptide-1 (GLP-1)",
                "Canonical name": "GLP1"
            },
            {
                "Referent": "Glucagon-like peptide-2 (GLP-2)",
                "Canonical name": "GLP2"
            },
            {
                "Referent": "Glucagon-like peptide-2 (GLP-2)",
                "Canonical name": "GLP2"
            },
            {
                "Referent": "Oxyntomodulin (OXM)",
                "Canonical name": "OXM"
            },
            {
                "Referent": "Peptide YY (PYY)",
                "Canonical name": "PYY"
            },
            {
                "Referent": "Pancreatic polypeptide (PP)",
                "Canonical name": "PPY"
            },
            {
                "Referent": "Pancreatic polypeptide (PP)",
                "Canonical name": "PPY"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Secretin",
                "Canonical name": "SECR"
            },
            {
                "Referent": "Cholecystokinin (CCK)",
                "Canonical name": "CCK"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            },
            {
                "Referent": "Gastric inhibitory peptide (GIP)",
                "Canonical name": "GIP"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gastrin-releasing peptide (GRP)",
                "Ghrelin",
                "Glucagon-like peptide-1 (GLP-1)",
                "Glucagon-like peptide-2 (GLP-2)",
                "Oxyntomodulin (OXM)",
                "Peptide YY (PYY)",
                "Pancreatic polypeptide (PP)",
                "Gastric inhibitory peptide (GIP)",
                "Secretin",
                "Cholecystokinin (CCK)"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Cholecystokinin (CCK)\", \"Canonical name\": \"CCK\"}",
                "{\"Referent\": \"Gastric inhibitory peptide (GIP)\", \"Canonical name\": \"GIP\"}",
                "{\"Referent\": \"Gastrin-releasing peptide (GRP)\", \"Canonical name\": \"GRP\"}",
                "{\"Referent\": \"Ghrelin\", \"Canonical name\": \"GHRL\"}",
                "{\"Referent\": \"Glucagon-like peptide-1 (GLP-1)\", \"Canonical name\": \"GLP1\"}",
                "{\"Referent\": \"Glucagon-like peptide-2 (GLP-2)\", \"Canonical name\": \"GLP2\"}",
                "{\"Referent\": \"Oxyntomodulin (OXM)\", \"Canonical name\": \"OXM\"}",
                "{\"Referent\": \"Pancreatic polypeptide (PP)\", \"Canonical name\": \"PPY\"}",
                "{\"Referent\": \"Peptide YY (PYY)\", \"Canonical name\": \"PYY\"}",
                "{\"Referent\": \"Secretin\", \"Canonical name\": \"SECR\"}"
            ],
            "TP": 10,
            "FP": 0,
            "FN": 0
        }
    }
]