[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Acetyl-Val-Pro-Pro-Gly-Pro (Ac-VPPP)",
            "Tat-Peptide (Tat48-60)",
            "Angiotensin I (Ang I)",
            "Lysine-Aspartate-Proline-Glycine-Proline (KDPGP)",
            "N-Acetyl-Ser-Thr-Lys-Pro-Ile (Ac-STKPI)",
            "N-Acetyl-Pro-Leu-Pro-Pro-Pro (Ac-PLPPP)",
            "N-Acetyl-Pro-Gly-Pro-Pro-Pro (Ac-GPPP)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Pro (Ac-PPPPP)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Trp (Ac-PPPPW)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Tyr (Ac-PPPTY)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Trp (Ac-PPPPW)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Tyr (Ac-PPPTY)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Pro (Ac-PPPPP)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Trp (Ac-PPPPW)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Tyr (Ac-PPPTY)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Pro (Ac-PPPPP)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Trp (Ac-PPPPW)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Tyr (Ac-PPPTY)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Pro (Ac-PPPPP)",
            "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Acetyl-Val-Pro-Pro-Gly-Pro (Ac-VPPP)",
                "Tat-Peptide (Tat48-60)",
                "Angiotensin I (Ang I)",
                "Lysine-Aspartate-Proline-Glycine-Proline (KDPGP)",
                "N-Acetyl-Ser-Thr-Lys-Pro-Ile (Ac-STKPI)",
                "N-Acetyl-Pro-Leu-Pro-Pro-Pro (Ac-PLPPP)",
                "N-Acetyl-Pro-Gly-Pro-Pro-Pro (Ac-GPPP)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Pro (Ac-PPPPP)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Trp (Ac-PPPPW)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Tyr (Ac-PPPTY)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl-Val-Pro-Pro-Gly-Pro (Ac-VPPP)",
                "Angiotensin I (Ang I)",
                "Lysine-Aspartate-Proline-Glycine-Proline (KDPGP)",
                "N-Acetyl-Pro-Gly-Pro-Pro-Pro (Ac-GPPP)",
                "N-Acetyl-Pro-Leu-Pro-Pro-Pro (Ac-PLPPP)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Pro (Ac-PPPPP)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Trp (Ac-PPPPW)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Tyr (Ac-PPPTY)",
                "N-Acetyl-Pro-Pro-Pro-Pro-Val (Ac-PPPPV)",
                "N-Acetyl-Ser-Thr-Lys-Pro-Ile (Ac-STKPI)",
                "Tat-Peptide (Tat48-60)"
            ],
            "TP": 11,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Glutathione (GSH)",
            "Cathelicidin LL-37",
            "Met-enkephalin",
            "Leu-enkephalin",
            "Vasopressin (also known as Arginine Vasopressin, AVP)",
            "Oxytocin",
            "Angiotensin II",
            "Thymosin alpha-1",
            "Growth Hormone-Releasing Peptide-6 (GHRP-6)",
            "Corticotropin-releasing hormone (CRH)",
            "Pentapeptide repeat protein (PPR)",
            "Pentapeptide repeat proteins in bacteria (PilT N-terminus, PNT)",
            "Pentapeptide repeat proteins in fungi (Fungal PPR proteins)",
            "Pentapeptide repeat proteins in plants (PPR proteins)",
            "Pentapeptide repeat proteins in apicomplexa (Apicomplexan PPR proteins)",
            "Pentapeptide repeat proteins in trypanosomatids (Trypanosomatid PPR proteins)",
            "Pentapeptide repeat proteins in nematodes (Nematode PPR proteins)",
            "Pentapeptide repeat proteins in vertebrates (Vertebrate PPR proteins)",
            "Cyclosporin A (immunosuppressive agent)",
            "Cyclophilin (binding partner of Cyclosporin A)",
            "Cyclosporin A binding domain",
            "Pentapeptide repeat protein FAM120A",
            "Pentapeptide repeat protein FAM120C",
            "Pentapeptide repeat protein FAM120B"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glutathione (GSH)",
                "Cathelicidin LL-37",
                "Met-enkephalin",
                "Leu-enkephalin",
                "Vasopressin (also known as Arginine Vasopressin, AVP)",
                "Oxytocin",
                "Angiotensin II",
                "Thymosin alpha-1",
                "Growth Hormone-Releasing Peptide-6 (GHRP-6)",
                "Corticotropin-releasing hormone (CRH)",
                "Pentapeptide repeat protein (PPR)",
                "Pentapeptide repeat proteins in bacteria (PilT N-terminus, PNT)",
                "Pentapeptide repeat proteins in fungi (Fungal PPR proteins)",
                "Pentapeptide repeat proteins in plants (PPR proteins)",
                "Pentapeptide repeat proteins in apicomplexa (Apicomplexan PPR proteins)",
                "Pentapeptide repeat proteins in trypanosomatids (Trypanosomatid PPR proteins)",
                "Pentapeptide repeat proteins in nematodes (Nematode PPR proteins)",
                "Pentapeptide repeat proteins in vertebrates (Vertebrate PPR proteins)",
                "Cyclosporin A (immunosuppressive agent)",
                "Cyclophilin (binding partner of Cyclosporin A)",
                "Cyclosporin A binding domain",
                "Pentapeptide repeat protein FAM120A",
                "Pentapeptide repeat protein FAM120C",
                "Pentapeptide repeat protein FAM120B"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin II",
                "Cathelicidin LL-37",
                "Corticotropin-releasing hormone (CRH)",
                "Cyclophilin (binding partner of Cyclosporin A)",
                "Cyclosporin A (immunosuppressive agent)",
                "Cyclosporin A binding domain",
                "Glutathione (GSH)",
                "Growth Hormone-Releasing Peptide-6 (GHRP-6)",
                "Leu-enkephalin",
                "Met-enkephalin",
                "Oxytocin",
                "Pentapeptide repeat protein (PPR)",
                "Pentapeptide repeat protein FAM120A",
                "Pentapeptide repeat protein FAM120B",
                "Pentapeptide repeat protein FAM120C",
                "Pentapeptide repeat proteins in apicomplexa (Apicomplexan PPR proteins)",
                "Pentapeptide repeat proteins in bacteria (PilT N-terminus, PNT)",
                "Pentapeptide repeat proteins in fungi (Fungal PPR proteins)",
                "Pentapeptide repeat proteins in nematodes (Nematode PPR proteins)",
                "Pentapeptide repeat proteins in plants (PPR proteins)",
                "Pentapeptide repeat proteins in trypanosomatids (Trypanosomatid PPR proteins)",
                "Pentapeptide repeat proteins in vertebrates (Vertebrate PPR proteins)",
                "Thymosin alpha-1",
                "Vasopressin (also known as Arginine Vasopressin, AVP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Oxytocin (CYT)",
            "Leu-enkephalin",
            "Met-enkephalin",
            "Angiotensin II (AngII)",
            "Angiotensin III (AngIII)",
            "Angiotensin IV (AngIV)",
            "Des-enkephalin",
            "Dynorphin A (Dyn A)",
            "Dynorphin B (Dyn B)",
            "Neuropeptide Y (NPY)",
            "Substance P",
            "Neurotensin",
            "Bradykinin",
            "Kallidin",
            "Vasopressin",
            "Endomorphin-1",
            "Endomorphin-2",
            "Adrenocorticotropic hormone (ACTH)",
            "Thyrotropin-releasing hormone (TRH)",
            "Corticotropin-releasing hormone (CRH)",
            "Gastrin",
            "Cholecystokinin (CCK)",
            "Secretin",
            "Motilin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxytocin (CYT)",
                "Leu-enkephalin",
                "Met-enkephalin",
                "Angiotensin II (AngII)",
                "Angiotensin III (AngIII)",
                "Angiotensin IV (AngIV)",
                "Des-enkephalin",
                "Dynorphin A (Dyn A)",
                "Dynorphin B (Dyn B)",
                "Neuropeptide Y (NPY)",
                "Substance P",
                "Neurotensin",
                "Bradykinin",
                "Kallidin",
                "Vasopressin",
                "Endomorphin-1",
                "Endomorphin-2",
                "Adrenocorticotropic hormone (ACTH)",
                "Thyrotropin-releasing hormone (TRH)",
                "Corticotropin-releasing hormone (CRH)",
                "Gastrin",
                "Cholecystokinin (CCK)",
                "Secretin",
                "Motilin"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocorticotropic hormone (ACTH)",
                "Angiotensin II (AngII)",
                "Angiotensin III (AngIII)",
                "Angiotensin IV (AngIV)",
                "Bradykinin",
                "Cholecystokinin (CCK)",
                "Corticotropin-releasing hormone (CRH)",
                "Des-enkephalin",
                "Dynorphin A (Dyn A)",
                "Dynorphin B (Dyn B)",
                "Endomorphin-1",
                "Endomorphin-2",
                "Gastrin",
                "Kallidin",
                "Leu-enkephalin",
                "Met-enkephalin",
                "Motilin",
                "Neuropeptide Y (NPY)",
                "Neurotensin",
                "Oxytocin (CYT)",
                "Secretin",
                "Substance P",
                "Thyrotropin-releasing hormone (TRH)",
                "Vasopressin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Val-Gly-Lys-Glu-Asp (VGEKD)",
            "Leu-Pro-Arg-Gly-Asn (LPRGN)",
            "Tyr-Arg-Gly-Asp-Phe (YRGDF)",
            "Ser-Lys-Val-Asp-Pro (SKVDP)",
            "Ala-Pro-Gly-Lys-Pro (APGKP)",
            "Gly-Arg-Pro-Pro-Gly (GRPPG)",
            "Lys-Thr-Lys-Lys-Glu (KTKKE)",
            "Asp-Ala-Lys-Lys-Arg (DAKKR)",
            "Met-Lys-Val-Lys-Leu (MKVKL)",
            "Phe-His-Leu-Pro-Gly (FHLPG)",
            "Pro-Leu-Gly-Pro-Arg (PLGPR)",
            "Arg-Pro-Gly-Pro-Gly (RPGPG)",
            "Glu-Lys-Tyr-Pro-Ala (EKYPA)",
            "His-Lys-Pro-Val-Gly (HKPVG)",
            "Lys-Ala-Glu-Gly-Arg (KAEGR)",
            "Gln-Pro-Arg-Gly-Gln (QPRGQ)",
            "Thr-Pro-Lys-Ser-Leu (TPKSL)",
            "Gly-Gly-Gly-Gly-His (GGGGH)",
            "Leu-Glu-Val-Glu-Lys (LEVEK)",
            "Arg-Gly-Asp-Ala-Asp (RGDAD)",
            "Phe-Gly-Gly-Arg-Lys (FGGRK)",
            "Pro-Gly-Lys-Pro-Gly (PGKPG)",
            "Ser-Pro-Lys-Lys-Pro (SPKKP)",
            "Val-Pro-Lys-Pro-Val (VPKPV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Val-Gly-Lys-Glu-Asp (VGEKD)",
                "Leu-Pro-Arg-Gly-Asn (LPRGN)",
                "Tyr-Arg-Gly-Asp-Phe (YRGDF)",
                "Ser-Lys-Val-Asp-Pro (SKVDP)",
                "Ala-Pro-Gly-Lys-Pro (APGKP)",
                "Gly-Arg-Pro-Pro-Gly (GRPPG)",
                "Lys-Thr-Lys-Lys-Glu (KTKKE)",
                "Asp-Ala-Lys-Lys-Arg (DAKKR)",
                "Met-Lys-Val-Lys-Leu (MKVKL)",
                "Phe-His-Leu-Pro-Gly (FHLPG)",
                "Pro-Leu-Gly-Pro-Arg (PLGPR)",
                "Arg-Pro-Gly-Pro-Gly (RPGPG)",
                "Glu-Lys-Tyr-Pro-Ala (EKYPA)",
                "His-Lys-Pro-Val-Gly (HKPVG)",
                "Lys-Ala-Glu-Gly-Arg (KAEGR)",
                "Gln-Pro-Arg-Gly-Gln (QPRGQ)",
                "Thr-Pro-Lys-Ser-Leu (TPKSL)",
                "Gly-Gly-Gly-Gly-His (GGGGH)",
                "Leu-Glu-Val-Glu-Lys (LEVEK)",
                "Arg-Gly-Asp-Ala-Asp (RGDAD)",
                "Phe-Gly-Gly-Arg-Lys (FGGRK)",
                "Pro-Gly-Lys-Pro-Gly (PGKPG)",
                "Ser-Pro-Lys-Lys-Pro (SPKKP)",
                "Val-Pro-Lys-Pro-Val (VPKPV)"
            ],
            "mismatches": [],
            "true_referents": [
                "Ala-Pro-Gly-Lys-Pro (APGKP)",
                "Arg-Gly-Asp-Ala-Asp (RGDAD)",
                "Arg-Pro-Gly-Pro-Gly (RPGPG)",
                "Asp-Ala-Lys-Lys-Arg (DAKKR)",
                "Gln-Pro-Arg-Gly-Gln (QPRGQ)",
                "Glu-Lys-Tyr-Pro-Ala (EKYPA)",
                "Gly-Arg-Pro-Pro-Gly (GRPPG)",
                "Gly-Gly-Gly-Gly-His (GGGGH)",
                "His-Lys-Pro-Val-Gly (HKPVG)",
                "Leu-Glu-Val-Glu-Lys (LEVEK)",
                "Leu-Pro-Arg-Gly-Asn (LPRGN)",
                "Lys-Ala-Glu-Gly-Arg (KAEGR)",
                "Lys-Thr-Lys-Lys-Glu (KTKKE)",
                "Met-Lys-Val-Lys-Leu (MKVKL)",
                "Phe-Gly-Gly-Arg-Lys (FGGRK)",
                "Phe-His-Leu-Pro-Gly (FHLPG)",
                "Pro-Gly-Lys-Pro-Gly (PGKPG)",
                "Pro-Leu-Gly-Pro-Arg (PLGPR)",
                "Ser-Lys-Val-Asp-Pro (SKVDP)",
                "Ser-Pro-Lys-Lys-Pro (SPKKP)",
                "Thr-Pro-Lys-Ser-Leu (TPKSL)",
                "Tyr-Arg-Gly-Asp-Phe (YRGDF)",
                "Val-Gly-Lys-Glu-Asp (VGEKD)",
                "Val-Pro-Lys-Pro-Val (VPKPV)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Leu-enkephalin (YGGFL)",
            "Met-enkephalin (YGGFM)",
            "Angiotensin I (DRVYI)",
            "Thymopentin (RKDVY)",
            "Pentagastrin (Boc-Trp-Met-Asp-Phe-NH2)",
            "Dermorphin (YAFGY)",
            "Deltorphin (YAGFL)",
            "Kassinin (APFVG)",
            "Neurotensin (ELYEN)",
            "Bradykinin (RPPGF)",
            "Opiorphin (QRFYS)",
            "Corticotropin-releasing factor (CRF) fragment (RMPIF)",
            "Peptide YY (PYY) fragment (YPIQL)",
            "Endomorphin-1 (YPWF)",
            "Endomorphin-2 (YPFF)",
            "Neuropeptide FF (FLFQP)",
            "Neuropeptide Y (NPY) fragment (YPSKPDNPGEDAPAEDMARYYSALRHYINLITRQRY)",
            "Gastrin (GWMDF)",
            "Substance P (RPKPQQFFGLM)",
            "Thymosin beta-4 fragment (SDKPD)",
            "Neuropeptide B (NPB) fragment (WYKPA)",
            "Neuropeptide W (NPW) fragment (WYKHV)",
            "Galanin (GAL) fragment (GWTLNSAGYLLGPHAIDNHRS)",
            "Neuropeptide S (NPS) fragment (SFRNGVGTGMKKTSFQRAKS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Leu-enkephalin (YGGFL)",
                "Met-enkephalin (YGGFM)",
                "Angiotensin I (DRVYI)",
                "Thymopentin (RKDVY)",
                "Pentagastrin (Boc-Trp-Met-Asp-Phe-NH2)",
                "Dermorphin (YAFGY)",
                "Deltorphin (YAGFL)",
                "Kassinin (APFVG)",
                "Neurotensin (ELYEN)",
                "Bradykinin (RPPGF)",
                "Opiorphin (QRFYS)",
                "Corticotropin-releasing factor (CRF) fragment (RMPIF)",
                "Peptide YY (PYY) fragment (YPIQL)",
                "Endomorphin-1 (YPWF)",
                "Endomorphin-2 (YPFF)",
                "Neuropeptide FF (FLFQP)",
                "Neuropeptide Y (NPY) fragment (YPSKPDNPGEDAPAEDMARYYSALRHYINLITRQRY)",
                "Gastrin (GWMDF)",
                "Substance P (RPKPQQFFGLM)",
                "Thymosin beta-4 fragment (SDKPD)",
                "Neuropeptide B (NPB) fragment (WYKPA)",
                "Neuropeptide W (NPW) fragment (WYKHV)",
                "Galanin (GAL) fragment (GWTLNSAGYLLGPHAIDNHRS)",
                "Neuropeptide S (NPS) fragment (SFRNGVGTGMKKTSFQRAKS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin I (DRVYI)",
                "Bradykinin (RPPGF)",
                "Corticotropin-releasing factor (CRF) fragment (RMPIF)",
                "Deltorphin (YAGFL)",
                "Dermorphin (YAFGY)",
                "Endomorphin-1 (YPWF)",
                "Endomorphin-2 (YPFF)",
                "Galanin (GAL) fragment (GWTLNSAGYLLGPHAIDNHRS)",
                "Gastrin (GWMDF)",
                "Kassinin (APFVG)",
                "Leu-enkephalin (YGGFL)",
                "Met-enkephalin (YGGFM)",
                "Neuropeptide B (NPB) fragment (WYKPA)",
                "Neuropeptide FF (FLFQP)",
                "Neuropeptide S (NPS) fragment (SFRNGVGTGMKKTSFQRAKS)",
                "Neuropeptide W (NPW) fragment (WYKHV)",
                "Neuropeptide Y (NPY) fragment (YPSKPDNPGEDAPAEDMARYYSALRHYINLITRQRY)",
                "Neurotensin (ELYEN)",
                "Opiorphin (QRFYS)",
                "Pentagastrin (Boc-Trp-Met-Asp-Phe-NH2)",
                "Peptide YY (PYY) fragment (YPIQL)",
                "Substance P (RPKPQQFFGLM)",
                "Thymopentin (RKDVY)",
                "Thymosin beta-4 fragment (SDKPD)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Oxytocin (OT)",
            "Vasopressin (AVP)",
            "Neuropeptide Y (NPY)",
            "Bradykinin (BK)",
            "Substance P (SP)",
            "Angiotensin II (Ang II)",
            "Cholecystokinin (CCK)",
            "Dynorphin A (Dyn A)",
            "Enkephalin (ENK)",
            "Calcitonin Gene-Related Peptide (CGRP)",
            "Somatostatin (SST)",
            "Insulin (INS)",
            "Glucagon (GLU)",
            "Thymopoietin (TMP)",
            "Neurotensin (NT)",
            "Bombesin (BBS)",
            "Gastrin (GAS)",
            "Corticotropin-Releasing Factor (CRF)",
            "Atrial Natriuretic Peptide (ANP)",
            "Endothelin-1 (ET-1)",
            "Follistatin (FST)",
            "Pro-opiomelanocortin (POMC)",
            "Corticotropin (ACTH)",
            "Luteinizing Hormone-Releasing Hormone (LHRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Oxytocin (OT)",
                "Vasopressin (AVP)",
                "Neuropeptide Y (NPY)",
                "Bradykinin (BK)",
                "Substance P (SP)",
                "Angiotensin II (Ang II)",
                "Cholecystokinin (CCK)",
                "Dynorphin A (Dyn A)",
                "Enkephalin (ENK)",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Somatostatin (SST)",
                "Insulin (INS)",
                "Glucagon (GLU)",
                "Thymopoietin (TMP)",
                "Neurotensin (NT)",
                "Bombesin (BBS)",
                "Gastrin (GAS)",
                "Corticotropin-Releasing Factor (CRF)",
                "Atrial Natriuretic Peptide (ANP)",
                "Endothelin-1 (ET-1)",
                "Follistatin (FST)",
                "Pro-opiomelanocortin (POMC)",
                "Corticotropin (ACTH)",
                "Luteinizing Hormone-Releasing Hormone (LHRH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin II (Ang II)",
                "Atrial Natriuretic Peptide (ANP)",
                "Bombesin (BBS)",
                "Bradykinin (BK)",
                "Calcitonin Gene-Related Peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Corticotropin (ACTH)",
                "Corticotropin-Releasing Factor (CRF)",
                "Dynorphin A (Dyn A)",
                "Endothelin-1 (ET-1)",
                "Enkephalin (ENK)",
                "Follistatin (FST)",
                "Gastrin (GAS)",
                "Glucagon (GLU)",
                "Insulin (INS)",
                "Luteinizing Hormone-Releasing Hormone (LHRH)",
                "Neuropeptide Y (NPY)",
                "Neurotensin (NT)",
                "Oxytocin (OT)",
                "Pro-opiomelanocortin (POMC)",
                "Somatostatin (SST)",
                "Substance P (SP)",
                "Thymopoietin (TMP)",
                "Vasopressin (AVP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Enkephalin (ENK)",
            "Tuftsin (TFT)",
            "Angiotensin I (ANG-I)",
            "Bradykinin (BK)",
            "Casomorphin (CSM)",
            "Endomorphin (EDM)",
            "Neurokinin A (NKA)",
            "Neuropeptide Y (NPY)",
            "Oxytocin (OT)",
            "Peptide YY (PYY)",
            "Substance P (SP)",
            "Vasopressin (VP)",
            "Thymopentin (TP5)",
            "Leucine Enkephalin (LENK)",
            "Methionine Enkephalin (MENK)",
            "Pentagastrin (PG)",
            "Thymopoietin (TP)",
            "Thymostimulin (TS)",
            "Thymosin Alpha 1 (TA1)",
            "Thymosin Beta 4 (TB4)",
            "Thymosin Beta 10 (TB10)",
            "Thymosin Beta 15 (TB15)",
            "Thymulin (TH)",
            "Thymosin Alpha 11 (TA11)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Enkephalin (ENK)",
                "Tuftsin (TFT)",
                "Angiotensin I (ANG-I)",
                "Bradykinin (BK)",
                "Casomorphin (CSM)",
                "Endomorphin (EDM)",
                "Neurokinin A (NKA)",
                "Neuropeptide Y (NPY)",
                "Oxytocin (OT)",
                "Peptide YY (PYY)",
                "Substance P (SP)",
                "Vasopressin (VP)",
                "Thymopentin (TP5)",
                "Leucine Enkephalin (LENK)",
                "Methionine Enkephalin (MENK)",
                "Pentagastrin (PG)",
                "Thymopoietin (TP)",
                "Thymostimulin (TS)",
                "Thymosin Alpha 1 (TA1)",
                "Thymosin Beta 4 (TB4)",
                "Thymosin Beta 10 (TB10)",
                "Thymosin Beta 15 (TB15)",
                "Thymulin (TH)",
                "Thymosin Alpha 11 (TA11)"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin I (ANG-I)",
                "Bradykinin (BK)",
                "Casomorphin (CSM)",
                "Endomorphin (EDM)",
                "Enkephalin (ENK)",
                "Leucine Enkephalin (LENK)",
                "Methionine Enkephalin (MENK)",
                "Neurokinin A (NKA)",
                "Neuropeptide Y (NPY)",
                "Oxytocin (OT)",
                "Pentagastrin (PG)",
                "Peptide YY (PYY)",
                "Substance P (SP)",
                "Thymopentin (TP5)",
                "Thymopoietin (TP)",
                "Thymosin Alpha 1 (TA1)",
                "Thymosin Alpha 11 (TA11)",
                "Thymosin Beta 10 (TB10)",
                "Thymosin Beta 15 (TB15)",
                "Thymosin Beta 4 (TB4)",
                "Thymostimulin (TS)",
                "Thymulin (TH)",
                "Tuftsin (TFT)",
                "Vasopressin (VP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Angiotensin I (Ang I)",
            "Angiotensin II (Ang II)",
            "Oxytocin",
            "Vasopressin",
            "Gonadotropin-releasing hormone (GnRH)",
            "Thyrotropin-releasing hormone (TRH)",
            "Substance P",
            "Enkephalin",
            "Endorphin",
            "Bradykinin",
            "Neurotensin",
            "Leu-enkephalin",
            "Met-enkephalin",
            "Leu-enkephalinamide",
            "Met-enkephalinamide",
            "Leu-enkephalin-Arg6",
            "Met-enkephalin-Arg6",
            "Leu-enkephalin-Arg6-Gly7-Leu8",
            "Met-enkephalin-Arg6-Gly7-Leu8",
            "Leu-enkephalin-Arg6-Phe7",
            "Met-enkephalin-Arg6-Phe7",
            "Glycyl-L-histidyl-L-lysine (GHK)",
            "Glycyl-L-histidyl-L-tryptophan (GHW)",
            "Glycyl-L-histidyl-L-phenylalanine (GHP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Angiotensin I (Ang I)",
                "Angiotensin II (Ang II)",
                "Oxytocin",
                "Vasopressin",
                "Gonadotropin-releasing hormone (GnRH)",
                "Thyrotropin-releasing hormone (TRH)",
                "Substance P",
                "Enkephalin",
                "Endorphin",
                "Bradykinin",
                "Neurotensin",
                "Leu-enkephalin",
                "Met-enkephalin",
                "Leu-enkephalinamide",
                "Met-enkephalinamide",
                "Leu-enkephalin-Arg6",
                "Met-enkephalin-Arg6",
                "Leu-enkephalin-Arg6-Gly7-Leu8",
                "Met-enkephalin-Arg6-Gly7-Leu8",
                "Leu-enkephalin-Arg6-Phe7",
                "Met-enkephalin-Arg6-Phe7",
                "Glycyl-L-histidyl-L-lysine (GHK)",
                "Glycyl-L-histidyl-L-tryptophan (GHW)",
                "Glycyl-L-histidyl-L-phenylalanine (GHP)"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin I (Ang I)",
                "Angiotensin II (Ang II)",
                "Bradykinin",
                "Endorphin",
                "Enkephalin",
                "Glycyl-L-histidyl-L-lysine (GHK)",
                "Glycyl-L-histidyl-L-phenylalanine (GHP)",
                "Glycyl-L-histidyl-L-tryptophan (GHW)",
                "Gonadotropin-releasing hormone (GnRH)",
                "Leu-enkephalin",
                "Leu-enkephalin-Arg6",
                "Leu-enkephalin-Arg6-Gly7-Leu8",
                "Leu-enkephalin-Arg6-Phe7",
                "Leu-enkephalinamide",
                "Met-enkephalin",
                "Met-enkephalin-Arg6",
                "Met-enkephalin-Arg6-Gly7-Leu8",
                "Met-enkephalin-Arg6-Phe7",
                "Met-enkephalinamide",
                "Neurotensin",
                "Oxytocin",
                "Substance P",
                "Thyrotropin-releasing hormone (TRH)",
                "Vasopressin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Leu-enkephalin (LE)",
            "Met-enkephalin (ME)",
            "Thymopentin (TP5)",
            "KTTKS",
            "Acetyl KTTKS",
            "GHRP-5",
            "Arg-Lys-Asp-Val-Tyr",
            "Ser-Gly-Pro-Leu-Glu",
            "Lys-Thr-Thr-Lys-Ser",
            "Gly-Gly-Phe-Met",
            "Tyr-Gly-Gly-Phe-Leu",
            "Asp-Gly-Phe-Phe-Tyr",
            "Gln-Lys-Asn-Val-Tyr",
            "Ala-Pro-Gly-Lys-Leu",
            "Pro-Glu-Val-Pro-Thr",
            "His-Ser-Arg-Lys-Tyr",
            "Asp-Arg-Pro-Gly-Leu",
            "Phe-Ala-Gly-Ser-Thr",
            "Thr-Ala-Leu-Glu-Gly",
            "Gly-Lys-Arg-Arg-Glu",
            "Ser-Thr-Lys-Val-Gly",
            "Lys-Val-Ala-Gly-Thr",
            "Gln-Val-Asp-Ser-Leu",
            "Asn-Gly-Phe-Pro-Tyr"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Leu-enkephalin (LE)",
                "Met-enkephalin (ME)",
                "Thymopentin (TP5)",
                "KTTKS",
                "Acetyl KTTKS",
                "GHRP-5",
                "Arg-Lys-Asp-Val-Tyr",
                "Ser-Gly-Pro-Leu-Glu",
                "Lys-Thr-Thr-Lys-Ser",
                "Gly-Gly-Phe-Met",
                "Tyr-Gly-Gly-Phe-Leu",
                "Asp-Gly-Phe-Phe-Tyr",
                "Gln-Lys-Asn-Val-Tyr",
                "Ala-Pro-Gly-Lys-Leu",
                "Pro-Glu-Val-Pro-Thr",
                "His-Ser-Arg-Lys-Tyr",
                "Asp-Arg-Pro-Gly-Leu",
                "Phe-Ala-Gly-Ser-Thr",
                "Thr-Ala-Leu-Glu-Gly",
                "Gly-Lys-Arg-Arg-Glu",
                "Ser-Thr-Lys-Val-Gly",
                "Lys-Val-Ala-Gly-Thr",
                "Gln-Val-Asp-Ser-Leu",
                "Asn-Gly-Phe-Pro-Tyr"
            ],
            "mismatches": [],
            "true_referents": [
                "Acetyl KTTKS",
                "Ala-Pro-Gly-Lys-Leu",
                "Arg-Lys-Asp-Val-Tyr",
                "Asn-Gly-Phe-Pro-Tyr",
                "Asp-Arg-Pro-Gly-Leu",
                "Asp-Gly-Phe-Phe-Tyr",
                "GHRP-5",
                "Gln-Lys-Asn-Val-Tyr",
                "Gln-Val-Asp-Ser-Leu",
                "Gly-Gly-Phe-Met",
                "Gly-Lys-Arg-Arg-Glu",
                "His-Ser-Arg-Lys-Tyr",
                "KTTKS",
                "Leu-enkephalin (LE)",
                "Lys-Thr-Thr-Lys-Ser",
                "Lys-Val-Ala-Gly-Thr",
                "Met-enkephalin (ME)",
                "Phe-Ala-Gly-Ser-Thr",
                "Pro-Glu-Val-Pro-Thr",
                "Ser-Gly-Pro-Leu-Glu",
                "Ser-Thr-Lys-Val-Gly",
                "Thr-Ala-Leu-Glu-Gly",
                "Thymopentin (TP5)",
                "Tyr-Gly-Gly-Phe-Leu"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Thymopentin (TP5)",
            "Enkephalin",
            "Argireline (acetyl hexapeptide-3)",
            "Leuprorelin",
            "Goserelin",
            "Buserelin",
            "Histrelin",
            "Nafarelin",
            "Triptorelin",
            "Deslorelin",
            "Abarelix",
            "Cetrorelix",
            "Ganirelix",
            "Degarelix",
            "Eledoisin",
            "Substance P",
            "Angiotensin II",
            "Bradykinin",
            "Oxytocin",
            "Vasopressin",
            "Melanocyte-stimulating hormone (\u03b1-MSH)",
            "Thyrotropin-releasing hormone (TRH)",
            "Kyotorphin",
            "Endomorphin-1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Thymopentin (TP5)",
                "Enkephalin",
                "Argireline (acetyl hexapeptide-3)",
                "Leuprorelin",
                "Goserelin",
                "Buserelin",
                "Histrelin",
                "Nafarelin",
                "Triptorelin",
                "Deslorelin",
                "Abarelix",
                "Cetrorelix",
                "Ganirelix",
                "Degarelix",
                "Eledoisin",
                "Substance P",
                "Angiotensin II",
                "Bradykinin",
                "Oxytocin",
                "Vasopressin",
                "Melanocyte-stimulating hormone (\u03b1-MSH)",
                "Thyrotropin-releasing hormone (TRH)",
                "Kyotorphin",
                "Endomorphin-1"
            ],
            "mismatches": [],
            "true_referents": [
                "Abarelix",
                "Angiotensin II",
                "Argireline (acetyl hexapeptide-3)",
                "Bradykinin",
                "Buserelin",
                "Cetrorelix",
                "Degarelix",
                "Deslorelin",
                "Eledoisin",
                "Endomorphin-1",
                "Enkephalin",
                "Ganirelix",
                "Goserelin",
                "Histrelin",
                "Kyotorphin",
                "Leuprorelin",
                "Melanocyte-stimulating hormone (\u03b1-MSH)",
                "Nafarelin",
                "Oxytocin",
                "Substance P",
                "Thymopentin (TP5)",
                "Thyrotropin-releasing hormone (TRH)",
                "Triptorelin",
                "Vasopressin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Leucine enkephalin (YGGFL)",
            "Methionine enkephalin (YGGFM)",
            "Thymopentin (RKDVY)",
            "Valinomycin (Val4-Hyi)",
            "Cilengitide (c(RGDf(NMe)V))",
            "Eptifibatide (Integrilin)",
            "Leuprolide (Lupron)",
            "Somatostatin (AGCKNFFWKTFTSC)",
            "Pentagastrin (AWMDF)",
            "Phalloidin (C35H48N8O11S)",
            "\u03b1-Conotoxin GI (ECCNPACGRHYSC)",
            "Contryphan-Sm (GCOWEPWC)",
            "Dolastatin 10 (C47H68N6O11S)",
            "Chlamydocin (Cyclo(Ala-Aib-Phe-Aib-Aib))",
            "Tuftsin (TKPR)",
            "Rigin (RIGPK)",
            "Bradykinin (RPPGFSPFR)",
            "Angiotensin II (DRVYIHPF)",
            "Oxytocin (CYIQNCPLG)",
            "Vasopressin (CYFQNCPRG)",
            "Opiorphin (QRFSR)",
            "Glutathione (\u03b3-ECG)",
            "Neuromedin U-8 (YFLFRPRN)",
            "Endothelin-1 (CSCSSLMDKECVYFCHLDIIW)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Leucine enkephalin (YGGFL)",
                "Methionine enkephalin (YGGFM)",
                "Thymopentin (RKDVY)",
                "Valinomycin (Val4-Hyi)",
                "Cilengitide (c(RGDf(NMe)V))",
                "Eptifibatide (Integrilin)",
                "Leuprolide (Lupron)",
                "Somatostatin (AGCKNFFWKTFTSC)",
                "Pentagastrin (AWMDF)",
                "Phalloidin (C35H48N8O11S)",
                "\u03b1-Conotoxin GI (ECCNPACGRHYSC)",
                "Contryphan-Sm (GCOWEPWC)",
                "Dolastatin 10 (C47H68N6O11S)",
                "Chlamydocin (Cyclo(Ala-Aib-Phe-Aib-Aib))",
                "Tuftsin (TKPR)",
                "Rigin (RIGPK)",
                "Bradykinin (RPPGFSPFR)",
                "Angiotensin II (DRVYIHPF)",
                "Oxytocin (CYIQNCPLG)",
                "Vasopressin (CYFQNCPRG)",
                "Opiorphin (QRFSR)",
                "Glutathione (\u03b3-ECG)",
                "Neuromedin U-8 (YFLFRPRN)",
                "Endothelin-1 (CSCSSLMDKECVYFCHLDIIW)"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin II (DRVYIHPF)",
                "Bradykinin (RPPGFSPFR)",
                "Chlamydocin (Cyclo(Ala-Aib-Phe-Aib-Aib))",
                "Cilengitide (c(RGDf(NMe)V))",
                "Contryphan-Sm (GCOWEPWC)",
                "Dolastatin 10 (C47H68N6O11S)",
                "Endothelin-1 (CSCSSLMDKECVYFCHLDIIW)",
                "Eptifibatide (Integrilin)",
                "Glutathione (\u03b3-ECG)",
                "Leucine enkephalin (YGGFL)",
                "Leuprolide (Lupron)",
                "Methionine enkephalin (YGGFM)",
                "Neuromedin U-8 (YFLFRPRN)",
                "Opiorphin (QRFSR)",
                "Oxytocin (CYIQNCPLG)",
                "Pentagastrin (AWMDF)",
                "Phalloidin (C35H48N8O11S)",
                "Rigin (RIGPK)",
                "Somatostatin (AGCKNFFWKTFTSC)",
                "Thymopentin (RKDVY)",
                "Tuftsin (TKPR)",
                "Valinomycin (Val4-Hyi)",
                "Vasopressin (CYFQNCPRG)",
                "\u03b1-Conotoxin GI (ECCNPACGRHYSC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Leucine-Enkephalin (Leu-Enkephalin)",
            "Methionine-Enkephalin (Met-Enkephalin)",
            "Endomorphin-1 (EM-1)",
            "Endomorphin-2 (EM-2)",
            "Deltorphin I",
            "Deltorphin II",
            "Dermorphin",
            "Kyotorphin (L-Arg-L-Tyr-L-Arg-L-Phe-L-Met-NH2)",
            "Casomorphin",
            "Sodefrin",
            "Melanotropin Release Inhibiting Factor (MIF-1)",
            "Neuropeptide FF (NPFF)",
            "Neuropeptide AF (NPAF)",
            "Neuropeptide SF (NPSF)",
            "Orexin A (Hypocretin-1)",
            "Orexin B (Hypocretin-2)",
            "Ghrelin",
            "Neurotensin",
            "Substance P",
            "Bradykinin",
            "Angiotensin I",
            "Angiotensin II",
            "Renin Substrate",
            "Kallidin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Leucine-Enkephalin (Leu-Enkephalin)",
                "Methionine-Enkephalin (Met-Enkephalin)",
                "Endomorphin-1 (EM-1)",
                "Endomorphin-2 (EM-2)",
                "Deltorphin I",
                "Deltorphin II",
                "Dermorphin",
                "Kyotorphin (L-Arg-L-Tyr-L-Arg-L-Phe-L-Met-NH2)",
                "Casomorphin",
                "Sodefrin",
                "Melanotropin Release Inhibiting Factor (MIF-1)",
                "Neuropeptide FF (NPFF)",
                "Neuropeptide AF (NPAF)",
                "Neuropeptide SF (NPSF)",
                "Orexin A (Hypocretin-1)",
                "Orexin B (Hypocretin-2)",
                "Ghrelin",
                "Neurotensin",
                "Substance P",
                "Bradykinin",
                "Angiotensin I",
                "Angiotensin II",
                "Renin Substrate",
                "Kallidin"
            ],
            "mismatches": [],
            "true_referents": [
                "Angiotensin I",
                "Angiotensin II",
                "Bradykinin",
                "Casomorphin",
                "Deltorphin I",
                "Deltorphin II",
                "Dermorphin",
                "Endomorphin-1 (EM-1)",
                "Endomorphin-2 (EM-2)",
                "Ghrelin",
                "Kallidin",
                "Kyotorphin (L-Arg-L-Tyr-L-Arg-L-Phe-L-Met-NH2)",
                "Leucine-Enkephalin (Leu-Enkephalin)",
                "Melanotropin Release Inhibiting Factor (MIF-1)",
                "Methionine-Enkephalin (Met-Enkephalin)",
                "Neuropeptide AF (NPAF)",
                "Neuropeptide FF (NPFF)",
                "Neuropeptide SF (NPSF)",
                "Neurotensin",
                "Orexin A (Hypocretin-1)",
                "Orexin B (Hypocretin-2)",
                "Renin Substrate",
                "Sodefrin",
                "Substance P"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Angiotensin I (ANG I)",
            "Bradykinin (BK)",
            "Endothelin-1 (ET-1)",
            "Enkephalin (ENK)",
            "Glutathione (GSH)",
            "Melanocyte-stimulating hormone (\u03b1-MSH)",
            "Oxytocin (OT)",
            "Substance P (SP)",
            "Thymopoietin (TP)",
            "Vasopressin (AVP)",
            "Adrenocorticotropic hormone (ACTH)",
            "Calcitonin gene-related peptide (CGRP)",
            "Cholecystokinin (CCK)",
            "Corticotropin-releasing factor (CRF)",
            "Dynorphin A (Dyn A)",
            "Endorphin (END)",
            "Gastrin (GAS)",
            "Glucagon (GLC)",
            "Insulin (INS)",
            "Motilin (MOT)",
            "Neurotensin (NT)",
            "Parathyroid hormone (PTH)",
            "Somatostatin (SRIF)",
            "Thyrotropin-releasing hormone (TRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Angiotensin I (ANG I)",
                "Bradykinin (BK)",
                "Endothelin-1 (ET-1)",
                "Enkephalin (ENK)",
                "Glutathione (GSH)",
                "Melanocyte-stimulating hormone (\u03b1-MSH)",
                "Oxytocin (OT)",
                "Substance P (SP)",
                "Thymopoietin (TP)",
                "Vasopressin (AVP)",
                "Adrenocorticotropic hormone (ACTH)",
                "Calcitonin gene-related peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Corticotropin-releasing factor (CRF)",
                "Dynorphin A (Dyn A)",
                "Endorphin (END)",
                "Gastrin (GAS)",
                "Glucagon (GLC)",
                "Insulin (INS)",
                "Motilin (MOT)",
                "Neurotensin (NT)",
                "Parathyroid hormone (PTH)",
                "Somatostatin (SRIF)",
                "Thyrotropin-releasing hormone (TRH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenocorticotropic hormone (ACTH)",
                "Angiotensin I (ANG I)",
                "Bradykinin (BK)",
                "Calcitonin gene-related peptide (CGRP)",
                "Cholecystokinin (CCK)",
                "Corticotropin-releasing factor (CRF)",
                "Dynorphin A (Dyn A)",
                "Endorphin (END)",
                "Endothelin-1 (ET-1)",
                "Enkephalin (ENK)",
                "Gastrin (GAS)",
                "Glucagon (GLC)",
                "Glutathione (GSH)",
                "Insulin (INS)",
                "Melanocyte-stimulating hormone (\u03b1-MSH)",
                "Motilin (MOT)",
                "Neurotensin (NT)",
                "Oxytocin (OT)",
                "Parathyroid hormone (PTH)",
                "Somatostatin (SRIF)",
                "Substance P (SP)",
                "Thymopoietin (TP)",
                "Thyrotropin-releasing hormone (TRH)",
                "Vasopressin (AVP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Angiotensin II (AII) (Ang-(1-5))",
            "Bradykinin (BK)",
            "CCK-5",
            "Enkephalin (ENK)",
            "Glutathione (GSH)",
            "Gut peptide (GUT)",
            "Hepcidin (Hep)",
            "Insulin-like growth factor-5 (IGF-5)",
            "Kassinin (KSS)",
            "Leu-enkephalin (LEU-ENK)",
            "Melanostatin (MS)",
            "Melanotropin (MT)",
            "Neurokinin A (NKA)",
            "Neurokinin B (NKB)",
            "Oxytocin (OXT)",
            "Pentagastrin (PG)",
            "Pentapeptide-4 (PP-4)",
            "Pentapeptide-5 (PP-5)",
            "Pituitary adenylate cyclase-activating peptide (PACAP)",
            "Tachykinin (TK)",
            "Tachykinin-1 (TK-1)",
            "Tachykinin-2 (TK-2)",
            "Tachykinin-3 (TK-3)",
            "Tachykinin-4 (TK-4)",
            "Tachykinin-5 (TK-5)",
            "Vasopressin (AVP)",
            "Vasoactive intestinal peptide (VIP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Angiotensin II (AII) (Ang-(1-5))",
                "Bradykinin (BK)",
                "CCK-5",
                "Enkephalin (ENK)",
                "Glutathione (GSH)",
                "Gut peptide (GUT)",
                "Hepcidin (Hep)",
                "Insulin-like growth factor-5 (IGF-5)",
                "Kassinin (KSS)",
                "Leu-enkephalin (LEU-ENK)",
                "Melanostatin (MS)",
                "Melanotropin (MT)",
                "Neurokinin A (NKA)",
                "Neurokinin B (NKB)",
                "Oxytocin (OXT)",
                "Pentagastrin (PG)",
                "Pentapeptide-4 (PP-4)",
                "Pentapeptide-5 (PP-5)",
                "Pituitary adenylate cyclase-activating peptide (PACAP)",
                "Tachykinin (TK)",
                "Tachykinin-1 (TK-1)",
                "Tachykinin-2 (TK-2)",
                "Tachykinin-3 (TK-3)",
                "Tachykinin-4 (TK-4)"
            ],
            "mismatches": [
                "Tachykinin-5 (TK-5)",
                "Vasopressin (AVP)",
                "Vasoactive intestinal peptide (VIP)"
            ],
            "true_referents": [
                "Angiotensin II (AII) (Ang-(1-5))",
                "Bradykinin (BK)",
                "CCK-5",
                "Enkephalin (ENK)",
                "Glutathione (GSH)",
                "Gut peptide (GUT)",
                "Hepcidin (Hep)",
                "Insulin-like growth factor-5 (IGF-5)",
                "Kassinin (KSS)",
                "Leu-enkephalin (LEU-ENK)",
                "Melanostatin (MS)",
                "Melanotropin (MT)",
                "Neurokinin A (NKA)",
                "Neurokinin B (NKB)",
                "Oxytocin (OXT)",
                "Pentagastrin (PG)",
                "Pentapeptide-4 (PP-4)",
                "Pentapeptide-5 (PP-5)",
                "Pituitary adenylate cyclase-activating peptide (PACAP)",
                "Tachykinin (TK)",
                "Tachykinin-1 (TK-1)",
                "Tachykinin-2 (TK-2)",
                "Tachykinin-3 (TK-3)",
                "Tachykinin-4 (TK-4)"
            ],
            "TP": 24,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            "Enkephalin (YPWT)",
            "Tuftsin (TKPVY)",
            "Met-enkephalin (YPWT)",
            "Leu-enkephalin (YPWL)",
            "Vasopressin (AVP)",
            "Oxytocin (OXT)",
            "Neuropeptide Y (NPY)",
            "Neuropeptide YY (NPYY)",
            "Angiotensin II (AII)",
            "Angiotensin III (AIII)",
            "Angiotensin IV (AIV)",
            "Bradykinin (BK)",
            "Des-Arg9-bradykinin (DABK)",
            "Kallidin (KD)",
            "Methionyl-methionine (Met-Met)",
            "Glycyl-tyrosine (Gly-Tyr)",
            "Tyrosyl-glycine (Tyr-Gly)",
            "Leucyl-leucine (Leu-Leu)",
            "Isoleucyl-isoleucine (Ile-Ile)",
            "Valyl-valine (Val-Val)",
            "Alamandine (AVP-ala)",
            "Vasopressin-ala (AVP-ala)",
            "Oxytocin-ala (OXT-ala)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Enkephalin (YPWT)",
                "Tuftsin (TKPVY)",
                "Met-enkephalin (YPWT)",
                "Leu-enkephalin (YPWL)",
                "Vasopressin (AVP)",
                "Oxytocin (OXT)",
                "Neuropeptide Y (NPY)",
                "Neuropeptide YY (NPYY)",
                "Angiotensin II (AII)",
                "Angiotensin III (AIII)",
                "Angiotensin IV (AIV)",
                "Bradykinin (BK)",
                "Des-Arg9-bradykinin (DABK)",
                "Kallidin (KD)",
                "Methionyl-methionine (Met-Met)",
                "Glycyl-tyrosine (Gly-Tyr)",
                "Tyrosyl-glycine (Tyr-Gly)",
                "Leucyl-leucine (Leu-Leu)",
                "Isoleucyl-isoleucine (Ile-Ile)",
                "Valyl-valine (Val-Val)",
                "Alamandine (AVP-ala)",
                "Vasopressin-ala (AVP-ala)",
                "Oxytocin-ala (OXT-ala)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alamandine (AVP-ala)",
                "Angiotensin II (AII)",
                "Angiotensin III (AIII)",
                "Angiotensin IV (AIV)",
                "Bradykinin (BK)",
                "Des-Arg9-bradykinin (DABK)",
                "Enkephalin (YPWT)",
                "Glycyl-tyrosine (Gly-Tyr)",
                "Isoleucyl-isoleucine (Ile-Ile)",
                "Kallidin (KD)",
                "Leu-enkephalin (YPWL)",
                "Leucyl-leucine (Leu-Leu)",
                "Met-enkephalin (YPWT)",
                "Methionyl-methionine (Met-Met)",
                "Neuropeptide Y (NPY)",
                "Neuropeptide YY (NPYY)",
                "Oxytocin (OXT)",
                "Oxytocin-ala (OXT-ala)",
                "Tuftsin (TKPVY)",
                "Tyrosyl-glycine (Tyr-Gly)",
                "Valyl-valine (Val-Val)",
                "Vasopressin (AVP)",
                "Vasopressin-ala (AVP-ala)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "pentapeptide",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Pentapeptide",
                "Canonical Name": "Pentapeptide"
            },
            {
                "Referent": "Pentapeptide antibiotic",
                "Canonical Name": "Pentapeptide antibiotic"
            },
            {
                "Referent": "Pentapeptide hormone",
                "Canonical Name": "Pentapeptide hormone"
            },
            {
                "Referent": "Pentapeptide toxin",
                "Canonical Name": "Pentapeptide toxin"
            },
            {
                "Referent": "Pentapeptide receptor",
                "Canonical Name": "Pentapeptide receptor"
            },
            {
                "Referent": "Pentapeptide library",
                "Canonical Name": "Pentapeptide library"
            },
            {
                "Referent": "Pentapeptide vaccine",
                "Canonical Name": "Pentapeptide vaccine"
            },
            {
                "Referent": "Pentapeptide synthesis",
                "Canonical Name": "Pentapeptide synthesis"
            },
            {
                "Referent": "Pentapeptide library synthesis",
                "Canonical Name": "Pentapeptide library synthesis"
            },
            {
                "Referent": "Pentapeptide library screening",
                "Canonical Name": "Pentapeptide library screening"
            },
            {
                "Referent": "Pentapeptide library binding assay",
                "Canonical Name": "Pentapeptide library binding assay"
            },
            {
                "Referent": "Pentapeptide library affinity maturation",
                "Canonical Name": "Pentapeptide library affinity maturation"
            },
            {
                "Referent": "Pentapeptide library display",
                "Canonical Name": "Pentapeptide library display"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display",
                "Canonical Name": "Pentapeptide library affinity maturation display"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            },
            {
                "Referent": "Pentapeptide library affinity maturation display screening",
                "Canonical Name": "Pentapeptide library affinity maturation display screening"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Pentapeptide",
                "Pentapeptide antibiotic",
                "Pentapeptide hormone",
                "Pentapeptide toxin",
                "Pentapeptide receptor",
                "Pentapeptide library",
                "Pentapeptide vaccine",
                "Pentapeptide synthesis",
                "Pentapeptide library synthesis",
                "Pentapeptide library screening",
                "Pentapeptide library binding assay",
                "Pentapeptide library affinity maturation",
                "Pentapeptide library display",
                "Pentapeptide library affinity maturation display",
                "Pentapeptide library affinity maturation display screening"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Pentapeptide antibiotic\", \"Canonical Name\": \"Pentapeptide antibiotic\"}",
                "{\"Referent\": \"Pentapeptide hormone\", \"Canonical Name\": \"Pentapeptide hormone\"}",
                "{\"Referent\": \"Pentapeptide library affinity maturation display screening\", \"Canonical Name\": \"Pentapeptide library affinity maturation display screening\"}",
                "{\"Referent\": \"Pentapeptide library affinity maturation display\", \"Canonical Name\": \"Pentapeptide library affinity maturation display\"}",
                "{\"Referent\": \"Pentapeptide library affinity maturation\", \"Canonical Name\": \"Pentapeptide library affinity maturation\"}",
                "{\"Referent\": \"Pentapeptide library binding assay\", \"Canonical Name\": \"Pentapeptide library binding assay\"}",
                "{\"Referent\": \"Pentapeptide library display\", \"Canonical Name\": \"Pentapeptide library display\"}",
                "{\"Referent\": \"Pentapeptide library screening\", \"Canonical Name\": \"Pentapeptide library screening\"}",
                "{\"Referent\": \"Pentapeptide library synthesis\", \"Canonical Name\": \"Pentapeptide library synthesis\"}",
                "{\"Referent\": \"Pentapeptide library\", \"Canonical Name\": \"Pentapeptide library\"}",
                "{\"Referent\": \"Pentapeptide receptor\", \"Canonical Name\": \"Pentapeptide receptor\"}",
                "{\"Referent\": \"Pentapeptide synthesis\", \"Canonical Name\": \"Pentapeptide synthesis\"}",
                "{\"Referent\": \"Pentapeptide toxin\", \"Canonical Name\": \"Pentapeptide toxin\"}",
                "{\"Referent\": \"Pentapeptide vaccine\", \"Canonical Name\": \"Pentapeptide vaccine\"}",
                "{\"Referent\": \"Pentapeptide\", \"Canonical Name\": \"Pentapeptide\"}"
            ],
            "TP": 15,
            "FP": 0,
            "FN": 0
        }
    }
]