[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-Cadherin (CDH1)",
            "N-Cadherin (CDH2)",
            "P-Cadherin (CDH3)",
            "Desmoglein 1 (DSG1)",
            "Desmoglein 2 (DSG2)",
            "Desmoglein 3 (DSG3)",
            "Desmoglein 4 (DSG4)",
            "Desmocollin 1 (DSC1)",
            "Desmocollin 2 (DSC2)",
            "Desmocollin 3 (DSC3)",
            "Integrin alpha 1 (ITGA1)",
            "Integrin beta 1 (ITGB1)",
            "Integrin alpha 5 (ITGA5)",
            "Integrin beta 3 (ITGB3)",
            "Integrin alpha 6 (ITGA6)",
            "Integrin beta 4 (ITGB4)",
            "L1 Cell Adhesion Molecule (L1CAM)",
            "N-CAM (NCAM1)",
            "P-CAM (PCAM)",
            "Selectin E (SELE)",
            "Selectin L (SELL)",
            "Selectin P (SELP)",
            "CD44 (CD44)",
            "Vascular Endothelial Cadherin (VE-Cadherin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-Cadherin (CDH1)",
                "N-Cadherin (CDH2)",
                "P-Cadherin (CDH3)",
                "Desmoglein 1 (DSG1)",
                "Desmoglein 2 (DSG2)",
                "Desmoglein 3 (DSG3)",
                "Desmoglein 4 (DSG4)",
                "Desmocollin 1 (DSC1)",
                "Desmocollin 2 (DSC2)",
                "Desmocollin 3 (DSC3)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin beta 1 (ITGB1)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin beta 3 (ITGB3)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin beta 4 (ITGB4)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "N-CAM (NCAM1)",
                "P-CAM (PCAM)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "CD44 (CD44)",
                "Vascular Endothelial Cadherin (VE-Cadherin)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD44 (CD44)",
                "Desmocollin 1 (DSC1)",
                "Desmocollin 2 (DSC2)",
                "Desmocollin 3 (DSC3)",
                "Desmoglein 1 (DSG1)",
                "Desmoglein 2 (DSG2)",
                "Desmoglein 3 (DSG3)",
                "Desmoglein 4 (DSG4)",
                "E-Cadherin (CDH1)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin beta 1 (ITGB1)",
                "Integrin beta 3 (ITGB3)",
                "Integrin beta 4 (ITGB4)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "N-CAM (NCAM1)",
                "N-Cadherin (CDH2)",
                "P-CAM (PCAM)",
                "P-Cadherin (CDH3)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Vascular Endothelial Cadherin (VE-Cadherin)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Intercellular Adhesion Molecule 1 (ICAM-1)",
            "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
            "E-Selectin",
            "P-Selectin",
            "L-Selectin",
            "N-Cadherin",
            "E-Cadherin",
            "M-Cadherin (Cadherin-3)",
            "Cadherin-6",
            "Cadherin-7",
            "Cadherin-8",
            "Cadherin-9",
            "Cadherin-10",
            "Cadherin-11",
            "Cadherin-12",
            "Cadherin-13",
            "Cadherin-14",
            "Cadherin-15",
            "Cadherin-16",
            "Cadherin-17",
            "Cadherin-18",
            "Cadherin-19",
            "Cadherin-20",
            "Cadherin-21"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
                "E-Selectin",
                "P-Selectin",
                "L-Selectin",
                "N-Cadherin",
                "E-Cadherin",
                "M-Cadherin (Cadherin-3)",
                "Cadherin-6",
                "Cadherin-7",
                "Cadherin-8",
                "Cadherin-9",
                "Cadherin-10",
                "Cadherin-11",
                "Cadherin-12",
                "Cadherin-13",
                "Cadherin-14",
                "Cadherin-15",
                "Cadherin-16",
                "Cadherin-17",
                "Cadherin-18",
                "Cadherin-19",
                "Cadherin-20",
                "Cadherin-21"
            ],
            "mismatches": [],
            "true_referents": [
                "Cadherin-10",
                "Cadherin-11",
                "Cadherin-12",
                "Cadherin-13",
                "Cadherin-14",
                "Cadherin-15",
                "Cadherin-16",
                "Cadherin-17",
                "Cadherin-18",
                "Cadherin-19",
                "Cadherin-20",
                "Cadherin-21",
                "Cadherin-6",
                "Cadherin-7",
                "Cadherin-8",
                "Cadherin-9",
                "E-Cadherin",
                "E-Selectin",
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "L-Selectin",
                "M-Cadherin (Cadherin-3)",
                "N-Cadherin",
                "P-Selectin",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Integrin alpha 1 (ITGA1)",
            "Integrin alpha 2 (ITGA2)",
            "Integrin alpha 3 (ITGA3)",
            "Integrin alpha 4 (ITGA4)",
            "Integrin alpha 5 (ITGA5)",
            "Integrin alpha 6 (ITGA6)",
            "Integrin alpha 7 (ITGA7)",
            "Integrin alpha 8 (ITGA8)",
            "Integrin alpha L (ITGAL)",
            "Integrin alpha M (ITGAM)",
            "Integrin alpha X (ITGAX)",
            "Integrin alpha V (ITGAV)",
            "Integrin alpha D (ITGAD)",
            "Integrin alpha 9 (ITGA9)",
            "Integrin alpha 10 (ITGA10)",
            "Integrin alpha 11 (ITGA11)",
            "Cadherin-1 (CDH1)",
            "Cadherin-2 (CDH2)",
            "Cadherin-3 (CDH3)",
            "Selectin E (SELE)",
            "Selectin L (SELL)",
            "Selectin P (SELP)",
            "Immunoglobulin superfamily member 1 (IGSF1)",
            "N-CAM (NCAM1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 2 (ITGA2)",
                "Integrin alpha 3 (ITGA3)",
                "Integrin alpha 4 (ITGA4)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin alpha 7 (ITGA7)",
                "Integrin alpha 8 (ITGA8)",
                "Integrin alpha L (ITGAL)",
                "Integrin alpha M (ITGAM)",
                "Integrin alpha X (ITGAX)",
                "Integrin alpha V (ITGAV)",
                "Integrin alpha D (ITGAD)",
                "Integrin alpha 9 (ITGA9)",
                "Integrin alpha 10 (ITGA10)",
                "Integrin alpha 11 (ITGA11)",
                "Cadherin-1 (CDH1)",
                "Cadherin-2 (CDH2)",
                "Cadherin-3 (CDH3)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Immunoglobulin superfamily member 1 (IGSF1)",
                "N-CAM (NCAM1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cadherin-1 (CDH1)",
                "Cadherin-2 (CDH2)",
                "Cadherin-3 (CDH3)",
                "Immunoglobulin superfamily member 1 (IGSF1)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 10 (ITGA10)",
                "Integrin alpha 11 (ITGA11)",
                "Integrin alpha 2 (ITGA2)",
                "Integrin alpha 3 (ITGA3)",
                "Integrin alpha 4 (ITGA4)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin alpha 7 (ITGA7)",
                "Integrin alpha 8 (ITGA8)",
                "Integrin alpha 9 (ITGA9)",
                "Integrin alpha D (ITGAD)",
                "Integrin alpha L (ITGAL)",
                "Integrin alpha M (ITGAM)",
                "Integrin alpha V (ITGAV)",
                "Integrin alpha X (ITGAX)",
                "N-CAM (NCAM1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin-1 (CDH1)",
            "E-Cadherin (CDH1)",
            "N-Cadherin (CDH2)",
            "P-Cadherin (CDH3)",
            "VE-Cadherin (CDH5)",
            "Integrin alphaVbeta3 (ITGAV/ITGB3)",
            "L-Selectin (CD62L)",
            "E-Selectin (CD62E)",
            "P-Selectin (CD62P)",
            "ICAM-1 (CD54)",
            "ICAM-2 (CD54)",
            "VCAM-1 (CD106)",
            "Syndecan-1 (SDC1)",
            "NCAM (CD56)",
            "LFA-1 (CD11a/CD18)",
            "MAC-1 (CD11b/CD18)",
            "CD44",
            "EpCAM (CD326)",
            "Desmoglein-1 (DSG1)",
            "Desmocollin-1 (DSC1)",
            "Claudin-1 (CLDN1)",
            "Occludin (OCLN)",
            "Immunoglobulin superfamily cell adhesion molecule 1 (ICOSL)",
            "Neural Cell Adhesion Molecule L1 (NCAML1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin-1 (CDH1)",
                "E-Cadherin (CDH1)",
                "N-Cadherin (CDH2)",
                "P-Cadherin (CDH3)",
                "VE-Cadherin (CDH5)",
                "Integrin alphaVbeta3 (ITGAV/ITGB3)",
                "L-Selectin (CD62L)",
                "E-Selectin (CD62E)",
                "P-Selectin (CD62P)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD54)",
                "VCAM-1 (CD106)",
                "Syndecan-1 (SDC1)",
                "NCAM (CD56)",
                "LFA-1 (CD11a/CD18)",
                "MAC-1 (CD11b/CD18)",
                "CD44",
                "EpCAM (CD326)",
                "Desmoglein-1 (DSG1)",
                "Desmocollin-1 (DSC1)",
                "Claudin-1 (CLDN1)",
                "Occludin (OCLN)",
                "Immunoglobulin superfamily cell adhesion molecule 1 (ICOSL)",
                "Neural Cell Adhesion Molecule L1 (NCAML1)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD44",
                "Cadherin-1 (CDH1)",
                "Claudin-1 (CLDN1)",
                "Desmocollin-1 (DSC1)",
                "Desmoglein-1 (DSG1)",
                "E-Cadherin (CDH1)",
                "E-Selectin (CD62E)",
                "EpCAM (CD326)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD54)",
                "Immunoglobulin superfamily cell adhesion molecule 1 (ICOSL)",
                "Integrin alphaVbeta3 (ITGAV/ITGB3)",
                "L-Selectin (CD62L)",
                "LFA-1 (CD11a/CD18)",
                "MAC-1 (CD11b/CD18)",
                "N-Cadherin (CDH2)",
                "NCAM (CD56)",
                "Neural Cell Adhesion Molecule L1 (NCAML1)",
                "Occludin (OCLN)",
                "P-Cadherin (CDH3)",
                "P-Selectin (CD62P)",
                "Syndecan-1 (SDC1)",
                "VCAM-1 (CD106)",
                "VE-Cadherin (CDH5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin-1 (CDH1)",
            "Cadherin-2 (CDH2)",
            "Integrin alpha-1 (ITGA1)",
            "Integrin beta-1 (ITGB1)",
            "Intercellular Adhesion Molecule 1 (ICAM1)",
            "Intercellular Adhesion Molecule 2 (ICAM2)",
            "Vascular Cell Adhesion Molecule 1 (VCAM1)",
            "Neural Cell Adhesion Molecule 1 (NCAM1)",
            "Selectin E (SELE)",
            "Selectin L (SELL)",
            "Selectin P (SELP)",
            "Platelet Endothelial Cell Adhesion Molecule (PECAM1)",
            "L1 Cell Adhesion Molecule (L1CAM)",
            "Cadherin-3 (CDH3)",
            "Cadherin-4 (CDH4)",
            "Integrin alpha-2 (ITGA2)",
            "Integrin beta-2 (ITGB2)",
            "Neural Cell Adhesion Molecule 2 (NCAM2)",
            "Desmoglein 1 (DSG1)",
            "Desmoglein 2 (DSG2)",
            "Desmocollin 1 (DSC1)",
            "Desmocollin 2 (DSC2)",
            "Junctional Adhesion Molecule A (JAM-A)",
            "Junctional Adhesion Molecule B (JAM-B)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin-1 (CDH1)",
                "Cadherin-2 (CDH2)",
                "Integrin alpha-1 (ITGA1)",
                "Integrin beta-1 (ITGB1)",
                "Intercellular Adhesion Molecule 1 (ICAM1)",
                "Intercellular Adhesion Molecule 2 (ICAM2)",
                "Vascular Cell Adhesion Molecule 1 (VCAM1)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM1)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "Cadherin-3 (CDH3)",
                "Cadherin-4 (CDH4)",
                "Integrin alpha-2 (ITGA2)",
                "Integrin beta-2 (ITGB2)",
                "Neural Cell Adhesion Molecule 2 (NCAM2)",
                "Desmoglein 1 (DSG1)",
                "Desmoglein 2 (DSG2)",
                "Desmocollin 1 (DSC1)",
                "Desmocollin 2 (DSC2)",
                "Junctional Adhesion Molecule A (JAM-A)",
                "Junctional Adhesion Molecule B (JAM-B)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cadherin-1 (CDH1)",
                "Cadherin-2 (CDH2)",
                "Cadherin-3 (CDH3)",
                "Cadherin-4 (CDH4)",
                "Desmocollin 1 (DSC1)",
                "Desmocollin 2 (DSC2)",
                "Desmoglein 1 (DSG1)",
                "Desmoglein 2 (DSG2)",
                "Integrin alpha-1 (ITGA1)",
                "Integrin alpha-2 (ITGA2)",
                "Integrin beta-1 (ITGB1)",
                "Integrin beta-2 (ITGB2)",
                "Intercellular Adhesion Molecule 1 (ICAM1)",
                "Intercellular Adhesion Molecule 2 (ICAM2)",
                "Junctional Adhesion Molecule A (JAM-A)",
                "Junctional Adhesion Molecule B (JAM-B)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Neural Cell Adhesion Molecule 2 (NCAM2)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Vascular Cell Adhesion Molecule 1 (VCAM1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH)",
            "Integrin (ITG)",
            "Selectin (SEL)",
            "Immunoglobulin superfamily (IgSF)",
            "N-Cadherin (CDH2)",
            "E-Cadherin (CDH1)",
            "P-Cadherin (CDH3)",
            "Vascular Cell Adhesion Molecule 1 (VCAM1)",
            "Intercellular Adhesion Molecule 1 (ICAM1)",
            "Focal Adhesion Kinase (FAK)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "L1 Cell Adhesion Molecule (L1CAM)",
            "Platelet Endothelial Cell Adhesion Molecule (PECAM1)",
            "Mucosal Addressin Cell Adhesion Molecule 1 (MAdCAM1)",
            "CD44 (CD44)",
            "Integrin Alpha V (ITGAV)",
            "Integrin Beta 1 (ITGB1)",
            "Integrin Beta 2 (ITGB2)",
            "Integrin Alpha 4 (ITGA4)",
            "Integrin Alpha 6 (ITGA6)",
            "Syndecan (SDC)",
            "Desmoglein (DSG)",
            "Desmocollin (DSC)",
            "Neurofascin (NF)",
            "Contactin (CNTN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH)",
                "Integrin (ITG)",
                "Selectin (SEL)",
                "Immunoglobulin superfamily (IgSF)",
                "N-Cadherin (CDH2)",
                "E-Cadherin (CDH1)",
                "P-Cadherin (CDH3)",
                "Vascular Cell Adhesion Molecule 1 (VCAM1)",
                "Intercellular Adhesion Molecule 1 (ICAM1)",
                "Focal Adhesion Kinase (FAK)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM1)",
                "Mucosal Addressin Cell Adhesion Molecule 1 (MAdCAM1)",
                "CD44 (CD44)",
                "Integrin Alpha V (ITGAV)",
                "Integrin Beta 1 (ITGB1)",
                "Integrin Beta 2 (ITGB2)",
                "Integrin Alpha 4 (ITGA4)",
                "Integrin Alpha 6 (ITGA6)",
                "Syndecan (SDC)",
                "Desmoglein (DSG)",
                "Desmocollin (DSC)",
                "Neurofascin (NF)"
            ],
            "mismatches": [
                "Contactin (CNTN)"
            ],
            "true_referents": [
                "CD44 (CD44)",
                "Cadherin (CDH)",
                "Desmocollin (DSC)",
                "Desmoglein (DSG)",
                "E-Cadherin (CDH1)",
                "Focal Adhesion Kinase (FAK)",
                "Immunoglobulin superfamily (IgSF)",
                "Integrin (ITG)",
                "Integrin Alpha 4 (ITGA4)",
                "Integrin Alpha 6 (ITGA6)",
                "Integrin Alpha V (ITGAV)",
                "Integrin Beta 1 (ITGB1)",
                "Integrin Beta 2 (ITGB2)",
                "Intercellular Adhesion Molecule 1 (ICAM1)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "Mucosal Addressin Cell Adhesion Molecule 1 (MAdCAM1)",
                "N-Cadherin (CDH2)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neurofascin (NF)",
                "P-Cadherin (CDH3)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM1)",
                "Selectin (SEL)",
                "Syndecan (SDC)",
                "Vascular Cell Adhesion Molecule 1 (VCAM1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Integrin alpha-4 (ITGA4)",
            "Integrin alpha-L (ITGAL)",
            "Integrin alpha-M (ITGAM)",
            "Integrin alpha-X (ITGAX)",
            "Integrin beta-2 (ITGB2)",
            "Intercellular Adhesion Molecule 1 (ICAM-1)",
            "Intercellular Adhesion Molecule 2 (ICAM-2)",
            "Intercellular Adhesion Molecule 3 (ICAM-3)",
            "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
            "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "Neural Cell Adhesion Molecule 2 (NCAM2)",
            "Melanoma Cell Adhesion Molecule (MCAM)",
            "Leukocyte-endothelial Cell Adhesion Molecule 1 (LECAM-1)",
            "Epithelial Cell Adhesion Molecule (EpCAM)",
            "Selectin E (SELE)",
            "Selectin L (SELL)",
            "Selectin P (SELP)",
            "Cadherin 1 (CDH1)",
            "Cadherin 2 (CDH2)",
            "Cadherin 3 (CDH3)",
            "Nectin Cell Adhesion Molecule 1 (NECTIN1)",
            "Nectin Cell Adhesion Molecule 2 (NECTIN2)",
            "Nectin Cell Adhesion Molecule 3 (NECTIN3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Integrin alpha-4 (ITGA4)",
                "Integrin alpha-L (ITGAL)",
                "Integrin alpha-M (ITGAM)",
                "Integrin alpha-X (ITGAX)",
                "Integrin beta-2 (ITGB2)",
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "Intercellular Adhesion Molecule 2 (ICAM-2)",
                "Intercellular Adhesion Molecule 3 (ICAM-3)",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neural Cell Adhesion Molecule 2 (NCAM2)",
                "Melanoma Cell Adhesion Molecule (MCAM)",
                "Leukocyte-endothelial Cell Adhesion Molecule 1 (LECAM-1)",
                "Epithelial Cell Adhesion Molecule (EpCAM)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Cadherin 1 (CDH1)",
                "Cadherin 2 (CDH2)",
                "Cadherin 3 (CDH3)",
                "Nectin Cell Adhesion Molecule 1 (NECTIN1)",
                "Nectin Cell Adhesion Molecule 2 (NECTIN2)",
                "Nectin Cell Adhesion Molecule 3 (NECTIN3)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cadherin 1 (CDH1)",
                "Cadherin 2 (CDH2)",
                "Cadherin 3 (CDH3)",
                "Epithelial Cell Adhesion Molecule (EpCAM)",
                "Integrin alpha-4 (ITGA4)",
                "Integrin alpha-L (ITGAL)",
                "Integrin alpha-M (ITGAM)",
                "Integrin alpha-X (ITGAX)",
                "Integrin beta-2 (ITGB2)",
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "Intercellular Adhesion Molecule 2 (ICAM-2)",
                "Intercellular Adhesion Molecule 3 (ICAM-3)",
                "Leukocyte-endothelial Cell Adhesion Molecule 1 (LECAM-1)",
                "Melanoma Cell Adhesion Molecule (MCAM)",
                "Nectin Cell Adhesion Molecule 1 (NECTIN1)",
                "Nectin Cell Adhesion Molecule 2 (NECTIN2)",
                "Nectin Cell Adhesion Molecule 3 (NECTIN3)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neural Cell Adhesion Molecule 2 (NCAM2)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Integrin (ITG)",
            "Cadherin (CDH)",
            "Selectin",
            "Ig-superfamily cell adhesion molecule (IgCAM)",
            "N-CAM (Neural cell adhesion molecule)",
            "L1CAM (L1 cell adhesion molecule)",
            "VCAM-1 (Vascular cell adhesion molecule 1)",
            "PECAM-1 (Platelet endothelial cell adhesion molecule 1)",
            "JAM (Junctional adhesion molecule)",
            "ICAM (Intercellular adhesion molecule)",
            "CD44 (Cluster of differentiation 44)",
            "NCAM (Neural cell adhesion molecule)",
            "E-cadherin (Epithelial cadherin)",
            "P-selectin (Platelet-selectin)",
            "L-selectin (Leukocyte-selectin)",
            "VE-cadherin (Vascular endothelial cadherin)",
            "MUC1 (Mucin 1)",
            "CD166 (Cluster of differentiation 166)",
            "CDH5 (Cadherin 5)",
            "CDH2 (Cadherin 2)",
            "CDH1 (Cadherin 1)",
            "CDH3 (Cadherin 3)",
            "CDH4 (Cadherin 4)",
            "CDH6 (Cadherin 6)",
            "CDH7 (Cadherin 7)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Integrin (ITG)",
                "Cadherin (CDH)",
                "Selectin",
                "Ig-superfamily cell adhesion molecule (IgCAM)",
                "N-CAM (Neural cell adhesion molecule)",
                "L1CAM (L1 cell adhesion molecule)",
                "VCAM-1 (Vascular cell adhesion molecule 1)",
                "PECAM-1 (Platelet endothelial cell adhesion molecule 1)",
                "JAM (Junctional adhesion molecule)",
                "ICAM (Intercellular adhesion molecule)",
                "CD44 (Cluster of differentiation 44)",
                "NCAM (Neural cell adhesion molecule)",
                "E-cadherin (Epithelial cadherin)",
                "P-selectin (Platelet-selectin)",
                "L-selectin (Leukocyte-selectin)",
                "VE-cadherin (Vascular endothelial cadherin)",
                "MUC1 (Mucin 1)",
                "CD166 (Cluster of differentiation 166)",
                "CDH5 (Cadherin 5)",
                "CDH2 (Cadherin 2)",
                "CDH1 (Cadherin 1)",
                "CDH3 (Cadherin 3)",
                "CDH4 (Cadherin 4)",
                "CDH6 (Cadherin 6)"
            ],
            "mismatches": [
                "CDH7 (Cadherin 7)"
            ],
            "true_referents": [
                "CD166 (Cluster of differentiation 166)",
                "CD44 (Cluster of differentiation 44)",
                "CDH1 (Cadherin 1)",
                "CDH2 (Cadherin 2)",
                "CDH3 (Cadherin 3)",
                "CDH4 (Cadherin 4)",
                "CDH5 (Cadherin 5)",
                "CDH6 (Cadherin 6)",
                "Cadherin (CDH)",
                "E-cadherin (Epithelial cadherin)",
                "ICAM (Intercellular adhesion molecule)",
                "Ig-superfamily cell adhesion molecule (IgCAM)",
                "Integrin (ITG)",
                "JAM (Junctional adhesion molecule)",
                "L-selectin (Leukocyte-selectin)",
                "L1CAM (L1 cell adhesion molecule)",
                "MUC1 (Mucin 1)",
                "N-CAM (Neural cell adhesion molecule)",
                "NCAM (Neural cell adhesion molecule)",
                "P-selectin (Platelet-selectin)",
                "PECAM-1 (Platelet endothelial cell adhesion molecule 1)",
                "Selectin",
                "VCAM-1 (Vascular cell adhesion molecule 1)",
                "VE-cadherin (Vascular endothelial cadherin)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-cadherin (CDH1)",
            "N-cadherin (CDH2)",
            "P-cadherin (CDH3)",
            "VE-cadherin (CDH5)",
            "Integrin \u03b15\u03b21",
            "Integrin \u03b1V\u03b23",
            "NCAM1 (Neural Cell Adhesion Molecule 1)",
            "ICAM1 (Intercellular Adhesion Molecule 1)",
            "VCAM1 (Vascular Cell Adhesion Molecule 1)",
            "L1CAM (L1 Cell Adhesion Molecule)",
            "E-selectin",
            "P-selectin",
            "L-selectin",
            "JAM-A (Junctional Adhesion Molecule A)",
            "JAM-B (Junctional Adhesion Molecule B)",
            "JAM-C (Junctional Adhesion Molecule C)",
            "Claudin-1",
            "Claudin-5",
            "Connexin 43 (Cx43)",
            "MUC1 (Mucin 1)",
            "R-cadherin (CDH4)",
            "CD44",
            "CADM1 (Cell Adhesion Molecule 1)",
            "Neurexin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-cadherin (CDH1)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "VE-cadherin (CDH5)",
                "Integrin \u03b15\u03b21",
                "Integrin \u03b1V\u03b23",
                "NCAM1 (Neural Cell Adhesion Molecule 1)",
                "ICAM1 (Intercellular Adhesion Molecule 1)",
                "VCAM1 (Vascular Cell Adhesion Molecule 1)",
                "L1CAM (L1 Cell Adhesion Molecule)",
                "E-selectin",
                "P-selectin",
                "L-selectin",
                "JAM-A (Junctional Adhesion Molecule A)",
                "JAM-B (Junctional Adhesion Molecule B)",
                "JAM-C (Junctional Adhesion Molecule C)",
                "Claudin-1",
                "Claudin-5",
                "Connexin 43 (Cx43)",
                "MUC1 (Mucin 1)",
                "R-cadherin (CDH4)",
                "CD44",
                "CADM1 (Cell Adhesion Molecule 1)",
                "Neurexin"
            ],
            "mismatches": [],
            "true_referents": [
                "CADM1 (Cell Adhesion Molecule 1)",
                "CD44",
                "Claudin-1",
                "Claudin-5",
                "Connexin 43 (Cx43)",
                "E-cadherin (CDH1)",
                "E-selectin",
                "ICAM1 (Intercellular Adhesion Molecule 1)",
                "Integrin \u03b15\u03b21",
                "Integrin \u03b1V\u03b23",
                "JAM-A (Junctional Adhesion Molecule A)",
                "JAM-B (Junctional Adhesion Molecule B)",
                "JAM-C (Junctional Adhesion Molecule C)",
                "L-selectin",
                "L1CAM (L1 Cell Adhesion Molecule)",
                "MUC1 (Mucin 1)",
                "N-cadherin (CDH2)",
                "NCAM1 (Neural Cell Adhesion Molecule 1)",
                "Neurexin",
                "P-cadherin (CDH3)",
                "P-selectin",
                "R-cadherin (CDH4)",
                "VCAM1 (Vascular Cell Adhesion Molecule 1)",
                "VE-cadherin (CDH5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-cadherin (CDH1)",
            "N-cadherin (CDH2)",
            "P-cadherin (CDH3)",
            "Vascular Endothelial Cadherin (VE-cadherin, CDH5)",
            "Epithelial Cell Adhesion Molecule (EpCAM)",
            "Intercellular Adhesion Molecule 1 (ICAM-1)",
            "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
            "Lymphocyte Function-associated Antigen 1 (LFA-1)",
            "Very Late Antigen 4 (VLA-4)",
            "Integrin \u03b15\u03b21",
            "Integrin \u03b1v\u03b23",
            "Selectin E (SELE)",
            "Selectin P (SELP)",
            "Selectin L (SELL)",
            "Junctional Adhesion Molecule A (JAM-A)",
            "Claudin-1",
            "Occludin",
            "Desmoglein-1",
            "Desmocollin-2",
            "Nectin-1",
            "CD44",
            "Syndecan-1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-cadherin (CDH1)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "Vascular Endothelial Cadherin (VE-cadherin, CDH5)",
                "Epithelial Cell Adhesion Molecule (EpCAM)",
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Lymphocyte Function-associated Antigen 1 (LFA-1)",
                "Very Late Antigen 4 (VLA-4)",
                "Integrin \u03b15\u03b21",
                "Integrin \u03b1v\u03b23",
                "Selectin E (SELE)",
                "Selectin P (SELP)",
                "Selectin L (SELL)",
                "Junctional Adhesion Molecule A (JAM-A)",
                "Claudin-1",
                "Occludin",
                "Desmoglein-1",
                "Desmocollin-2",
                "Nectin-1",
                "CD44",
                "Syndecan-1"
            ],
            "mismatches": [],
            "true_referents": [
                "CD44",
                "Claudin-1",
                "Desmocollin-2",
                "Desmoglein-1",
                "E-cadherin (CDH1)",
                "Epithelial Cell Adhesion Molecule (EpCAM)",
                "Integrin \u03b15\u03b21",
                "Integrin \u03b1v\u03b23",
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "Junctional Adhesion Molecule A (JAM-A)",
                "Lymphocyte Function-associated Antigen 1 (LFA-1)",
                "N-cadherin (CDH2)",
                "Nectin-1",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Occludin",
                "P-cadherin (CDH3)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Syndecan-1",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
                "Vascular Endothelial Cadherin (VE-cadherin, CDH5)",
                "Very Late Antigen 4 (VLA-4)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Neural cell adhesion molecule 1 (NCAM1)",
            "Intercellular adhesion molecule 1 (ICAM1)",
            "Vascular cell adhesion molecule 1 (VCAM1)",
            "Platelet endothelial cell adhesion molecule (PECAM1)",
            "Epithelial cell adhesion molecule (EPCAM)",
            "Cadherin 1 (CDH1)",
            "Cadherin 2 (CDH2)",
            "Cadherin 5 (CDH5)",
            "Integrin alpha 1 (ITGA1)",
            "Integrin alpha 2 (ITGA2)",
            "Integrin alpha 4 (ITGA4)",
            "Integrin alpha 5 (ITGA5)",
            "Integrin alpha 6 (ITGA6)",
            "Integrin alpha V (ITGAV)",
            "Integrin beta 1 (ITGB1)",
            "Integrin beta 2 (ITGB2)",
            "Integrin beta 3 (ITGB3)",
            "Integrin beta 4 (ITGB4)",
            "Selectin L (SELL)",
            "Selectin E (SELE)",
            "Selectin P (SELP)",
            "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
            "Activated leukocyte cell adhesion molecule (ALCAM)",
            "Junctional adhesion molecule A (F11R)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neural cell adhesion molecule 1 (NCAM1)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Vascular cell adhesion molecule 1 (VCAM1)",
                "Platelet endothelial cell adhesion molecule (PECAM1)",
                "Epithelial cell adhesion molecule (EPCAM)",
                "Cadherin 1 (CDH1)",
                "Cadherin 2 (CDH2)",
                "Cadherin 5 (CDH5)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 2 (ITGA2)",
                "Integrin alpha 4 (ITGA4)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin alpha V (ITGAV)",
                "Integrin beta 1 (ITGB1)",
                "Integrin beta 2 (ITGB2)",
                "Integrin beta 3 (ITGB3)",
                "Integrin beta 4 (ITGB4)",
                "Selectin L (SELL)",
                "Selectin E (SELE)",
                "Selectin P (SELP)",
                "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "Junctional adhesion molecule A (F11R)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "Cadherin 1 (CDH1)",
                "Cadherin 2 (CDH2)",
                "Cadherin 5 (CDH5)",
                "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
                "Epithelial cell adhesion molecule (EPCAM)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 2 (ITGA2)",
                "Integrin alpha 4 (ITGA4)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin alpha V (ITGAV)",
                "Integrin beta 1 (ITGB1)",
                "Integrin beta 2 (ITGB2)",
                "Integrin beta 3 (ITGB3)",
                "Integrin beta 4 (ITGB4)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Junctional adhesion molecule A (F11R)",
                "Neural cell adhesion molecule 1 (NCAM1)",
                "Platelet endothelial cell adhesion molecule (PECAM1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Vascular cell adhesion molecule 1 (VCAM1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH)",
            "Integrin (ITG)",
            "Selectin (SELE)",
            "Immunoglobulin superfamily (IgSF)",
            "Mucin (MUC)",
            "Hyaluronic acid (HA)",
            "Fibronectin (FN)",
            "Laminin (LAMA)",
            "Collagen (COL)",
            "Vitronectin (VTN)",
            "Osteopontin (OPN)",
            "Thrombospondin (THBS)",
            "Syndecan (SDC)",
            "Glypican (GPC)",
            "Neuropilin (NRP)",
            "Semaphorin (SEMA)",
            "Ephrin (EFN)",
            "Nectin (NECTIN)",
            "Junctional Adhesion Molecule (JAM)",
            "Vascular Endothelial Cadherin (VE-Cadherin)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
            "Intercellular Adhesion Molecule (ICAM)",
            "Vascular Cell Adhesion Molecule (VCAM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH)",
                "Integrin (ITG)",
                "Selectin (SELE)",
                "Immunoglobulin superfamily (IgSF)",
                "Mucin (MUC)",
                "Hyaluronic acid (HA)",
                "Fibronectin (FN)",
                "Laminin (LAMA)",
                "Collagen (COL)",
                "Vitronectin (VTN)",
                "Osteopontin (OPN)",
                "Thrombospondin (THBS)",
                "Syndecan (SDC)",
                "Glypican (GPC)",
                "Neuropilin (NRP)",
                "Semaphorin (SEMA)",
                "Ephrin (EFN)",
                "Nectin (NECTIN)",
                "Junctional Adhesion Molecule (JAM)",
                "Vascular Endothelial Cadherin (VE-Cadherin)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Intercellular Adhesion Molecule (ICAM)",
                "Vascular Cell Adhesion Molecule (VCAM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cadherin (CDH)",
                "Collagen (COL)",
                "Ephrin (EFN)",
                "Fibronectin (FN)",
                "Glypican (GPC)",
                "Hyaluronic acid (HA)",
                "Immunoglobulin superfamily (IgSF)",
                "Integrin (ITG)",
                "Intercellular Adhesion Molecule (ICAM)",
                "Junctional Adhesion Molecule (JAM)",
                "Laminin (LAMA)",
                "Mucin (MUC)",
                "Nectin (NECTIN)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neuropilin (NRP)",
                "Osteopontin (OPN)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Selectin (SELE)",
                "Semaphorin (SEMA)",
                "Syndecan (SDC)",
                "Thrombospondin (THBS)",
                "Vascular Cell Adhesion Molecule (VCAM)",
                "Vascular Endothelial Cadherin (VE-Cadherin)",
                "Vitronectin (VTN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH)",
            "Integrin (ITGR)",
            "Selectin (SELE)",
            "Immunoglobulin Superfamily Cell Adhesion Molecule (IGSF-CAM)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "Vascular Cell Adhesion Molecule (VCAM)",
            "Intercellular Adhesion Molecule (ICAM)",
            "Platelet Endothelial Cell Adhesion Molecule (PECAM)",
            "Epithelial Cell Adhesion Molecule (EpCAM)",
            "Junctional Adhesion Molecule (JAM)",
            "Desmogleins (DSG)",
            "Desmocollins (DSC)",
            "E-Cadherin (CDH1)",
            "N-Cadherin (CDH2)",
            "P-Cadherin (CDH3)",
            "VE-Cadherin (CDH5)",
            "Integrin Alpha 4 Beta 1 (ITGA4/ITGB1)",
            "Integrin Alpha L Beta 2 (ITGAL/ITGB2)",
            "Integrin Alpha 5 Beta 1 (ITGA5/ITGB1)",
            "E-Selectin (SELE)",
            "P-Selectin (SELP)",
            "L-Selectin (SELL)",
            "Neural Cell Adhesion Molecule 1 (NCAM1)",
            "Neural Cell Adhesion Molecule 2 (NCAM2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH)",
                "Integrin (ITGR)",
                "Selectin (SELE)",
                "Immunoglobulin Superfamily Cell Adhesion Molecule (IGSF-CAM)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Vascular Cell Adhesion Molecule (VCAM)",
                "Intercellular Adhesion Molecule (ICAM)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM)",
                "Epithelial Cell Adhesion Molecule (EpCAM)",
                "Junctional Adhesion Molecule (JAM)",
                "Desmogleins (DSG)",
                "Desmocollins (DSC)",
                "E-Cadherin (CDH1)",
                "N-Cadherin (CDH2)",
                "P-Cadherin (CDH3)",
                "VE-Cadherin (CDH5)",
                "Integrin Alpha 4 Beta 1 (ITGA4/ITGB1)",
                "Integrin Alpha L Beta 2 (ITGAL/ITGB2)",
                "Integrin Alpha 5 Beta 1 (ITGA5/ITGB1)",
                "E-Selectin (SELE)",
                "P-Selectin (SELP)",
                "L-Selectin (SELL)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Neural Cell Adhesion Molecule 2 (NCAM2)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cadherin (CDH)",
                "Desmocollins (DSC)",
                "Desmogleins (DSG)",
                "E-Cadherin (CDH1)",
                "E-Selectin (SELE)",
                "Epithelial Cell Adhesion Molecule (EpCAM)",
                "Immunoglobulin Superfamily Cell Adhesion Molecule (IGSF-CAM)",
                "Integrin (ITGR)",
                "Integrin Alpha 4 Beta 1 (ITGA4/ITGB1)",
                "Integrin Alpha 5 Beta 1 (ITGA5/ITGB1)",
                "Integrin Alpha L Beta 2 (ITGAL/ITGB2)",
                "Intercellular Adhesion Molecule (ICAM)",
                "Junctional Adhesion Molecule (JAM)",
                "L-Selectin (SELL)",
                "N-Cadherin (CDH2)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Neural Cell Adhesion Molecule 2 (NCAM2)",
                "P-Cadherin (CDH3)",
                "P-Selectin (SELP)",
                "Platelet Endothelial Cell Adhesion Molecule (PECAM)",
                "Selectin (SELE)",
                "VE-Cadherin (CDH5)",
                "Vascular Cell Adhesion Molecule (VCAM)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH1)",
            "Integrin (ITGA1)",
            "Selectin (SELE)",
            "L-selectin (CD62L)",
            "P-selectin (CD62P)",
            "E-selectin (CD62E)",
            "Vascular cell adhesion molecule 1 (VCAM1)",
            "Intercellular adhesion molecule 1 (ICAM1)",
            "Platelet endothelial cell adhesion molecule 1 (PECAM1)",
            "N-cadherin (CDH2)",
            "P-cadherin (CDH3)",
            "Ep-cadherin (CDH1)",
            "T-cadherin (CDH13)",
            "Cadherin-11 (CDH11)",
            "Cadherin-12 (CDH12)",
            "Cadherin-17 (CDH17)",
            "Cadherin-20 (CDH20)",
            "Cadherin-23 (CDH23)",
            "Cadherin-24 (CDH24)",
            "Cadherin-5 (CDH5)",
            "Cadherin-6 (CDH6)",
            "Cadherin-7 (CDH7)",
            "Cadherin-8 (CDH8)",
            "Cadherin-9 (CDH9)",
            "Cadherin-10 (CDH10)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH1)",
                "Integrin (ITGA1)",
                "Selectin (SELE)",
                "L-selectin (CD62L)",
                "P-selectin (CD62P)",
                "E-selectin (CD62E)",
                "Vascular cell adhesion molecule 1 (VCAM1)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Platelet endothelial cell adhesion molecule 1 (PECAM1)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "Ep-cadherin (CDH1)",
                "T-cadherin (CDH13)",
                "Cadherin-11 (CDH11)",
                "Cadherin-12 (CDH12)",
                "Cadherin-17 (CDH17)",
                "Cadherin-20 (CDH20)",
                "Cadherin-23 (CDH23)",
                "Cadherin-24 (CDH24)",
                "Cadherin-5 (CDH5)",
                "Cadherin-6 (CDH6)",
                "Cadherin-7 (CDH7)",
                "Cadherin-8 (CDH8)",
                "Cadherin-9 (CDH9)"
            ],
            "mismatches": [
                "Cadherin-10 (CDH10)"
            ],
            "true_referents": [
                "Cadherin (CDH1)",
                "Cadherin-11 (CDH11)",
                "Cadherin-12 (CDH12)",
                "Cadherin-17 (CDH17)",
                "Cadherin-20 (CDH20)",
                "Cadherin-23 (CDH23)",
                "Cadherin-24 (CDH24)",
                "Cadherin-5 (CDH5)",
                "Cadherin-6 (CDH6)",
                "Cadherin-7 (CDH7)",
                "Cadherin-8 (CDH8)",
                "Cadherin-9 (CDH9)",
                "E-selectin (CD62E)",
                "Ep-cadherin (CDH1)",
                "Integrin (ITGA1)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "L-selectin (CD62L)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "P-selectin (CD62P)",
                "Platelet endothelial cell adhesion molecule 1 (PECAM1)",
                "Selectin (SELE)",
                "T-cadherin (CDH13)",
                "Vascular cell adhesion molecule 1 (VCAM1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-Cadherin (CDH1)",
            "N-Cadherin (CDH2)",
            "V-Cadherin (CDH5)",
            "P-Cadherin (CDH3)",
            "R-Cadherin (CDH4)",
            "T-Cadherin (CDH13)",
            "OB-Cadherin (CDH11)",
            "VE-Cadherin (CDH5)",
            "ACAM (CDH4)",
            "Desmoglein (DSG)",
            "Desmocollin (DSC)",
            "Occludin (OCLN)",
            "Claudin (CLDN)",
            "JAM-A (F11R)",
            "JAM-B (JAM2)",
            "JAM-C (JAM3)",
            "PECAM-1 (CD31)",
            "ICAM-1 (CD54)",
            "ICAM-2 (CD102)",
            "ICAM-3 (CD50)",
            "VCAM-1 (CD106)",
            "NCAM (CD56)",
            "L1CAM (CD171)",
            "Neurofascin (NFASC)",
            "CHL1 (CALL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-Cadherin (CDH1)",
                "N-Cadherin (CDH2)",
                "V-Cadherin (CDH5)",
                "P-Cadherin (CDH3)",
                "R-Cadherin (CDH4)",
                "T-Cadherin (CDH13)",
                "OB-Cadherin (CDH11)",
                "VE-Cadherin (CDH5)",
                "ACAM (CDH4)",
                "Desmoglein (DSG)",
                "Desmocollin (DSC)",
                "Occludin (OCLN)",
                "Claudin (CLDN)",
                "JAM-A (F11R)",
                "JAM-B (JAM2)",
                "JAM-C (JAM3)",
                "PECAM-1 (CD31)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD102)",
                "ICAM-3 (CD50)",
                "VCAM-1 (CD106)",
                "NCAM (CD56)",
                "L1CAM (CD171)",
                "Neurofascin (NFASC)"
            ],
            "mismatches": [
                "CHL1 (CALL)"
            ],
            "true_referents": [
                "ACAM (CDH4)",
                "Claudin (CLDN)",
                "Desmocollin (DSC)",
                "Desmoglein (DSG)",
                "E-Cadherin (CDH1)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD102)",
                "ICAM-3 (CD50)",
                "JAM-A (F11R)",
                "JAM-B (JAM2)",
                "JAM-C (JAM3)",
                "L1CAM (CD171)",
                "N-Cadherin (CDH2)",
                "NCAM (CD56)",
                "Neurofascin (NFASC)",
                "OB-Cadherin (CDH11)",
                "Occludin (OCLN)",
                "P-Cadherin (CDH3)",
                "PECAM-1 (CD31)",
                "R-Cadherin (CDH4)",
                "T-Cadherin (CDH13)",
                "V-Cadherin (CDH5)",
                "VCAM-1 (CD106)",
                "VE-Cadherin (CDH5)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            {
                "Referent": "Cadherins",
                "Canonical name": "(CDH)"
            },
            {
                "Referent": "Integrins",
                "Canonical name": "(ITG)"
            },
            {
                "Referent": "Selectins",
                "Canonical name": "(SEL)"
            },
            {
                "Referent": "Immunoglobulins",
                "Canonical name": "(IG)"
            },
            {
                "Referent": "Intercellular adhesion molecule",
                "Canonical name": "(ICAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Lymphocyte function-associated antigen 1",
                "Canonical name": "(LFA-1)"
            },
            {
                "Referent": "Melanoma cell adhesion molecule",
                "Canonical name": "(MCAM)"
            },
            {
                "Referent": "Melanoma cell adhesion molecule",
                "Canonical name": "(MCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Intercellular adhesion molecule",
                "Canonical name": "(ICAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            },
            {
                "Referent": "Neural cell adhesion molecule",
                "Canonical name": "(NCAM)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherins",
                "Integrins",
                "Selectins",
                "Immunoglobulins",
                "Intercellular adhesion molecule",
                "Neural cell adhesion molecule",
                "Lymphocyte function-associated antigen 1",
                "Melanoma cell adhesion molecule"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Cadherins\", \"Canonical name\": \"(CDH)\"}",
                "{\"Referent\": \"Immunoglobulins\", \"Canonical name\": \"(IG)\"}",
                "{\"Referent\": \"Integrins\", \"Canonical name\": \"(ITG)\"}",
                "{\"Referent\": \"Intercellular adhesion molecule\", \"Canonical name\": \"(ICAM)\"}",
                "{\"Referent\": \"Lymphocyte function-associated antigen 1\", \"Canonical name\": \"(LFA-1)\"}",
                "{\"Referent\": \"Melanoma cell adhesion molecule\", \"Canonical name\": \"(MCAM)\"}",
                "{\"Referent\": \"Neural cell adhesion molecule\", \"Canonical name\": \"(NCAM)\"}",
                "{\"Referent\": \"Selectins\", \"Canonical name\": \"(SEL)\"}"
            ],
            "TP": 8,
            "FP": 0,
            "FN": 0
        }
    }
]