[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH)",
            "Selectin (SEL)",
            "Integrin (ITG)",
            "N-Cadherin (CDH2)",
            "E-Cadherin (CDH1)",
            "P-Cadherin (CDH3)",
            "Protocadherin (PCDH)",
            "Desmoglein (DSG)",
            "Desmocollin (DSC)",
            "Connexin (GJB1)",
            "Claudin (CLDN)",
            "Junctional Adhesion Molecule (JAM)",
            "E-Cadherin (CDH1)",
            "N-Cadherin (CDH2)",
            "P-Cadherin (CDH3)",
            "Nectin (PVRL)",
            "Occludin (OCLN)",
            "Cadherin-Related Family Member 3 (CDHR3)",
            "CD44 (CD44)",
            "CD147 (Basigin, BTG4)",
            "CD43 (Sialophorin)",
            "CD54 (ICAM-1)",
            "CD11a (ITGAL)",
            "CD11b (ITGAM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH)",
                "Selectin (SEL)",
                "Integrin (ITG)",
                "N-Cadherin (CDH2)",
                "E-Cadherin (CDH1)",
                "P-Cadherin (CDH3)",
                "Protocadherin (PCDH)",
                "Desmoglein (DSG)",
                "Desmocollin (DSC)",
                "Connexin (GJB1)",
                "Claudin (CLDN)",
                "Junctional Adhesion Molecule (JAM)",
                "Nectin (PVRL)",
                "Occludin (OCLN)",
                "Cadherin-Related Family Member 3 (CDHR3)",
                "CD44 (CD44)",
                "CD147 (Basigin, BTG4)",
                "CD43 (Sialophorin)",
                "CD54 (ICAM-1)",
                "CD11a (ITGAL)",
                "CD11b (ITGAM)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD11a (ITGAL)",
                "CD11b (ITGAM)",
                "CD147 (Basigin, BTG4)",
                "CD43 (Sialophorin)",
                "CD44 (CD44)",
                "CD54 (ICAM-1)",
                "Cadherin (CDH)",
                "Cadherin-Related Family Member 3 (CDHR3)",
                "Claudin (CLDN)",
                "Connexin (GJB1)",
                "Desmocollin (DSC)",
                "Desmoglein (DSG)",
                "E-Cadherin (CDH1)",
                "Integrin (ITG)",
                "Junctional Adhesion Molecule (JAM)",
                "N-Cadherin (CDH2)",
                "Nectin (PVRL)",
                "Occludin (OCLN)",
                "P-Cadherin (CDH3)",
                "Protocadherin (PCDH)",
                "Selectin (SEL)"
            ],
            "TP": 21,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Intercellular Adhesion Molecule 1 (ICAM-1)",
            "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
            "E-Selectin",
            "P-Selectin",
            "L-Selectin",
            "N-Cadherin",
            "E-Cadherin",
            "P-Cadherin",
            "T-Cell Surface Glycoprotein CD2",
            "T-Cell Surface Glycoprotein CD4",
            "T-Cell Surface Glycoprotein CD8",
            "Leukocyte Function-Associated Antigen 1 (LFA-1)",
            "Integrin alpha L beta 2",
            "Integrin alpha M beta 2",
            "Integrin alpha V beta 3",
            "Integrin alpha V beta 5",
            "Integrin alpha 4 beta 1",
            "Mucin 1 (MUC1)",
            "Mucin 4 (MUC4)",
            "Mucin 16 (CA125)",
            "Mucin 17 (CA19-9)",
            "Mucin 19 (CA72-4)",
            "Mucin 21 (CA15-3)",
            "Mucin 24 (MUC24)",
            "Mucin 28 (MUC28)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)",
                "E-Selectin",
                "P-Selectin",
                "L-Selectin",
                "N-Cadherin",
                "E-Cadherin",
                "P-Cadherin",
                "T-Cell Surface Glycoprotein CD2",
                "T-Cell Surface Glycoprotein CD4",
                "T-Cell Surface Glycoprotein CD8",
                "Leukocyte Function-Associated Antigen 1 (LFA-1)",
                "Integrin alpha L beta 2",
                "Integrin alpha M beta 2",
                "Integrin alpha V beta 3",
                "Integrin alpha V beta 5",
                "Integrin alpha 4 beta 1",
                "Mucin 1 (MUC1)",
                "Mucin 4 (MUC4)",
                "Mucin 16 (CA125)",
                "Mucin 17 (CA19-9)",
                "Mucin 19 (CA72-4)",
                "Mucin 21 (CA15-3)",
                "Mucin 24 (MUC24)"
            ],
            "mismatches": [
                "Mucin 28 (MUC28)"
            ],
            "true_referents": [
                "E-Cadherin",
                "E-Selectin",
                "Integrin alpha 4 beta 1",
                "Integrin alpha L beta 2",
                "Integrin alpha M beta 2",
                "Integrin alpha V beta 3",
                "Integrin alpha V beta 5",
                "Intercellular Adhesion Molecule 1 (ICAM-1)",
                "L-Selectin",
                "Leukocyte Function-Associated Antigen 1 (LFA-1)",
                "Mucin 1 (MUC1)",
                "Mucin 16 (CA125)",
                "Mucin 17 (CA19-9)",
                "Mucin 19 (CA72-4)",
                "Mucin 21 (CA15-3)",
                "Mucin 24 (MUC24)",
                "Mucin 4 (MUC4)",
                "N-Cadherin",
                "P-Cadherin",
                "P-Selectin",
                "T-Cell Surface Glycoprotein CD2",
                "T-Cell Surface Glycoprotein CD4",
                "T-Cell Surface Glycoprotein CD8",
                "Vascular Cell Adhesion Molecule 1 (VCAM-1)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-cadherin (CDH1)",
            "N-cadherin (CDH2)",
            "Vascular endothelial cadherin (CDH5)",
            "Desmoglein (DSG)",
            "Desmocollin (DSC)",
            "Integrin \u03b1L\u03b22 (ITGAL/ITGB2)",
            "Integrin \u03b14\u03b21 (ITGA4/ITGB1)",
            "Integrin \u03b15\u03b21 (ITGA5/ITGB1)",
            "Integrin \u03b1v\u03b23 (ITGAV/ITGB3)",
            "Neural cell adhesion molecule (NCAM)",
            "L-selectin (SELL)",
            "P-selectin (SELP)",
            "E-selectin (SELE)",
            "Intercellular adhesion molecule 1 (ICAM1)",
            "Intercellular adhesion molecule 2 (ICAM2)",
            "Vascular cell adhesion molecule 1 (VCAM1)",
            "Platelet endothelial cell adhesion molecule 1 (PECAM1)",
            "Mucin 1 (MUC1)",
            "CD44",
            "CD47",
            "CD54",
            "CD58",
            "CD151",
            "CD226"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-cadherin (CDH1)",
                "N-cadherin (CDH2)",
                "Vascular endothelial cadherin (CDH5)",
                "Desmoglein (DSG)",
                "Desmocollin (DSC)",
                "Integrin \u03b1L\u03b22 (ITGAL/ITGB2)",
                "Integrin \u03b14\u03b21 (ITGA4/ITGB1)",
                "Integrin \u03b15\u03b21 (ITGA5/ITGB1)",
                "Integrin \u03b1v\u03b23 (ITGAV/ITGB3)",
                "Neural cell adhesion molecule (NCAM)",
                "L-selectin (SELL)",
                "P-selectin (SELP)",
                "E-selectin (SELE)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Intercellular adhesion molecule 2 (ICAM2)",
                "Vascular cell adhesion molecule 1 (VCAM1)",
                "Platelet endothelial cell adhesion molecule 1 (PECAM1)",
                "Mucin 1 (MUC1)",
                "CD44",
                "CD47",
                "CD54",
                "CD58",
                "CD151",
                "CD226"
            ],
            "mismatches": [],
            "true_referents": [
                "CD151",
                "CD226",
                "CD44",
                "CD47",
                "CD54",
                "CD58",
                "Desmocollin (DSC)",
                "Desmoglein (DSG)",
                "E-cadherin (CDH1)",
                "E-selectin (SELE)",
                "Integrin \u03b14\u03b21 (ITGA4/ITGB1)",
                "Integrin \u03b15\u03b21 (ITGA5/ITGB1)",
                "Integrin \u03b1L\u03b22 (ITGAL/ITGB2)",
                "Integrin \u03b1v\u03b23 (ITGAV/ITGB3)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Intercellular adhesion molecule 2 (ICAM2)",
                "L-selectin (SELL)",
                "Mucin 1 (MUC1)",
                "N-cadherin (CDH2)",
                "Neural cell adhesion molecule (NCAM)",
                "P-selectin (SELP)",
                "Platelet endothelial cell adhesion molecule 1 (PECAM1)",
                "Vascular cell adhesion molecule 1 (VCAM1)",
                "Vascular endothelial cadherin (CDH5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin-1 (CDH1)",
            "Integrin \u03b15\u03b21 (ITGA5B1)",
            "N-Cadherin (NCDH)",
            "E-Cadherin (CDH1)",
            "P-Cadherin (CDH3)",
            "VCAM-1 (VCAM1)",
            "ICAM-1 (ICAM1)",
            "L-Selectin (SELL)",
            "E-Selectin (SELE)",
            "P-Selectin (SELP)",
            "Neural Cell Adhesion Molecule 1 (NCAM1)",
            "Immunoglobulin Superfamily Cell Adhesion Molecule 1 (ICOSL)",
            "Platelet-Endothelial Cell Adhesion Molecule 1 (PECAM1)",
            "CD44 (CD44)",
            "Syndecan-1 (SDC1)",
            "EpCAM (EPCAM)",
            "Desmoglein 3 (DSG3)",
            "Desmocollin 3 (DSC3)",
            "Claudin-1 (CLDN1)",
            "JAM-A (JAM1)",
            "CECAM-1 (CECAM1)",
            "CD11a/CD18 (LFA-1)",
            "CD29 (Integrin \u03b21)",
            "CD54 (ICAM-1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin-1 (CDH1)",
                "Integrin \u03b15\u03b21 (ITGA5B1)",
                "N-Cadherin (NCDH)",
                "E-Cadherin (CDH1)",
                "P-Cadherin (CDH3)",
                "VCAM-1 (VCAM1)",
                "ICAM-1 (ICAM1)",
                "L-Selectin (SELL)",
                "E-Selectin (SELE)",
                "P-Selectin (SELP)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Immunoglobulin Superfamily Cell Adhesion Molecule 1 (ICOSL)",
                "Platelet-Endothelial Cell Adhesion Molecule 1 (PECAM1)",
                "CD44 (CD44)",
                "Syndecan-1 (SDC1)",
                "EpCAM (EPCAM)",
                "Desmoglein 3 (DSG3)",
                "Desmocollin 3 (DSC3)",
                "Claudin-1 (CLDN1)",
                "JAM-A (JAM1)",
                "CECAM-1 (CECAM1)",
                "CD11a/CD18 (LFA-1)",
                "CD29 (Integrin \u03b21)",
                "CD54 (ICAM-1)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD11a/CD18 (LFA-1)",
                "CD29 (Integrin \u03b21)",
                "CD44 (CD44)",
                "CD54 (ICAM-1)",
                "CECAM-1 (CECAM1)",
                "Cadherin-1 (CDH1)",
                "Claudin-1 (CLDN1)",
                "Desmocollin 3 (DSC3)",
                "Desmoglein 3 (DSG3)",
                "E-Cadherin (CDH1)",
                "E-Selectin (SELE)",
                "EpCAM (EPCAM)",
                "ICAM-1 (ICAM1)",
                "Immunoglobulin Superfamily Cell Adhesion Molecule 1 (ICOSL)",
                "Integrin \u03b15\u03b21 (ITGA5B1)",
                "JAM-A (JAM1)",
                "L-Selectin (SELL)",
                "N-Cadherin (NCDH)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "P-Cadherin (CDH3)",
                "P-Selectin (SELP)",
                "Platelet-Endothelial Cell Adhesion Molecule 1 (PECAM1)",
                "Syndecan-1 (SDC1)",
                "VCAM-1 (VCAM1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-cadherin (CDH1)",
            "N-cadherin (CDH2)",
            "P-cadherin (CDH3)",
            "VE-cadherin (CDH5)",
            "ICAM-1 (CD54)",
            "ICAM-2 (CD102)",
            "VCAM-1 (CD106)",
            "PECAM-1 (CD31)",
            "Selectin L (CD62L)",
            "Selectin E (CD62E)",
            "Selectin P (CD62P)",
            "Integrin alpha-4 beta-1 (VLA-4)",
            "Integrin alpha-5 beta-1 (VLA-5)",
            "Integrin alpha-L beta-2 (LFA-1)",
            "Integrin alpha-M beta-2 (Mac-1)",
            "Integrin alpha-X beta-2 (CD11c/CD18)",
            "Integrin alpha-IIb beta-3 (GPIIb/IIIa)",
            "Integrin alpha-V beta-3 (CD51/CD61)",
            "Integrin alpha-6 beta-1 (CD49f/CD29)",
            "Integrin alpha-1 beta-1 (CD49a/CD29)",
            "Integrin alpha-2 beta-1 (CD49b/CD29)",
            "Integrin alpha-3 beta-1 (CD49c/CD29)",
            "Integrin alpha-9 beta-1",
            "Integrin alpha-7 beta-1"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-cadherin (CDH1)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "VE-cadherin (CDH5)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD102)",
                "VCAM-1 (CD106)",
                "PECAM-1 (CD31)",
                "Selectin L (CD62L)",
                "Selectin E (CD62E)",
                "Selectin P (CD62P)",
                "Integrin alpha-4 beta-1 (VLA-4)",
                "Integrin alpha-5 beta-1 (VLA-5)",
                "Integrin alpha-L beta-2 (LFA-1)",
                "Integrin alpha-M beta-2 (Mac-1)",
                "Integrin alpha-X beta-2 (CD11c/CD18)",
                "Integrin alpha-IIb beta-3 (GPIIb/IIIa)",
                "Integrin alpha-V beta-3 (CD51/CD61)",
                "Integrin alpha-6 beta-1 (CD49f/CD29)",
                "Integrin alpha-1 beta-1 (CD49a/CD29)",
                "Integrin alpha-2 beta-1 (CD49b/CD29)",
                "Integrin alpha-3 beta-1 (CD49c/CD29)",
                "Integrin alpha-9 beta-1",
                "Integrin alpha-7 beta-1"
            ],
            "mismatches": [],
            "true_referents": [
                "E-cadherin (CDH1)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD102)",
                "Integrin alpha-1 beta-1 (CD49a/CD29)",
                "Integrin alpha-2 beta-1 (CD49b/CD29)",
                "Integrin alpha-3 beta-1 (CD49c/CD29)",
                "Integrin alpha-4 beta-1 (VLA-4)",
                "Integrin alpha-5 beta-1 (VLA-5)",
                "Integrin alpha-6 beta-1 (CD49f/CD29)",
                "Integrin alpha-7 beta-1",
                "Integrin alpha-9 beta-1",
                "Integrin alpha-IIb beta-3 (GPIIb/IIIa)",
                "Integrin alpha-L beta-2 (LFA-1)",
                "Integrin alpha-M beta-2 (Mac-1)",
                "Integrin alpha-V beta-3 (CD51/CD61)",
                "Integrin alpha-X beta-2 (CD11c/CD18)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "PECAM-1 (CD31)",
                "Selectin E (CD62E)",
                "Selectin L (CD62L)",
                "Selectin P (CD62P)",
                "VCAM-1 (CD106)",
                "VE-cadherin (CDH5)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (Cdh)",
            "Integrin (Itg)",
            "Selectin (Sel)",
            "Immunoglobulin superfamily (IgSF)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "Epithelial Cadherin (E-cadherin)",
            "N-Cadherin (N-cadherin)",
            "P-Cadherin (P-cadherin)",
            "Fibronectin (FN)",
            "Laminin (Lam)",
            "Desmoglein (Dsg)",
            "Desmocollin (Dsc)",
            "Cell Adhesion Molecule 1 (CAM-1)",
            "Platelet-Endothelial Cell Adhesion Molecule (PECAM-1)",
            "MUC1 (Mucin 1)",
            "Sialylated Glycoprotein (SGP)",
            "CD44 (Cluster of Differentiation 44)",
            "Neurofascin (Nfasc)",
            "Contactin (CNTN)",
            "Chondroitin Sulfate Proteoglycan (CSPG)",
            "Tenascin (TN)",
            "Thrombospondin (TSP)",
            "Myelin-Associated Glycoprotein (MAG)",
            "L1 Cell Adhesion Molecule (L1CAM)",
            "R-cadherin (R-cadherin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (Cdh)",
                "Integrin (Itg)",
                "Selectin (Sel)",
                "Immunoglobulin superfamily (IgSF)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Epithelial Cadherin (E-cadherin)",
                "N-Cadherin (N-cadherin)",
                "P-Cadherin (P-cadherin)",
                "Fibronectin (FN)",
                "Laminin (Lam)",
                "Desmoglein (Dsg)",
                "Desmocollin (Dsc)",
                "Cell Adhesion Molecule 1 (CAM-1)",
                "Platelet-Endothelial Cell Adhesion Molecule (PECAM-1)",
                "MUC1 (Mucin 1)",
                "Sialylated Glycoprotein (SGP)",
                "CD44 (Cluster of Differentiation 44)",
                "Neurofascin (Nfasc)",
                "Contactin (CNTN)",
                "Chondroitin Sulfate Proteoglycan (CSPG)",
                "Tenascin (TN)",
                "Thrombospondin (TSP)",
                "Myelin-Associated Glycoprotein (MAG)",
                "L1 Cell Adhesion Molecule (L1CAM)"
            ],
            "mismatches": [
                "R-cadherin (R-cadherin)"
            ],
            "true_referents": [
                "CD44 (Cluster of Differentiation 44)",
                "Cadherin (Cdh)",
                "Cell Adhesion Molecule 1 (CAM-1)",
                "Chondroitin Sulfate Proteoglycan (CSPG)",
                "Contactin (CNTN)",
                "Desmocollin (Dsc)",
                "Desmoglein (Dsg)",
                "Epithelial Cadherin (E-cadherin)",
                "Fibronectin (FN)",
                "Immunoglobulin superfamily (IgSF)",
                "Integrin (Itg)",
                "L1 Cell Adhesion Molecule (L1CAM)",
                "Laminin (Lam)",
                "MUC1 (Mucin 1)",
                "Myelin-Associated Glycoprotein (MAG)",
                "N-Cadherin (N-cadherin)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neurofascin (Nfasc)",
                "P-Cadherin (P-cadherin)",
                "Platelet-Endothelial Cell Adhesion Molecule (PECAM-1)",
                "Selectin (Sel)",
                "Sialylated Glycoprotein (SGP)",
                "Tenascin (TN)",
                "Thrombospondin (TSP)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Integrin (ITG)",
            "Immunoglobulin superfamily (IgSF)",
            "Cadherins (CDH)",
            "Selectins (SEL)",
            "Intercellular adhesion molecule 1 (ICAM-1)",
            "Vascular cell adhesion molecule 1 (VCAM-1)",
            "L-selectin (SELL)",
            "E-selectin (SELE)",
            "P-selectin (SELP)",
            "Nectin (NECTIN)",
            "Neural cell adhesion molecule (NCAM)",
            "Leukocyte function-associated antigen 1 (LFA-1)",
            "Macrophage-1 antigen (MAC-1)",
            "Junctional adhesion molecule A (JAM-A)",
            "Junctional adhesion molecule B (JAM-B)",
            "Junctional adhesion molecule C (JAM-C)",
            "Platelet endothelial cell adhesion molecule (PECAM-1)",
            "CD34 molecule (CD34)",
            "CD44 molecule (CD44)",
            "CD58 molecule (CD58)",
            "CD62 molecule (CD62)",
            "CD102 molecule (CD102)",
            "CD106 molecule (CD106)",
            "CD166 molecule (CD166)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Integrin (ITG)",
                "Immunoglobulin superfamily (IgSF)",
                "Cadherins (CDH)",
                "Selectins (SEL)",
                "Intercellular adhesion molecule 1 (ICAM-1)",
                "Vascular cell adhesion molecule 1 (VCAM-1)",
                "L-selectin (SELL)",
                "E-selectin (SELE)",
                "P-selectin (SELP)",
                "Nectin (NECTIN)",
                "Neural cell adhesion molecule (NCAM)",
                "Leukocyte function-associated antigen 1 (LFA-1)",
                "Macrophage-1 antigen (MAC-1)",
                "Junctional adhesion molecule A (JAM-A)",
                "Junctional adhesion molecule B (JAM-B)",
                "Junctional adhesion molecule C (JAM-C)",
                "Platelet endothelial cell adhesion molecule (PECAM-1)",
                "CD34 molecule (CD34)",
                "CD44 molecule (CD44)",
                "CD58 molecule (CD58)",
                "CD62 molecule (CD62)",
                "CD102 molecule (CD102)",
                "CD106 molecule (CD106)",
                "CD166 molecule (CD166)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD102 molecule (CD102)",
                "CD106 molecule (CD106)",
                "CD166 molecule (CD166)",
                "CD34 molecule (CD34)",
                "CD44 molecule (CD44)",
                "CD58 molecule (CD58)",
                "CD62 molecule (CD62)",
                "Cadherins (CDH)",
                "E-selectin (SELE)",
                "Immunoglobulin superfamily (IgSF)",
                "Integrin (ITG)",
                "Intercellular adhesion molecule 1 (ICAM-1)",
                "Junctional adhesion molecule A (JAM-A)",
                "Junctional adhesion molecule B (JAM-B)",
                "Junctional adhesion molecule C (JAM-C)",
                "L-selectin (SELL)",
                "Leukocyte function-associated antigen 1 (LFA-1)",
                "Macrophage-1 antigen (MAC-1)",
                "Nectin (NECTIN)",
                "Neural cell adhesion molecule (NCAM)",
                "P-selectin (SELP)",
                "Platelet endothelial cell adhesion molecule (PECAM-1)",
                "Selectins (SEL)",
                "Vascular cell adhesion molecule 1 (VCAM-1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "CD44 (cell adhesion molecule)",
            "E-cadherin (epithelial cadherin)",
            "ICAM-1 (intercellular adhesion molecule 1)",
            "VCAM-1 (vascular cell adhesion molecule 1)",
            "L-selectin (lymphocyte adhesion molecule 1)",
            "P-selectin (platelet selectin)",
            "N-cadherin (neuronal cadherin)",
            "Integrins",
            "CD2 (T-cell surface antigen)",
            "CD58 (lymphocyte function-associated antigen 3)",
            "CD11a/CD18 (lymphocyte function-associated antigen 1)",
            "CD11b/CD18 (Mac-1 integrin)",
            "CD11c/CD18 (p150/95 integrin)",
            "CD49a/CD29 (VLA-1 integrin)",
            "CD49b/CD29 (VLA-2 integrin)",
            "CD49c/CD29 (VLA-3 integrin)",
            "CD49d/CD29 (VLA-4 integrin)",
            "CD49e/CD29 (VLA-5 integrin)",
            "CD49f/CD29 (VLA-6 integrin)",
            "CD49g/CD29 (VLA-7 integrin)",
            "CD49h/CD29 (VLA-8 integrin)",
            "CD49i/CD29 (VLA-9 integrin)",
            "CD49j/CD29 (VLA-10 integrin)",
            "CD49k/CD29 (VLA-11 integrin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "CD44 (cell adhesion molecule)",
                "E-cadherin (epithelial cadherin)",
                "ICAM-1 (intercellular adhesion molecule 1)",
                "VCAM-1 (vascular cell adhesion molecule 1)",
                "L-selectin (lymphocyte adhesion molecule 1)",
                "P-selectin (platelet selectin)",
                "N-cadherin (neuronal cadherin)",
                "Integrins",
                "CD2 (T-cell surface antigen)",
                "CD58 (lymphocyte function-associated antigen 3)",
                "CD11a/CD18 (lymphocyte function-associated antigen 1)",
                "CD11b/CD18 (Mac-1 integrin)",
                "CD11c/CD18 (p150/95 integrin)",
                "CD49a/CD29 (VLA-1 integrin)",
                "CD49b/CD29 (VLA-2 integrin)",
                "CD49c/CD29 (VLA-3 integrin)",
                "CD49d/CD29 (VLA-4 integrin)",
                "CD49e/CD29 (VLA-5 integrin)",
                "CD49f/CD29 (VLA-6 integrin)",
                "CD49g/CD29 (VLA-7 integrin)",
                "CD49h/CD29 (VLA-8 integrin)",
                "CD49i/CD29 (VLA-9 integrin)",
                "CD49j/CD29 (VLA-10 integrin)",
                "CD49k/CD29 (VLA-11 integrin)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD11a/CD18 (lymphocyte function-associated antigen 1)",
                "CD11b/CD18 (Mac-1 integrin)",
                "CD11c/CD18 (p150/95 integrin)",
                "CD2 (T-cell surface antigen)",
                "CD44 (cell adhesion molecule)",
                "CD49a/CD29 (VLA-1 integrin)",
                "CD49b/CD29 (VLA-2 integrin)",
                "CD49c/CD29 (VLA-3 integrin)",
                "CD49d/CD29 (VLA-4 integrin)",
                "CD49e/CD29 (VLA-5 integrin)",
                "CD49f/CD29 (VLA-6 integrin)",
                "CD49g/CD29 (VLA-7 integrin)",
                "CD49h/CD29 (VLA-8 integrin)",
                "CD49i/CD29 (VLA-9 integrin)",
                "CD49j/CD29 (VLA-10 integrin)",
                "CD49k/CD29 (VLA-11 integrin)",
                "CD58 (lymphocyte function-associated antigen 3)",
                "E-cadherin (epithelial cadherin)",
                "ICAM-1 (intercellular adhesion molecule 1)",
                "Integrins",
                "L-selectin (lymphocyte adhesion molecule 1)",
                "N-cadherin (neuronal cadherin)",
                "P-selectin (platelet selectin)",
                "VCAM-1 (vascular cell adhesion molecule 1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-cadherin (CDH1)",
            "N-cadherin (CDH2)",
            "P-cadherin (CDH3)",
            "VE-cadherin (CDH5)",
            "ICAM-1 (CD54)",
            "ICAM-2 (CD102)",
            "ICAM-3 (CD50)",
            "VCAM-1 (CD106)",
            "Integrin \u03b1L\u03b22 (ITGAL/ITGB2)",
            "Integrin \u03b1M\u03b22 (ITGAM/ITGB2)",
            "Integrin \u03b14\u03b21 (ITGA4/ITGB1)",
            "Integrin \u03b15\u03b21 (ITGA5/ITGB1)",
            "Integrin \u03b1V\u03b23 (ITGAV/ITGB3)",
            "E-selectin (CD62E)",
            "P-selectin (CD62P)",
            "N-selectin (CD62L)",
            "JAM-A (F11R)",
            "JAM-B (F11R2)",
            "JAM-C (F11R3)",
            "NCAM1 (CD56)",
            "L1CAM",
            "MCAM (CD146)",
            "PECAM-1 (CD31)",
            "ALCAM (CD166)",
            "MAdCAM-1 (CDM1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-cadherin (CDH1)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "VE-cadherin (CDH5)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD102)",
                "ICAM-3 (CD50)",
                "VCAM-1 (CD106)",
                "Integrin \u03b1L\u03b22 (ITGAL/ITGB2)",
                "Integrin \u03b1M\u03b22 (ITGAM/ITGB2)",
                "Integrin \u03b14\u03b21 (ITGA4/ITGB1)",
                "Integrin \u03b15\u03b21 (ITGA5/ITGB1)",
                "Integrin \u03b1V\u03b23 (ITGAV/ITGB3)",
                "E-selectin (CD62E)",
                "P-selectin (CD62P)",
                "N-selectin (CD62L)",
                "JAM-A (F11R)",
                "JAM-B (F11R2)",
                "JAM-C (F11R3)",
                "NCAM1 (CD56)",
                "L1CAM",
                "MCAM (CD146)",
                "PECAM-1 (CD31)",
                "ALCAM (CD166)"
            ],
            "mismatches": [
                "MAdCAM-1 (CDM1)"
            ],
            "true_referents": [
                "ALCAM (CD166)",
                "E-cadherin (CDH1)",
                "E-selectin (CD62E)",
                "ICAM-1 (CD54)",
                "ICAM-2 (CD102)",
                "ICAM-3 (CD50)",
                "Integrin \u03b14\u03b21 (ITGA4/ITGB1)",
                "Integrin \u03b15\u03b21 (ITGA5/ITGB1)",
                "Integrin \u03b1L\u03b22 (ITGAL/ITGB2)",
                "Integrin \u03b1M\u03b22 (ITGAM/ITGB2)",
                "Integrin \u03b1V\u03b23 (ITGAV/ITGB3)",
                "JAM-A (F11R)",
                "JAM-B (F11R2)",
                "JAM-C (F11R3)",
                "L1CAM",
                "MCAM (CD146)",
                "N-cadherin (CDH2)",
                "N-selectin (CD62L)",
                "NCAM1 (CD56)",
                "P-cadherin (CDH3)",
                "P-selectin (CD62P)",
                "PECAM-1 (CD31)",
                "VCAM-1 (CD106)",
                "VE-cadherin (CDH5)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "E-cadherin (CDH1)",
            "N-cadherin (CDH2)",
            "P-cadherin (CDH3)",
            "VE-cadherin (CDH5)",
            "Intercellular adhesion molecule 1 (ICAM-1)",
            "Vascular cell adhesion molecule 1 (VCAM-1)",
            "Neural cell adhesion molecule (NCAM)",
            "Epithelial cell adhesion molecule (EpCAM)",
            "Platelet endothelial cell adhesion molecule (PECAM-1)",
            "L1 cell adhesion molecule (L1CAM)",
            "Junctional adhesion molecule A (JAM-A)",
            "Claudin-1",
            "Occludin",
            "Desmoglein-1",
            "Desmocollin-1",
            "Integrin alpha-5 beta-1",
            "Integrin alpha-V beta-3",
            "Selectin E (SELE)",
            "Selectin P (SELP)",
            "Selectin L (SELL)",
            "CD44",
            "Mucin-1 (MUC1)",
            "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
            "Activated leukocyte cell adhesion molecule (ALCAM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "E-cadherin (CDH1)",
                "N-cadherin (CDH2)",
                "P-cadherin (CDH3)",
                "VE-cadherin (CDH5)",
                "Intercellular adhesion molecule 1 (ICAM-1)",
                "Vascular cell adhesion molecule 1 (VCAM-1)",
                "Neural cell adhesion molecule (NCAM)",
                "Epithelial cell adhesion molecule (EpCAM)",
                "Platelet endothelial cell adhesion molecule (PECAM-1)",
                "L1 cell adhesion molecule (L1CAM)",
                "Junctional adhesion molecule A (JAM-A)",
                "Claudin-1",
                "Occludin",
                "Desmoglein-1",
                "Desmocollin-1",
                "Integrin alpha-5 beta-1",
                "Integrin alpha-V beta-3",
                "Selectin E (SELE)",
                "Selectin P (SELP)",
                "Selectin L (SELL)",
                "CD44",
                "Mucin-1 (MUC1)",
                "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
                "Activated leukocyte cell adhesion molecule (ALCAM)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "CD44",
                "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
                "Claudin-1",
                "Desmocollin-1",
                "Desmoglein-1",
                "E-cadherin (CDH1)",
                "Epithelial cell adhesion molecule (EpCAM)",
                "Integrin alpha-5 beta-1",
                "Integrin alpha-V beta-3",
                "Intercellular adhesion molecule 1 (ICAM-1)",
                "Junctional adhesion molecule A (JAM-A)",
                "L1 cell adhesion molecule (L1CAM)",
                "Mucin-1 (MUC1)",
                "N-cadherin (CDH2)",
                "Neural cell adhesion molecule (NCAM)",
                "Occludin",
                "P-cadherin (CDH3)",
                "Platelet endothelial cell adhesion molecule (PECAM-1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "VE-cadherin (CDH5)",
                "Vascular cell adhesion molecule 1 (VCAM-1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Neural cell adhesion molecule 1 (NCAM1)",
            "Intercellular adhesion molecule 1 (ICAM1)",
            "Vascular cell adhesion molecule 1 (VCAM1)",
            "Platelet endothelial cell adhesion molecule (PECAM1)",
            "Epithelial cell adhesion molecule (EpCAM)",
            "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
            "Melanoma cell adhesion molecule (MCAM)",
            "Activated leukocyte cell adhesion molecule (ALCAM)",
            "Junctional adhesion molecule A (JAM-A)",
            "Cadherin 1 (CDH1)",
            "Cadherin 2 (CDH2)",
            "Cadherin 5 (CDH5)",
            "Protocadherin 1 (PCDH1)",
            "Desmoglein 1 (DSG1)",
            "Desmocollin 1 (DSC1)",
            "Selectin P (SELP)",
            "Selectin E (SELE)",
            "Selectin L (SELL)",
            "Integrin alpha 1 (ITGA1)",
            "Integrin alpha 2 (ITGA2)",
            "Integrin alpha 4 (ITGA4)",
            "Integrin alpha 5 (ITGA5)",
            "Integrin alpha 6 (ITGA6)",
            "Integrin beta 1 (ITGB1)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Neural cell adhesion molecule 1 (NCAM1)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Vascular cell adhesion molecule 1 (VCAM1)",
                "Platelet endothelial cell adhesion molecule (PECAM1)",
                "Epithelial cell adhesion molecule (EpCAM)",
                "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
                "Melanoma cell adhesion molecule (MCAM)",
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "Junctional adhesion molecule A (JAM-A)",
                "Cadherin 1 (CDH1)",
                "Cadherin 2 (CDH2)",
                "Cadherin 5 (CDH5)",
                "Protocadherin 1 (PCDH1)",
                "Desmoglein 1 (DSG1)",
                "Desmocollin 1 (DSC1)",
                "Selectin P (SELP)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 2 (ITGA2)",
                "Integrin alpha 4 (ITGA4)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin beta 1 (ITGB1)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "Cadherin 1 (CDH1)",
                "Cadherin 2 (CDH2)",
                "Cadherin 5 (CDH5)",
                "Carcinoembryonic antigen-related cell adhesion molecule 1 (CEACAM1)",
                "Desmocollin 1 (DSC1)",
                "Desmoglein 1 (DSG1)",
                "Epithelial cell adhesion molecule (EpCAM)",
                "Integrin alpha 1 (ITGA1)",
                "Integrin alpha 2 (ITGA2)",
                "Integrin alpha 4 (ITGA4)",
                "Integrin alpha 5 (ITGA5)",
                "Integrin alpha 6 (ITGA6)",
                "Integrin beta 1 (ITGB1)",
                "Intercellular adhesion molecule 1 (ICAM1)",
                "Junctional adhesion molecule A (JAM-A)",
                "Melanoma cell adhesion molecule (MCAM)",
                "Neural cell adhesion molecule 1 (NCAM1)",
                "Platelet endothelial cell adhesion molecule (PECAM1)",
                "Protocadherin 1 (PCDH1)",
                "Selectin E (SELE)",
                "Selectin L (SELL)",
                "Selectin P (SELP)",
                "Vascular cell adhesion molecule 1 (VCAM1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH)",
            "Integrin (ITG)",
            "Selectin (SELE)",
            "Immunoglobulin superfamily cell adhesion molecule (IgSF CAM)",
            "Hyaluronic acid receptor (CD44)",
            "Neural cell adhesion molecule (NCAM)",
            "Vascular cell adhesion protein 1 (VCAM-1)",
            "Intercellular adhesion molecule (ICAM)",
            "Platelet endothelial cell adhesion molecule (PECAM-1)",
            "Mucosal addressin cell adhesion molecule (MAdCAM-1)",
            "Junctional adhesion molecule (JAM)",
            "Epithelial cell adhesion molecule (EpCAM)",
            "L1 cell adhesion molecule (L1CAM)",
            "Vascular adhesion protein 1 (VAP-1)",
            "Melanoma cell adhesion molecule (MCAM)",
            "Activated leukocyte cell adhesion molecule (ALCAM)",
            "Brain angiogenesis inhibitor 1 (BAI1)",
            "Neuropilin (NRP)",
            "Semaphorin (SEMA)",
            "Ephrin (EFN)",
            "Nectin (NECTIN)",
            "Neurexin (NRXN)",
            "Neuroligin (NLGN)",
            "Layilin (LAYN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH)",
                "Integrin (ITG)",
                "Selectin (SELE)",
                "Immunoglobulin superfamily cell adhesion molecule (IgSF CAM)",
                "Hyaluronic acid receptor (CD44)",
                "Neural cell adhesion molecule (NCAM)",
                "Vascular cell adhesion protein 1 (VCAM-1)",
                "Intercellular adhesion molecule (ICAM)",
                "Platelet endothelial cell adhesion molecule (PECAM-1)",
                "Mucosal addressin cell adhesion molecule (MAdCAM-1)",
                "Junctional adhesion molecule (JAM)",
                "Epithelial cell adhesion molecule (EpCAM)",
                "L1 cell adhesion molecule (L1CAM)",
                "Vascular adhesion protein 1 (VAP-1)",
                "Melanoma cell adhesion molecule (MCAM)",
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "Brain angiogenesis inhibitor 1 (BAI1)",
                "Neuropilin (NRP)",
                "Semaphorin (SEMA)",
                "Ephrin (EFN)",
                "Nectin (NECTIN)",
                "Neurexin (NRXN)",
                "Neuroligin (NLGN)",
                "Layilin (LAYN)"
            ],
            "mismatches": [],
            "true_referents": [
                "Activated leukocyte cell adhesion molecule (ALCAM)",
                "Brain angiogenesis inhibitor 1 (BAI1)",
                "Cadherin (CDH)",
                "Ephrin (EFN)",
                "Epithelial cell adhesion molecule (EpCAM)",
                "Hyaluronic acid receptor (CD44)",
                "Immunoglobulin superfamily cell adhesion molecule (IgSF CAM)",
                "Integrin (ITG)",
                "Intercellular adhesion molecule (ICAM)",
                "Junctional adhesion molecule (JAM)",
                "L1 cell adhesion molecule (L1CAM)",
                "Layilin (LAYN)",
                "Melanoma cell adhesion molecule (MCAM)",
                "Mucosal addressin cell adhesion molecule (MAdCAM-1)",
                "Nectin (NECTIN)",
                "Neural cell adhesion molecule (NCAM)",
                "Neurexin (NRXN)",
                "Neuroligin (NLGN)",
                "Neuropilin (NRP)",
                "Platelet endothelial cell adhesion molecule (PECAM-1)",
                "Selectin (SELE)",
                "Semaphorin (SEMA)",
                "Vascular adhesion protein 1 (VAP-1)",
                "Vascular cell adhesion protein 1 (VCAM-1)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CAD)",
            "Selectin (SEL)",
            "Integrin (INT)",
            "Neural Cell Adhesion Molecule (NCAM)",
            "Vascular Cell Adhesion Molecule (VCAM)",
            "Intercellular Adhesion Molecule (ICAM)",
            "E-Cadherin (E-CAD)",
            "P-Selectin (P-SEL)",
            "L-Selectin (L-SEL)",
            "Fibronectin (FN)",
            "Laminin (LAM)",
            "Collagen (COL)",
            "Vitronectin (VTN)",
            "Osteopontin (OPN)",
            "Thrombospondin (TSP)",
            "Tenascin (TEN)",
            "Galectin (GAL)",
            "Siglec (SIG)",
            "CD44 (CD44)",
            "Neural Cell Adhesion Molecule 1 (NCAM1)",
            "Vascular Cell Adhesion Molecule 1 (VCAM1)",
            "Intercellular Adhesion Molecule 1 (ICAM1)",
            "E-Cadherin (CDH1)",
            "P-Selectin (SELP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CAD)",
                "Selectin (SEL)",
                "Integrin (INT)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Vascular Cell Adhesion Molecule (VCAM)",
                "Intercellular Adhesion Molecule (ICAM)",
                "E-Cadherin (E-CAD)",
                "P-Selectin (P-SEL)",
                "L-Selectin (L-SEL)",
                "Fibronectin (FN)",
                "Laminin (LAM)",
                "Collagen (COL)",
                "Vitronectin (VTN)",
                "Osteopontin (OPN)",
                "Thrombospondin (TSP)",
                "Tenascin (TEN)",
                "Galectin (GAL)",
                "Siglec (SIG)",
                "CD44 (CD44)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Vascular Cell Adhesion Molecule 1 (VCAM1)",
                "Intercellular Adhesion Molecule 1 (ICAM1)",
                "E-Cadherin (CDH1)",
                "P-Selectin (SELP)"
            ],
            "mismatches": [],
            "true_referents": [
                "CD44 (CD44)",
                "Cadherin (CAD)",
                "Collagen (COL)",
                "E-Cadherin (CDH1)",
                "E-Cadherin (E-CAD)",
                "Fibronectin (FN)",
                "Galectin (GAL)",
                "Integrin (INT)",
                "Intercellular Adhesion Molecule (ICAM)",
                "Intercellular Adhesion Molecule 1 (ICAM1)",
                "L-Selectin (L-SEL)",
                "Laminin (LAM)",
                "Neural Cell Adhesion Molecule (NCAM)",
                "Neural Cell Adhesion Molecule 1 (NCAM1)",
                "Osteopontin (OPN)",
                "P-Selectin (P-SEL)",
                "P-Selectin (SELP)",
                "Selectin (SEL)",
                "Siglec (SIG)",
                "Tenascin (TEN)",
                "Thrombospondin (TSP)",
                "Vascular Cell Adhesion Molecule (VCAM)",
                "Vascular Cell Adhesion Molecule 1 (VCAM1)",
                "Vitronectin (VTN)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Cadherin (CDH1)",
            "Integrin (ITGA2)",
            "Selectin (SELE)",
            "Mucin (MUC1)",
            "N-CAM (NCAM1)",
            "L-selectin (SELL)",
            "E-cadherin (CDH1)",
            "P-selectin (SELE)",
            "L1-CAM (L1CAM)",
            "ICAM-1 (CD54)",
            "VCAM-1 (CD106)",
            "P-cadherin (CDH3)",
            "NCAM (NCAM1)",
            "CD44 (CD44)",
            "CD31 (PECAM1)",
            "CD62L (SELL)",
            "CD102 (ICAM2)",
            "CD106 (VCAM1)",
            "CD54 (ICAM1)",
            "CDH2 (N-Cadherin)",
            "CDH5 (VE-cadherin)",
            "CDH7 (Cadherin-7)",
            "CDH10 (Cadherin-10)",
            "CDH11 (Cadherin-11)",
            "CDH13 (Cadherin-13)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cadherin (CDH1)",
                "Integrin (ITGA2)",
                "Selectin (SELE)",
                "Mucin (MUC1)",
                "N-CAM (NCAM1)",
                "L-selectin (SELL)",
                "E-cadherin (CDH1)",
                "P-selectin (SELE)",
                "L1-CAM (L1CAM)",
                "ICAM-1 (CD54)",
                "VCAM-1 (CD106)",
                "P-cadherin (CDH3)",
                "NCAM (NCAM1)",
                "CD44 (CD44)",
                "CD31 (PECAM1)",
                "CD62L (SELL)",
                "CD102 (ICAM2)",
                "CD106 (VCAM1)",
                "CD54 (ICAM1)",
                "CDH2 (N-Cadherin)",
                "CDH5 (VE-cadherin)",
                "CDH7 (Cadherin-7)",
                "CDH10 (Cadherin-10)",
                "CDH11 (Cadherin-11)"
            ],
            "mismatches": [
                "CDH13 (Cadherin-13)"
            ],
            "true_referents": [
                "CD102 (ICAM2)",
                "CD106 (VCAM1)",
                "CD31 (PECAM1)",
                "CD44 (CD44)",
                "CD54 (ICAM1)",
                "CD62L (SELL)",
                "CDH10 (Cadherin-10)",
                "CDH11 (Cadherin-11)",
                "CDH2 (N-Cadherin)",
                "CDH5 (VE-cadherin)",
                "CDH7 (Cadherin-7)",
                "Cadherin (CDH1)",
                "E-cadherin (CDH1)",
                "ICAM-1 (CD54)",
                "Integrin (ITGA2)",
                "L-selectin (SELL)",
                "L1-CAM (L1CAM)",
                "Mucin (MUC1)",
                "N-CAM (NCAM1)",
                "NCAM (NCAM1)",
                "P-cadherin (CDH3)",
                "P-selectin (SELE)",
                "Selectin (SELE)",
                "VCAM-1 (CD106)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": [
            "Ep-CAM (Epithelial Cell Adhesion Molecule)",
            "ICAM-1 (Inter-Cellular Adhesion Molecule 1)",
            "ICAM-2 (Inter-Cellular Adhesion Molecule 2)",
            "ICAM-3 (Inter-Cellular Adhesion Molecule 3)",
            "ICAM-4 (Inter-Cellular Adhesion Molecule 4)",
            "ICAM-5 (Inter-Cellular Adhesion Molecule 5)",
            "VCAM-1 (Vascular Cell Adhesion Molecule 1)",
            "NCAM (Neural Cell Adhesion Molecule)",
            "L1CAM (L1 Cell Adhesion Molecule)",
            "Neuroplastin (NRP)",
            "Basigin (BSG)",
            "CD44 (Cluster of Differentiation 44)",
            "CDH1 (E-Cadherin)",
            "CDH2 (N-Cadherin)",
            "CDH3 (P-Cadherin)",
            "CDH4 (R-Cadherin)",
            "CDH5 (VE-Cadherin)",
            "Desmoglein (DSG)",
            "Desmocollin (DSC)",
            "OCAD1 (Ovarian Cancer Associated Antigen 1)",
            "E-Cadherin (CDH1)",
            "OB-Cadherin (CDH11)",
            "VE-Cadherin (CDH5)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ep-CAM (Epithelial Cell Adhesion Molecule)",
                "ICAM-1 (Inter-Cellular Adhesion Molecule 1)",
                "ICAM-2 (Inter-Cellular Adhesion Molecule 2)",
                "ICAM-3 (Inter-Cellular Adhesion Molecule 3)",
                "ICAM-4 (Inter-Cellular Adhesion Molecule 4)",
                "ICAM-5 (Inter-Cellular Adhesion Molecule 5)",
                "VCAM-1 (Vascular Cell Adhesion Molecule 1)",
                "NCAM (Neural Cell Adhesion Molecule)",
                "L1CAM (L1 Cell Adhesion Molecule)",
                "Neuroplastin (NRP)",
                "Basigin (BSG)",
                "CD44 (Cluster of Differentiation 44)",
                "CDH1 (E-Cadherin)",
                "CDH2 (N-Cadherin)",
                "CDH3 (P-Cadherin)",
                "CDH4 (R-Cadherin)",
                "CDH5 (VE-Cadherin)",
                "Desmoglein (DSG)",
                "Desmocollin (DSC)",
                "OCAD1 (Ovarian Cancer Associated Antigen 1)",
                "E-Cadherin (CDH1)",
                "OB-Cadherin (CDH11)",
                "VE-Cadherin (CDH5)"
            ],
            "mismatches": [],
            "true_referents": [
                "Basigin (BSG)",
                "CD44 (Cluster of Differentiation 44)",
                "CDH1 (E-Cadherin)",
                "CDH2 (N-Cadherin)",
                "CDH3 (P-Cadherin)",
                "CDH4 (R-Cadherin)",
                "CDH5 (VE-Cadherin)",
                "Desmocollin (DSC)",
                "Desmoglein (DSG)",
                "E-Cadherin (CDH1)",
                "Ep-CAM (Epithelial Cell Adhesion Molecule)",
                "ICAM-1 (Inter-Cellular Adhesion Molecule 1)",
                "ICAM-2 (Inter-Cellular Adhesion Molecule 2)",
                "ICAM-3 (Inter-Cellular Adhesion Molecule 3)",
                "ICAM-4 (Inter-Cellular Adhesion Molecule 4)",
                "ICAM-5 (Inter-Cellular Adhesion Molecule 5)",
                "L1CAM (L1 Cell Adhesion Molecule)",
                "NCAM (Neural Cell Adhesion Molecule)",
                "Neuroplastin (NRP)",
                "OB-Cadherin (CDH11)",
                "OCAD1 (Ovarian Cancer Associated Antigen 1)",
                "VCAM-1 (Vascular Cell Adhesion Molecule 1)",
                "VE-Cadherin (CDH5)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "cell adhesion molecule",
        "domain": "biology",
        "response": "[\n        \"it is a cell surface ligand\",\n        \"it is usually a glycoprotein\",\n        \"it mediates cell-to-cell adhesion\"\n    ]\n},\n{\n    \"referent\": \"integrins\",\n    \"definition\": [\n        \"it is a cell surface ligand\",\n        \"it is usually a glycoprotein\",\n        \"it mediates cell-to-cell adhesion\"\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]