[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "heparin (H)",
            "warfarin (W)",
            "dabigatran etexilate (DE)",
            "rivaroxaban (RX)",
            "apixaban (APX)",
            "edoxaban (EX)",
            "tinzaparin (TZP)",
            "dalteparin (DP)",
            "enoxaparin (ENX)",
            "fondaparinux (FP)",
            "betrixaban (BX)",
            "idarucizumab (IDR)",
            "andexanet alfa (AXA)",
            "argatroban (ARG)",
            "lepirudin (LPR)",
            "bivalirudin (BVL)",
            "danaparoid (DNP)",
            "recombinant hirudin (RH)",
            "levosimendan (LSM)",
            "cilostazol (CZ)",
            "ticlopidine (TIC)",
            "clopidogrel (CPG)",
            "prasugrel (PGR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "heparin (H)",
                "warfarin (W)",
                "dabigatran etexilate (DE)",
                "rivaroxaban (RX)",
                "apixaban (APX)",
                "edoxaban (EX)",
                "tinzaparin (TZP)",
                "dalteparin (DP)",
                "enoxaparin (ENX)",
                "fondaparinux (FP)",
                "betrixaban (BX)",
                "idarucizumab (IDR)",
                "andexanet alfa (AXA)",
                "argatroban (ARG)",
                "lepirudin (LPR)",
                "bivalirudin (BVL)",
                "danaparoid (DNP)",
                "recombinant hirudin (RH)",
                "levosimendan (LSM)",
                "cilostazol (CZ)",
                "ticlopidine (TIC)",
                "clopidogrel (CPG)",
                "prasugrel (PGR)"
            ],
            "mismatches": [],
            "true_referents": [
                "andexanet alfa (AXA)",
                "apixaban (APX)",
                "argatroban (ARG)",
                "betrixaban (BX)",
                "bivalirudin (BVL)",
                "cilostazol (CZ)",
                "clopidogrel (CPG)",
                "dabigatran etexilate (DE)",
                "dalteparin (DP)",
                "danaparoid (DNP)",
                "edoxaban (EX)",
                "enoxaparin (ENX)",
                "fondaparinux (FP)",
                "heparin (H)",
                "idarucizumab (IDR)",
                "lepirudin (LPR)",
                "levosimendan (LSM)",
                "prasugrel (PGR)",
                "recombinant hirudin (RH)",
                "rivaroxaban (RX)",
                "ticlopidine (TIC)",
                "tinzaparin (TZP)",
                "warfarin (W)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (Hep)",
            "Warfarin (Coumadin)",
            "Dabigatran (Pradaxa)",
            "Rivaroxaban (Xarelto)",
            "Apixaban (Eliquis)",
            "Edoxaban (Savaysa)",
            "Aspirin (Acetylsalicylic acid)",
            "Clopidogrel (Plavix)",
            "Ticagrelor (Brilinta)",
            "Prasugrel (Effient)",
            "Dipyridamole (Persantine)",
            "Anistreplase (Eminase)",
            "Pentosan polysulfate (Floseal)",
            "Hirudin (Lepirudin)",
            "Bivalirudin (Angiomax)",
            "Argatroban (Argatra)",
            "Desirudin (Iprivask)",
            "Tirofiban (Aggrastat)",
            "Eptifibatide (Integrilin)",
            "Abciximab (ReoPro)",
            "Fondaparinux (Arixtra)",
            "Nadroparin (Fraxiparine)",
            "Enoxaparin (Lovenox)",
            "Dalteparin (Fragmin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (Hep)",
                "Warfarin (Coumadin)",
                "Dabigatran (Pradaxa)",
                "Rivaroxaban (Xarelto)",
                "Apixaban (Eliquis)",
                "Edoxaban (Savaysa)",
                "Aspirin (Acetylsalicylic acid)",
                "Clopidogrel (Plavix)",
                "Ticagrelor (Brilinta)",
                "Prasugrel (Effient)",
                "Dipyridamole (Persantine)",
                "Anistreplase (Eminase)",
                "Pentosan polysulfate (Floseal)",
                "Hirudin (Lepirudin)",
                "Bivalirudin (Angiomax)",
                "Argatroban (Argatra)",
                "Desirudin (Iprivask)",
                "Tirofiban (Aggrastat)",
                "Eptifibatide (Integrilin)",
                "Abciximab (ReoPro)",
                "Fondaparinux (Arixtra)",
                "Nadroparin (Fraxiparine)",
                "Enoxaparin (Lovenox)",
                "Dalteparin (Fragmin)"
            ],
            "mismatches": [],
            "true_referents": [
                "Abciximab (ReoPro)",
                "Anistreplase (Eminase)",
                "Apixaban (Eliquis)",
                "Argatroban (Argatra)",
                "Aspirin (Acetylsalicylic acid)",
                "Bivalirudin (Angiomax)",
                "Clopidogrel (Plavix)",
                "Dabigatran (Pradaxa)",
                "Dalteparin (Fragmin)",
                "Desirudin (Iprivask)",
                "Dipyridamole (Persantine)",
                "Edoxaban (Savaysa)",
                "Enoxaparin (Lovenox)",
                "Eptifibatide (Integrilin)",
                "Fondaparinux (Arixtra)",
                "Heparin (Hep)",
                "Hirudin (Lepirudin)",
                "Nadroparin (Fraxiparine)",
                "Pentosan polysulfate (Floseal)",
                "Prasugrel (Effient)",
                "Rivaroxaban (Xarelto)",
                "Ticagrelor (Brilinta)",
                "Tirofiban (Aggrastat)",
                "Warfarin (Coumadin)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (HEP)",
            "Warfarin (WAR)",
            "Aspirin (ASA)",
            "Clopidogrel (CLO)",
            "Dabigatran (DAB)",
            "Edoxaban (EDO)",
            "Rivaroxaban (RIV)",
            "Apixaban (API)",
            "Enoxaparin (ENX)",
            "Dalteparin (DAL)",
            "Tinzaparin (TIN)",
            "Fondaparinux (FON)",
            "Lovenox (LOV)",
            "Fragmin (FRG)",
            "Innohep (INN)",
            "Pradaxa (PRA)",
            "Xarelto (XAR)",
            "Eliquis (ELI)",
            "Ticagrelor (TIC)",
            "Bivalirudin (BIV)",
            "Argatroban (ARG)",
            "Lepirudin (LEP)",
            "Desirudin (DES)",
            "Protamine sulfate (PRO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (HEP)",
                "Warfarin (WAR)",
                "Aspirin (ASA)",
                "Clopidogrel (CLO)",
                "Dabigatran (DAB)",
                "Edoxaban (EDO)",
                "Rivaroxaban (RIV)",
                "Apixaban (API)",
                "Enoxaparin (ENX)",
                "Dalteparin (DAL)",
                "Tinzaparin (TIN)",
                "Fondaparinux (FON)",
                "Lovenox (LOV)",
                "Fragmin (FRG)",
                "Innohep (INN)",
                "Pradaxa (PRA)",
                "Xarelto (XAR)",
                "Eliquis (ELI)",
                "Ticagrelor (TIC)",
                "Bivalirudin (BIV)",
                "Argatroban (ARG)",
                "Lepirudin (LEP)",
                "Desirudin (DES)",
                "Protamine sulfate (PRO)"
            ],
            "mismatches": [],
            "true_referents": [
                "Apixaban (API)",
                "Argatroban (ARG)",
                "Aspirin (ASA)",
                "Bivalirudin (BIV)",
                "Clopidogrel (CLO)",
                "Dabigatran (DAB)",
                "Dalteparin (DAL)",
                "Desirudin (DES)",
                "Edoxaban (EDO)",
                "Eliquis (ELI)",
                "Enoxaparin (ENX)",
                "Fondaparinux (FON)",
                "Fragmin (FRG)",
                "Heparin (HEP)",
                "Innohep (INN)",
                "Lepirudin (LEP)",
                "Lovenox (LOV)",
                "Pradaxa (PRA)",
                "Protamine sulfate (PRO)",
                "Rivaroxaban (RIV)",
                "Ticagrelor (TIC)",
                "Tinzaparin (TIN)",
                "Warfarin (WAR)",
                "Xarelto (XAR)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (Hep)",
            "Warfarin (War)",
            "Aspirin (ASA)",
            "Clopidogrel (Clo)",
            "Dabigatran (Dab)",
            "Rivaroxaban (Riv)",
            "Apixaban (Api)",
            "Edoxaban (Edox)",
            "Argatroban (Arg)",
            "Bivalirudin (Biv)",
            "Fondaparinux (Fon)",
            "Hirudin (Hir)",
            "Lepirudin (Lep)",
            "Desirudin (Des)",
            "Ancrod (Anc)",
            "Ximelagatran (Xim)",
            "Ticlopidine (Tic)",
            "Prasugrel (Pra)",
            "Vorapaxar (Vor)",
            "Citrate (Cit)",
            "Oxalate (Ox)",
            "Phosphate (Pho)",
            "Protein C (PC)",
            "Antithrombin (AT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (Hep)",
                "Warfarin (War)",
                "Aspirin (ASA)",
                "Clopidogrel (Clo)",
                "Dabigatran (Dab)",
                "Rivaroxaban (Riv)",
                "Apixaban (Api)",
                "Edoxaban (Edox)",
                "Argatroban (Arg)",
                "Bivalirudin (Biv)",
                "Fondaparinux (Fon)",
                "Hirudin (Hir)",
                "Lepirudin (Lep)",
                "Desirudin (Des)",
                "Ancrod (Anc)",
                "Ximelagatran (Xim)",
                "Ticlopidine (Tic)",
                "Prasugrel (Pra)",
                "Vorapaxar (Vor)",
                "Citrate (Cit)",
                "Oxalate (Ox)",
                "Phosphate (Pho)",
                "Protein C (PC)",
                "Antithrombin (AT)"
            ],
            "mismatches": [],
            "true_referents": [
                "Ancrod (Anc)",
                "Antithrombin (AT)",
                "Apixaban (Api)",
                "Argatroban (Arg)",
                "Aspirin (ASA)",
                "Bivalirudin (Biv)",
                "Citrate (Cit)",
                "Clopidogrel (Clo)",
                "Dabigatran (Dab)",
                "Desirudin (Des)",
                "Edoxaban (Edox)",
                "Fondaparinux (Fon)",
                "Heparin (Hep)",
                "Hirudin (Hir)",
                "Lepirudin (Lep)",
                "Oxalate (Ox)",
                "Phosphate (Pho)",
                "Prasugrel (Pra)",
                "Protein C (PC)",
                "Rivaroxaban (Riv)",
                "Ticlopidine (Tic)",
                "Vorapaxar (Vor)",
                "Warfarin (War)",
                "Ximelagatran (Xim)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin",
            "Warfarin",
            "Aspirin",
            "Dabigatran (Pradaxa)",
            "Rivaroxaban (Xarelto)",
            "Apixaban (Eliquis)",
            "Edoxaban (Savaysa)",
            "Fondaparinux (Arixtra)",
            "Bivalirudin (Angiomax)",
            "Argatroban",
            "Enoxaparin (Lovenox)",
            "Tinzaparin (Innohep)",
            "Danaparoid (Orgaran)",
            "Desirudin (Iprivask)",
            "Antithrombin III",
            "Acenocoumarol (Sintrom)",
            "Phenindione",
            "Nadroparin (Fraxiparine)",
            "Bemiparin (Zibor)",
            "Lepirudin (Refludan)",
            "Anisindione",
            "Phenprocoumon",
            "Coumarin",
            "Dicoumarol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin",
                "Warfarin",
                "Aspirin",
                "Dabigatran (Pradaxa)",
                "Rivaroxaban (Xarelto)",
                "Apixaban (Eliquis)",
                "Edoxaban (Savaysa)",
                "Fondaparinux (Arixtra)",
                "Bivalirudin (Angiomax)",
                "Argatroban",
                "Enoxaparin (Lovenox)",
                "Tinzaparin (Innohep)",
                "Danaparoid (Orgaran)",
                "Desirudin (Iprivask)",
                "Antithrombin III",
                "Acenocoumarol (Sintrom)",
                "Phenindione",
                "Nadroparin (Fraxiparine)",
                "Bemiparin (Zibor)",
                "Lepirudin (Refludan)",
                "Anisindione",
                "Phenprocoumon",
                "Coumarin",
                "Dicoumarol"
            ],
            "mismatches": [],
            "true_referents": [
                "Acenocoumarol (Sintrom)",
                "Anisindione",
                "Antithrombin III",
                "Apixaban (Eliquis)",
                "Argatroban",
                "Aspirin",
                "Bemiparin (Zibor)",
                "Bivalirudin (Angiomax)",
                "Coumarin",
                "Dabigatran (Pradaxa)",
                "Danaparoid (Orgaran)",
                "Desirudin (Iprivask)",
                "Dicoumarol",
                "Edoxaban (Savaysa)",
                "Enoxaparin (Lovenox)",
                "Fondaparinux (Arixtra)",
                "Heparin",
                "Lepirudin (Refludan)",
                "Nadroparin (Fraxiparine)",
                "Phenindione",
                "Phenprocoumon",
                "Rivaroxaban (Xarelto)",
                "Tinzaparin (Innohep)",
                "Warfarin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (HPR)",
            "Warfarin (WAR)",
            "Aspirin (ASP)",
            "Dabigatran (DAB)",
            "Rivaroxaban (RIV)",
            "Apixaban (API)",
            "Clopidogrel (CLO)",
            "Fondaparinux (FON)",
            "Bivalirudin (BIV)",
            "Argatroban (ARG)",
            "Enoxaparin (ENO)",
            "Tinzaparin (TIN)",
            "Danaparoid (DAN)",
            "Selatogrel (SEL)",
            "Cangrelor (CAN)",
            "Edoxaban (EDO)",
            "Lepirudin (LEP)",
            "Recombinant tissue factor pathway inhibitor (TFPI)",
            "Aprotinin (APR)",
            "Thrombin inhibitors (THR)",
            "Ximelagatran (XIM)",
            "Sarpogrelate (SAR)",
            "Bivalirudin (BIV)",
            "Argatroban (ARG)",
            "Nadroparin (NAD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (HPR)",
                "Warfarin (WAR)",
                "Aspirin (ASP)",
                "Dabigatran (DAB)",
                "Rivaroxaban (RIV)",
                "Apixaban (API)",
                "Clopidogrel (CLO)",
                "Fondaparinux (FON)",
                "Bivalirudin (BIV)",
                "Argatroban (ARG)",
                "Enoxaparin (ENO)",
                "Tinzaparin (TIN)",
                "Danaparoid (DAN)",
                "Selatogrel (SEL)",
                "Cangrelor (CAN)",
                "Edoxaban (EDO)",
                "Lepirudin (LEP)",
                "Recombinant tissue factor pathway inhibitor (TFPI)",
                "Aprotinin (APR)",
                "Thrombin inhibitors (THR)",
                "Ximelagatran (XIM)",
                "Sarpogrelate (SAR)"
            ],
            "mismatches": [
                "Nadroparin (NAD)"
            ],
            "true_referents": [
                "Apixaban (API)",
                "Aprotinin (APR)",
                "Argatroban (ARG)",
                "Aspirin (ASP)",
                "Bivalirudin (BIV)",
                "Cangrelor (CAN)",
                "Clopidogrel (CLO)",
                "Dabigatran (DAB)",
                "Danaparoid (DAN)",
                "Edoxaban (EDO)",
                "Enoxaparin (ENO)",
                "Fondaparinux (FON)",
                "Heparin (HPR)",
                "Lepirudin (LEP)",
                "Recombinant tissue factor pathway inhibitor (TFPI)",
                "Rivaroxaban (RIV)",
                "Sarpogrelate (SAR)",
                "Selatogrel (SEL)",
                "Thrombin inhibitors (THR)",
                "Tinzaparin (TIN)",
                "Warfarin (WAR)",
                "Ximelagatran (XIM)"
            ],
            "TP": 22,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (HP)",
            "Warfarin (WF)",
            "Aspirin (ASP)",
            "Clopidogrel (CP)",
            "Dabigatran (DB)",
            "Rivaroxaban (RV)",
            "Apixaban (AP)",
            "Edoxaban (ED)",
            "Ticagrelor (TG)",
            "Prasugrel (PR)",
            "Dipyridamole (DP)",
            "Cilostazol (CZ)",
            "Enoxaparin (EN)",
            "Dalteparin (DL)",
            "Tinzaparin (TZ)",
            "Fondaparinux (FD)",
            "Argatroban (AG)",
            "Bivalirudin (BV)",
            "Lepirudin (LP)",
            "Desirudin (DS)",
            "Glycoprotein IIb/IIIa inhibitors (GPI)",
            "Vitamin K antagonists (VKA)",
            "Direct oral anticoagulants (DOAC)",
            "Indirect thrombin inhibitors (ITI)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (HP)",
                "Warfarin (WF)",
                "Aspirin (ASP)",
                "Clopidogrel (CP)",
                "Dabigatran (DB)",
                "Rivaroxaban (RV)",
                "Apixaban (AP)",
                "Edoxaban (ED)",
                "Ticagrelor (TG)",
                "Prasugrel (PR)",
                "Dipyridamole (DP)",
                "Cilostazol (CZ)",
                "Enoxaparin (EN)",
                "Dalteparin (DL)",
                "Tinzaparin (TZ)",
                "Fondaparinux (FD)",
                "Argatroban (AG)",
                "Bivalirudin (BV)",
                "Lepirudin (LP)",
                "Desirudin (DS)",
                "Glycoprotein IIb/IIIa inhibitors (GPI)",
                "Vitamin K antagonists (VKA)",
                "Direct oral anticoagulants (DOAC)",
                "Indirect thrombin inhibitors (ITI)"
            ],
            "mismatches": [],
            "true_referents": [
                "Apixaban (AP)",
                "Argatroban (AG)",
                "Aspirin (ASP)",
                "Bivalirudin (BV)",
                "Cilostazol (CZ)",
                "Clopidogrel (CP)",
                "Dabigatran (DB)",
                "Dalteparin (DL)",
                "Desirudin (DS)",
                "Dipyridamole (DP)",
                "Direct oral anticoagulants (DOAC)",
                "Edoxaban (ED)",
                "Enoxaparin (EN)",
                "Fondaparinux (FD)",
                "Glycoprotein IIb/IIIa inhibitors (GPI)",
                "Heparin (HP)",
                "Indirect thrombin inhibitors (ITI)",
                "Lepirudin (LP)",
                "Prasugrel (PR)",
                "Rivaroxaban (RV)",
                "Ticagrelor (TG)",
                "Tinzaparin (TZ)",
                "Vitamin K antagonists (VKA)",
                "Warfarin (WF)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin",
            "Warfarin",
            "Aspirin",
            "Clopidogrel",
            "Rivaroxaban",
            "Dabigatran",
            "Apixaban",
            "Edoxaban",
            "Fondaparinux",
            "Enoxaparin",
            "Dalteparin",
            "Ticagrelor",
            "Cilostazol",
            "Abciximab",
            "Eptifibatide",
            "Tirofiban",
            "Dipyridamole",
            "Streptokinase",
            "Alteplase",
            "Tenecteplase",
            "Urokinase",
            "Anistreplase",
            "Bivalirudin",
            "Argatroban"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin",
                "Warfarin",
                "Aspirin",
                "Clopidogrel",
                "Rivaroxaban",
                "Dabigatran",
                "Apixaban",
                "Edoxaban",
                "Fondaparinux",
                "Enoxaparin",
                "Dalteparin",
                "Ticagrelor",
                "Cilostazol",
                "Abciximab",
                "Eptifibatide",
                "Tirofiban",
                "Dipyridamole",
                "Streptokinase",
                "Alteplase",
                "Tenecteplase",
                "Urokinase",
                "Anistreplase",
                "Bivalirudin",
                "Argatroban"
            ],
            "mismatches": [],
            "true_referents": [
                "Abciximab",
                "Alteplase",
                "Anistreplase",
                "Apixaban",
                "Argatroban",
                "Aspirin",
                "Bivalirudin",
                "Cilostazol",
                "Clopidogrel",
                "Dabigatran",
                "Dalteparin",
                "Dipyridamole",
                "Edoxaban",
                "Enoxaparin",
                "Eptifibatide",
                "Fondaparinux",
                "Heparin",
                "Rivaroxaban",
                "Streptokinase",
                "Tenecteplase",
                "Ticagrelor",
                "Tirofiban",
                "Urokinase",
                "Warfarin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Aspirin (ASA)",
            "Warfarin (Coumadin)",
            "Heparin",
            "Enoxaparin (Lovenox)",
            "Dabigatran (Pradaxa)",
            "Rivaroxaban (Xarelto)",
            "Apixaban (Eliquis)",
            "Edoxaban (Savaysa)",
            "Fondaparinux (Arixtra)",
            "Ticlopidine",
            "Clopidogrel (Plavix)",
            "Prasugrel (Effient)",
            "Ticagrelor (Brilinta)",
            "Bivalirudin (Angiomax)",
            "Argatroban",
            "Desmopressin (DDAVP)",
            "Dipyridamole",
            "Abciximab (ReoPro)",
            "Eptifibatide (Integrilin)",
            "Tirofiban (Aggrastat)",
            "Vitamin K antagonist",
            "Low-molecular-weight heparin (LMWH)",
            "Danaparoid",
            "Anagrelide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspirin (ASA)",
                "Warfarin (Coumadin)",
                "Heparin",
                "Enoxaparin (Lovenox)",
                "Dabigatran (Pradaxa)",
                "Rivaroxaban (Xarelto)",
                "Apixaban (Eliquis)",
                "Edoxaban (Savaysa)",
                "Fondaparinux (Arixtra)",
                "Ticlopidine",
                "Clopidogrel (Plavix)",
                "Prasugrel (Effient)",
                "Ticagrelor (Brilinta)",
                "Bivalirudin (Angiomax)",
                "Argatroban",
                "Desmopressin (DDAVP)",
                "Dipyridamole",
                "Abciximab (ReoPro)",
                "Eptifibatide (Integrilin)",
                "Tirofiban (Aggrastat)",
                "Vitamin K antagonist",
                "Low-molecular-weight heparin (LMWH)",
                "Danaparoid",
                "Anagrelide"
            ],
            "mismatches": [],
            "true_referents": [
                "Abciximab (ReoPro)",
                "Anagrelide",
                "Apixaban (Eliquis)",
                "Argatroban",
                "Aspirin (ASA)",
                "Bivalirudin (Angiomax)",
                "Clopidogrel (Plavix)",
                "Dabigatran (Pradaxa)",
                "Danaparoid",
                "Desmopressin (DDAVP)",
                "Dipyridamole",
                "Edoxaban (Savaysa)",
                "Enoxaparin (Lovenox)",
                "Eptifibatide (Integrilin)",
                "Fondaparinux (Arixtra)",
                "Heparin",
                "Low-molecular-weight heparin (LMWH)",
                "Prasugrel (Effient)",
                "Rivaroxaban (Xarelto)",
                "Ticagrelor (Brilinta)",
                "Ticlopidine",
                "Tirofiban (Aggrastat)",
                "Vitamin K antagonist",
                "Warfarin (Coumadin)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (UFH)",
            "Low-molecular-weight heparin (LMWH)",
            "Warfarin (Coumadin)",
            "Rivaroxaban (Xarelto)",
            "Apixaban (Eliquis)",
            "Dabigatran (Pradaxa)",
            "Edoxaban (Savaysa)",
            "Fondaparinux (Arixtra)",
            "Argatroban",
            "Bivalirudin (Angiomax)",
            "Dalteparin (Fragmin)",
            "Enoxaparin (Lovenox)",
            "Tinzaparin (Innohep)",
            "Hirudin",
            "Lepirudin (Refludan)",
            "Desirudin (Iprivask)",
            "Acenocoumarol (Sintrom)",
            "Phenprocoumon (Marcoumar)",
            "Aspirin (Acetylsalicylic acid)",
            "Clopidogrel (Plavix)",
            "Ticagrelor (Brilinta)",
            "Prasugrel (Effient)",
            "Dipyridamole (Persantine)",
            "Ticlopidine (Ticlid)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (UFH)",
                "Low-molecular-weight heparin (LMWH)",
                "Warfarin (Coumadin)",
                "Rivaroxaban (Xarelto)",
                "Apixaban (Eliquis)",
                "Dabigatran (Pradaxa)",
                "Edoxaban (Savaysa)",
                "Fondaparinux (Arixtra)",
                "Argatroban",
                "Bivalirudin (Angiomax)",
                "Dalteparin (Fragmin)",
                "Enoxaparin (Lovenox)",
                "Tinzaparin (Innohep)",
                "Hirudin",
                "Lepirudin (Refludan)",
                "Desirudin (Iprivask)",
                "Acenocoumarol (Sintrom)",
                "Phenprocoumon (Marcoumar)",
                "Aspirin (Acetylsalicylic acid)",
                "Clopidogrel (Plavix)",
                "Ticagrelor (Brilinta)",
                "Prasugrel (Effient)",
                "Dipyridamole (Persantine)",
                "Ticlopidine (Ticlid)"
            ],
            "mismatches": [],
            "true_referents": [
                "Acenocoumarol (Sintrom)",
                "Apixaban (Eliquis)",
                "Argatroban",
                "Aspirin (Acetylsalicylic acid)",
                "Bivalirudin (Angiomax)",
                "Clopidogrel (Plavix)",
                "Dabigatran (Pradaxa)",
                "Dalteparin (Fragmin)",
                "Desirudin (Iprivask)",
                "Dipyridamole (Persantine)",
                "Edoxaban (Savaysa)",
                "Enoxaparin (Lovenox)",
                "Fondaparinux (Arixtra)",
                "Heparin (UFH)",
                "Hirudin",
                "Lepirudin (Refludan)",
                "Low-molecular-weight heparin (LMWH)",
                "Phenprocoumon (Marcoumar)",
                "Prasugrel (Effient)",
                "Rivaroxaban (Xarelto)",
                "Ticagrelor (Brilinta)",
                "Ticlopidine (Ticlid)",
                "Tinzaparin (Innohep)",
                "Warfarin (Coumadin)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin",
            "Warfarin",
            "Dabigatran (Pradaxa)",
            "Rivaroxaban (Xarelto)",
            "Apixaban (Eliquis)",
            "Edoxaban (Savaysa)",
            "Fondaparinux (Arixtra)",
            "Bivalirudin (Angiomax)",
            "Argatroban",
            "Danaparoid (Orgaran)",
            "Lepirudin (Refludan)",
            "Enoxaparin (Lovenox)",
            "Dalteparin (Fragmin)",
            "Tinzaparin (Innohep)",
            "Nadroparin (Fraxiparine)",
            "Hirudin",
            "Aspirin",
            "Clopidogrel (Plavix)",
            "Ticagrelor (Brilinta)",
            "Prasugrel (Effient)",
            "Dipyridamole (Persantine)",
            "Ticlopidine (Ticlid)",
            "Cilostazol (Pletal)",
            "Vorapaxar (Zontivity)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin",
                "Warfarin",
                "Dabigatran (Pradaxa)",
                "Rivaroxaban (Xarelto)",
                "Apixaban (Eliquis)",
                "Edoxaban (Savaysa)",
                "Fondaparinux (Arixtra)",
                "Bivalirudin (Angiomax)",
                "Argatroban",
                "Danaparoid (Orgaran)",
                "Lepirudin (Refludan)",
                "Enoxaparin (Lovenox)",
                "Dalteparin (Fragmin)",
                "Tinzaparin (Innohep)",
                "Nadroparin (Fraxiparine)",
                "Hirudin",
                "Aspirin",
                "Clopidogrel (Plavix)",
                "Ticagrelor (Brilinta)",
                "Prasugrel (Effient)",
                "Dipyridamole (Persantine)",
                "Ticlopidine (Ticlid)",
                "Cilostazol (Pletal)",
                "Vorapaxar (Zontivity)"
            ],
            "mismatches": [],
            "true_referents": [
                "Apixaban (Eliquis)",
                "Argatroban",
                "Aspirin",
                "Bivalirudin (Angiomax)",
                "Cilostazol (Pletal)",
                "Clopidogrel (Plavix)",
                "Dabigatran (Pradaxa)",
                "Dalteparin (Fragmin)",
                "Danaparoid (Orgaran)",
                "Dipyridamole (Persantine)",
                "Edoxaban (Savaysa)",
                "Enoxaparin (Lovenox)",
                "Fondaparinux (Arixtra)",
                "Heparin",
                "Hirudin",
                "Lepirudin (Refludan)",
                "Nadroparin (Fraxiparine)",
                "Prasugrel (Effient)",
                "Rivaroxaban (Xarelto)",
                "Ticagrelor (Brilinta)",
                "Ticlopidine (Ticlid)",
                "Tinzaparin (Innohep)",
                "Vorapaxar (Zontivity)",
                "Warfarin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Heparin (Hep)",
            "Warfarin",
            "Apixaban (Apix)",
            "Rivaroxaban (Riv)",
            "Dabigatran (Dab)",
            "Edoxaban (Edox)",
            "Clopidogrel (Clop)",
            "Prasugrel (Pras)",
            "Ticagrelor (Tica)",
            "Dipyridamole (Dipy)",
            "Cilostazol",
            "Abciximab (Abcix)",
            "Eptifibatide (Eptif)",
            "Tirofiban (Tirof)",
            "Dextran",
            "Lepirudin (Lepir)",
            "Bivalirudin (Bival)",
            "Argatroban (Argat)",
            "Fondaparinux (Fond)",
            "Vitamin K Antagonists (VKA)",
            "Direct Thrombin Inhibitors (DTI)",
            "Direct Factor Xa Inhibitors (DFXaI)",
            "Glycoprotein IIb/IIIa Inhibitors (GPIIb/IIIaI)",
            "Adenosine Diphosphate (ADP) Receptor Inhibitors"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Heparin (Hep)",
                "Warfarin",
                "Apixaban (Apix)",
                "Rivaroxaban (Riv)",
                "Dabigatran (Dab)",
                "Edoxaban (Edox)",
                "Clopidogrel (Clop)",
                "Prasugrel (Pras)",
                "Ticagrelor (Tica)",
                "Dipyridamole (Dipy)",
                "Cilostazol",
                "Abciximab (Abcix)",
                "Eptifibatide (Eptif)",
                "Tirofiban (Tirof)",
                "Dextran",
                "Lepirudin (Lepir)",
                "Bivalirudin (Bival)",
                "Argatroban (Argat)",
                "Fondaparinux (Fond)",
                "Vitamin K Antagonists (VKA)",
                "Direct Thrombin Inhibitors (DTI)",
                "Direct Factor Xa Inhibitors (DFXaI)",
                "Glycoprotein IIb/IIIa Inhibitors (GPIIb/IIIaI)",
                "Adenosine Diphosphate (ADP) Receptor Inhibitors"
            ],
            "mismatches": [],
            "true_referents": [
                "Abciximab (Abcix)",
                "Adenosine Diphosphate (ADP) Receptor Inhibitors",
                "Apixaban (Apix)",
                "Argatroban (Argat)",
                "Bivalirudin (Bival)",
                "Cilostazol",
                "Clopidogrel (Clop)",
                "Dabigatran (Dab)",
                "Dextran",
                "Dipyridamole (Dipy)",
                "Direct Factor Xa Inhibitors (DFXaI)",
                "Direct Thrombin Inhibitors (DTI)",
                "Edoxaban (Edox)",
                "Eptifibatide (Eptif)",
                "Fondaparinux (Fond)",
                "Glycoprotein IIb/IIIa Inhibitors (GPIIb/IIIaI)",
                "Heparin (Hep)",
                "Lepirudin (Lepir)",
                "Prasugrel (Pras)",
                "Rivaroxaban (Riv)",
                "Ticagrelor (Tica)",
                "Tirofiban (Tirof)",
                "Vitamin K Antagonists (VKA)",
                "Warfarin"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Aspirin (ASA)",
            "Heparin",
            "Warfarin",
            "Enoxaparin",
            "Clopidogrel",
            "Ticagrelor",
            "Rivaroxaban",
            "Apixaban",
            "Edoxaban",
            "Fondaparinux",
            "Dipyridamole",
            "Cilostazol",
            "Eptifibatide",
            "Tirofiban",
            "Abciximab",
            "Argatroban",
            "Bivalirudin",
            "Dalteparin",
            "Nadroparin",
            "Tinzaparin",
            "Danaparoid",
            "Lepirudin",
            "Desirudin",
            "Ximelagatran"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspirin (ASA)",
                "Heparin",
                "Warfarin",
                "Enoxaparin",
                "Clopidogrel",
                "Ticagrelor",
                "Rivaroxaban",
                "Apixaban",
                "Edoxaban",
                "Fondaparinux",
                "Dipyridamole",
                "Cilostazol",
                "Eptifibatide",
                "Tirofiban",
                "Abciximab",
                "Argatroban",
                "Bivalirudin",
                "Dalteparin",
                "Nadroparin",
                "Tinzaparin",
                "Danaparoid",
                "Lepirudin",
                "Desirudin",
                "Ximelagatran"
            ],
            "mismatches": [],
            "true_referents": [
                "Abciximab",
                "Apixaban",
                "Argatroban",
                "Aspirin (ASA)",
                "Bivalirudin",
                "Cilostazol",
                "Clopidogrel",
                "Dalteparin",
                "Danaparoid",
                "Desirudin",
                "Dipyridamole",
                "Edoxaban",
                "Enoxaparin",
                "Eptifibatide",
                "Fondaparinux",
                "Heparin",
                "Lepirudin",
                "Nadroparin",
                "Rivaroxaban",
                "Ticagrelor",
                "Tinzaparin",
                "Tirofiban",
                "Warfarin",
                "Ximelagatran"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Aspirin (ASA)",
            "Warfarin",
            "Heparin",
            "Eptifibatide",
            "Tirofiban",
            "Clopidogrel",
            "Ticlopidine",
            "Dipyridamole",
            "Indomethacin",
            "Acenocoumarol",
            "Phenprocoumon",
            "Dicoumarol",
            "Bisulfite",
            "Heparan sulfate",
            "Heparinoid",
            "Coumadin",
            "Plavix",
            "Aggrenox",
            "Effient",
            "Ticlid",
            "Persantine",
            "Warfarin sodium",
            "Coumadin sodium",
            "Eptifibatide acetate",
            "Tirofiban hydrochloride"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspirin (ASA)",
                "Warfarin",
                "Heparin",
                "Eptifibatide",
                "Tirofiban",
                "Clopidogrel",
                "Ticlopidine",
                "Dipyridamole",
                "Indomethacin",
                "Acenocoumarol",
                "Phenprocoumon",
                "Dicoumarol",
                "Bisulfite",
                "Heparan sulfate",
                "Heparinoid",
                "Coumadin",
                "Plavix",
                "Aggrenox",
                "Effient",
                "Ticlid",
                "Persantine",
                "Warfarin sodium",
                "Coumadin sodium",
                "Eptifibatide acetate"
            ],
            "mismatches": [
                "Tirofiban hydrochloride"
            ],
            "true_referents": [
                "Acenocoumarol",
                "Aggrenox",
                "Aspirin (ASA)",
                "Bisulfite",
                "Clopidogrel",
                "Coumadin",
                "Coumadin sodium",
                "Dicoumarol",
                "Dipyridamole",
                "Effient",
                "Eptifibatide",
                "Eptifibatide acetate",
                "Heparan sulfate",
                "Heparin",
                "Heparinoid",
                "Indomethacin",
                "Persantine",
                "Phenprocoumon",
                "Plavix",
                "Ticlid",
                "Ticlopidine",
                "Tirofiban",
                "Warfarin",
                "Warfarin sodium"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": [
            "Warfarin (C19H16O4)",
            "Dicumarol (C19H12O6)",
            "Phenindione (C15H10O2)",
            "Bishydroxycoumarin (C19H12O6)",
            "Acenocoumarol (C19H14O6)",
            "Ethyl biscoumacetate (C21H18O6)",
            "Clorindione (C15H10O3)",
            "Anisindione (C15H12O3)",
            "Phenprocoumon (C18H12O3)",
            "Ticlopidine (C16H14ClNO2S)",
            "Clopidogrel (C16H16ClNO2S)",
            "Prasugrel (C20H20ClNO3S)",
            "Dipyridamole (C24H40N8O4)",
            "Aspirin (C9H8O4)",
            "Indobufene (C20H20N2O3)",
            "Ibuprofen (C13H18O2)",
            "Naproxen (C14H14O3)",
            "Sulfinpyrazone (C13H12N2O3S)",
            "Dipyridamole (C24H40N8O4)",
            "Ximelagatran (C22H25IN2O4)",
            "Melagatran (C14H11IN2O)",
            "Argatroban (C23H36N4O4S)",
            "Bivalirudin (C20H25N5O5)",
            "Lepirudin (C20H25N5O5)",
            "Desirudin (C20H25N5O5)",
            "hirudin (C20H25N5O5)",
            "Efegatran (C23H36N4O4S)",
            "Inogatran (C23H36N4O4S)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Warfarin (C19H16O4)",
                "Dicumarol (C19H12O6)",
                "Phenindione (C15H10O2)",
                "Bishydroxycoumarin (C19H12O6)",
                "Acenocoumarol (C19H14O6)",
                "Ethyl biscoumacetate (C21H18O6)",
                "Clorindione (C15H10O3)",
                "Anisindione (C15H12O3)",
                "Phenprocoumon (C18H12O3)",
                "Ticlopidine (C16H14ClNO2S)",
                "Clopidogrel (C16H16ClNO2S)",
                "Prasugrel (C20H20ClNO3S)",
                "Dipyridamole (C24H40N8O4)",
                "Aspirin (C9H8O4)",
                "Indobufene (C20H20N2O3)",
                "Ibuprofen (C13H18O2)",
                "Naproxen (C14H14O3)",
                "Sulfinpyrazone (C13H12N2O3S)",
                "Ximelagatran (C22H25IN2O4)",
                "Melagatran (C14H11IN2O)",
                "Argatroban (C23H36N4O4S)",
                "Bivalirudin (C20H25N5O5)",
                "Lepirudin (C20H25N5O5)"
            ],
            "mismatches": [
                "Desirudin (C20H25N5O5)",
                "hirudin (C20H25N5O5)",
                "Efegatran (C23H36N4O4S)",
                "Inogatran (C23H36N4O4S)"
            ],
            "true_referents": [
                "Acenocoumarol (C19H14O6)",
                "Anisindione (C15H12O3)",
                "Argatroban (C23H36N4O4S)",
                "Aspirin (C9H8O4)",
                "Bishydroxycoumarin (C19H12O6)",
                "Bivalirudin (C20H25N5O5)",
                "Clopidogrel (C16H16ClNO2S)",
                "Clorindione (C15H10O3)",
                "Dicumarol (C19H12O6)",
                "Dipyridamole (C24H40N8O4)",
                "Ethyl biscoumacetate (C21H18O6)",
                "Ibuprofen (C13H18O2)",
                "Indobufene (C20H20N2O3)",
                "Lepirudin (C20H25N5O5)",
                "Melagatran (C14H11IN2O)",
                "Naproxen (C14H14O3)",
                "Phenindione (C15H10O2)",
                "Phenprocoumon (C18H12O3)",
                "Prasugrel (C20H20ClNO3S)",
                "Sulfinpyrazone (C13H12N2O3S)",
                "Ticlopidine (C16H14ClNO2S)",
                "Warfarin (C19H16O4)",
                "Ximelagatran (C22H25IN2O4)"
            ],
            "TP": 23,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "anticoagulant",
        "domain": "medicine",
        "response": "{\n    \"referent\": \"anticoagulant\",\n    \"description\": \"it is a substance\"\n},\n{\n    \"referent\": \"anticoagulant\",\n    \"description\": \"it slows or prevents the clotting of blood\"\n}",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]