[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Chloramphenicol (CAM)",
            "Vancomycin (VCM)",
            "Metronidazole (MTZ)",
            "Nitrofurantoin (NIT)",
            "Erythromycin (ERY)",
            "Clindamycin (CLI)",
            "Azithromycin (AZI)",
            "Doxycycline (DOX)",
            "Sulfamethoxazole (SXT)",
            "Trimethoprim (TMP)",
            "Linezolid (LZD)",
            "Levofloxacin (LVX)",
            "Moxifloxacin (MXF)",
            "Ceftriaxone (CRO)",
            "Cefazolin (CAZ)",
            "Cefuroxime (CEM)",
            "Amikacin (AMK)",
            "Gentamicin (GEN)",
            "Tobramycin (TOB)",
            "Meropenem (MEM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Chloramphenicol (CAM)",
                "Vancomycin (VCM)",
                "Metronidazole (MTZ)",
                "Nitrofurantoin (NIT)",
                "Azithromycin (AZI)",
                "Doxycycline (DOX)",
                "Trimethoprim (TMP)",
                "Linezolid (LZD)",
                "Levofloxacin (LVX)",
                "Moxifloxacin (MXF)",
                "Ceftriaxone (CRO)",
                "Cefazolin (CAZ)",
                "Amikacin (AMK)",
                "Meropenem (MEM)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole (SXT)",
                "Cefuroxime (CEM)",
                "Gentamicin (GEN)",
                "Tobramycin (TOB)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amikacin disulfate",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefazedone",
                "cefazolin",
                "cefdaloxime",
                "cefmetazole",
                "cefodizime",
                "cefpodoxime",
                "ceftazidime",
                "ceftiolene",
                "ceftizoxime",
                "ceftriaxone",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "dextrofloxacin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "ertapenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "piperacillin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin",
                "viomycin(3+)"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (Penicillin G)",
            "Amoxicillin (Amoxicillin)",
            "Ciprofloxacin (Ciprofloxacin)",
            "Tetracycline (Tetracycline)",
            "Erythromycin (Erythromycin)",
            "Vancomycin (Vancomycin)",
            "Doxycycline (Doxycycline)",
            "Clindamycin (Clindamycin)",
            "Azithromycin (Azithromycin)",
            "Trimethoprim (Trimethoprim)",
            "Sulfamethoxazole (Sulfamethoxazole)",
            "Ceftazidime (Ceftazidime)",
            "Meropenem (Meropenem)",
            "Gentamicin (Gentamicin)",
            "Linezolid (Linezolid)",
            "Moxifloxacin (Moxifloxacin)",
            "Metronidazole (Metronidazole)",
            "Chloramphenicol (Chloramphenicol)",
            "Nitrofurantoin (Nitrofurantoin)",
            "Cephalexin (Cephalexin)",
            "Amikacin (Amikacin)",
            "Rifampin (Rifampin)",
            "Ceftriaxone (Ceftriaxone)",
            "Daptomycin (Daptomycin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (Amoxicillin)",
                "Ciprofloxacin (Ciprofloxacin)",
                "Tetracycline (Tetracycline)",
                "Vancomycin (Vancomycin)",
                "Doxycycline (Doxycycline)",
                "Azithromycin (Azithromycin)",
                "Trimethoprim (Trimethoprim)",
                "Ceftazidime (Ceftazidime)",
                "Meropenem (Meropenem)",
                "Linezolid (Linezolid)",
                "Moxifloxacin (Moxifloxacin)",
                "Metronidazole (Metronidazole)",
                "Chloramphenicol (Chloramphenicol)",
                "Nitrofurantoin (Nitrofurantoin)",
                "Cephalexin (Cephalexin)",
                "Amikacin (Amikacin)",
                "Daptomycin (Daptomycin)"
            ],
            "mismatches": [
                "Penicillin (Penicillin G)",
                "Erythromycin (Erythromycin)",
                "Clindamycin (Clindamycin)",
                "Sulfamethoxazole (Sulfamethoxazole)",
                "Gentamicin (Gentamicin)",
                "Rifampin (Rifampin)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "brodimoprim",
                "cefodizime",
                "ceftazidime",
                "ceftiolene",
                "ceftizoxime",
                "ceftriaxone",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "cloxacillin",
                "co-trimoxazole",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "methacycline",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "moxifloxacin hydrochloride",
                "nalidixic acid",
                "nitrofurantoin",
                "nitrofurazone",
                "ornidazole",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Ampicillin",
            "Amoxicillin (AMX)",
            "Cefalexin (CEF)",
            "Cephalothin",
            "Ceftriaxone",
            "Vancomycin (VAN)",
            "Erythromycin (ERY)",
            "Clindamycin (CLI)",
            "Doxycycline (DOX)",
            "Tetracycline (TET)",
            "Azithromycin (AZM)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMX)",
            "Nitrofurantoin (NIT)",
            "Metronidazole (MET)",
            "Ciprofloxacin (CIP)",
            "Levofloxacin (LEV)",
            "Gentamicin (GEN)",
            "Tobramycin (TOB)",
            "Amikacin (AMK)",
            "Chloramphenicol (CHL)",
            "Fusidic Acid",
            "Teicoplanin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ampicillin",
                "Amoxicillin (AMX)",
                "Ceftriaxone",
                "Vancomycin (VAN)",
                "Doxycycline (DOX)",
                "Tetracycline (TET)",
                "Azithromycin (AZM)",
                "Trimethoprim (TMP)",
                "Nitrofurantoin (NIT)",
                "Metronidazole (MET)",
                "Ciprofloxacin (CIP)",
                "Levofloxacin (LEV)",
                "Amikacin (AMK)",
                "Chloramphenicol (CHL)",
                "Teicoplanin"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Cefalexin (CEF)",
                "Cephalothin",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole (SMX)",
                "Gentamicin (GEN)",
                "Tobramycin (TOB)",
                "Fusidic Acid"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "Augmentin",
                "amikacin",
                "amikacin disulfate",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefadroxil",
                "cefalotin",
                "cefazolin",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephalexin",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clavulanic acid",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "levofloxacin",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "ornidazole",
                "oxytetracycline",
                "pipemidic acid",
                "piromidic acid",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin G (PEN)",
            "Amoxicillin (AMOX)",
            "Ciprofloxacin (CIPRO)",
            "Azithromycin (AZM)",
            "Vancomycin (VAN)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Gentamicin (GEN)",
            "Clindamycin (CLIN)",
            "Doxycycline (DOXY)",
            "Metronidazole (MET)",
            "Sulfamethoxazole/Trimethoprim (SMX/TMP)",
            "Nitrofurantoin (NIT)",
            "Levofloxacin (LEV)",
            "Cephalexin (CEPH)",
            "Imipenem (IMP)",
            "Meropenem (MER)",
            "Polymyxin B (POL)",
            "Bacitracin (BAC)",
            "Mupirocin (MUP)",
            "Fosfomycin (FOS)",
            "Linezolid (LIN)",
            "Daptomycin (DAP)",
            "Tigecycline (TIG)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMOX)",
                "Ciprofloxacin (CIPRO)",
                "Azithromycin (AZM)",
                "Vancomycin (VAN)",
                "Tetracycline (TET)",
                "Doxycycline (DOXY)",
                "Metronidazole (MET)",
                "Nitrofurantoin (NIT)",
                "Levofloxacin (LEV)",
                "Cephalexin (CEPH)",
                "Imipenem (IMP)",
                "Meropenem (MER)",
                "Mupirocin (MUP)",
                "Linezolid (LIN)",
                "Daptomycin (DAP)",
                "Tigecycline (TIG)"
            ],
            "mismatches": [
                "Penicillin G (PEN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Clindamycin (CLIN)",
                "Sulfamethoxazole/Trimethoprim (SMX/TMP)",
                "Polymyxin B (POL)",
                "Bacitracin (BAC)",
                "Fosfomycin (FOS)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "biapenem",
                "cefepime",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "methacycline",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nafcillin",
                "nalidixic acid",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "ornidazole",
                "oxytetracycline",
                "paromomycin sulfate",
                "piperacillin",
                "streptomycin",
                "sulfisoxazole",
                "tetracycline",
                "tigecycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Azithromycin (AZM)",
            "Clindamycin (CLI)",
            "Doxycycline (DOX)",
            "Levofloxacin (LEV)",
            "Vancomycin (VAN)",
            "Gentamicin (GEN)",
            "Metronidazole (MTZ)",
            "Cephalexin (CEX)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMX)",
            "Nitrofurantoin (NIT)",
            "Chloramphenicol (CHL)",
            "Rifampicin (RIF)",
            "Linezolid (LZD)",
            "Tobramycin (TOB)",
            "Meropenem (MER)",
            "Imipenem (IMI)",
            "Daptomycin (DAP)",
            "Fosfomycin (FOS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Azithromycin (AZM)",
                "Doxycycline (DOX)",
                "Levofloxacin (LEV)",
                "Vancomycin (VAN)",
                "Metronidazole (MTZ)",
                "Cephalexin (CEX)",
                "Trimethoprim (TMP)",
                "Nitrofurantoin (NIT)",
                "Chloramphenicol (CHL)",
                "Rifampicin (RIF)",
                "Linezolid (LZD)",
                "Meropenem (MER)",
                "Imipenem (IMI)",
                "Daptomycin (DAP)"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole (SMX)",
                "Tobramycin (TOB)",
                "Fosfomycin (FOS)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "brodimoprim",
                "cefodizime",
                "cefoxitin",
                "ceftazidime",
                "cephalexin",
                "cephalexin monohydrate",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Vancomycin (VAN)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Clindamycin (CLI)",
            "Gentamicin (GEN)",
            "Streptomycin (STR)",
            "Rifampicin (RIF)",
            "Metronidazole (MET)",
            "Doxycycline (DOX)",
            "Nitrofurantoin (NIT)",
            "Azithromycin (AZM)",
            "Cephalexin (CEX)",
            "Sulfamethoxazole/Trimethoprim (SXT)",
            "Linezolid (LIN)",
            "Chloramphenicol (CHL)",
            "Mupirocin (MUP)",
            "Fusidic Acid (FUS)",
            "Ceftriaxone (CRO)",
            "Ceftazidime (CAZ)",
            "Daptomycin (DAP)",
            "Telavancin (TEL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Vancomycin (VAN)",
                "Tetracycline (TET)",
                "Streptomycin (STR)",
                "Rifampicin (RIF)",
                "Metronidazole (MET)",
                "Doxycycline (DOX)",
                "Nitrofurantoin (NIT)",
                "Azithromycin (AZM)",
                "Cephalexin (CEX)",
                "Linezolid (LIN)",
                "Chloramphenicol (CHL)",
                "Mupirocin (MUP)",
                "Ceftriaxone (CRO)",
                "Ceftazidime (CAZ)",
                "Daptomycin (DAP)",
                "Telavancin (TEL)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole/Trimethoprim (SXT)",
                "Fusidic Acid (FUS)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "cefodizime",
                "cefoxitin",
                "ceftazidime",
                "ceftiolene",
                "ceftizoxime",
                "ceftriaxone",
                "cephalexin",
                "cephalexin monohydrate",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "linezolid",
                "metronidazole",
                "metronidazole hydrochloride",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nalidixic acid",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ornidazole",
                "oxytetracycline",
                "pipemidic acid",
                "piromidic acid",
                "rifabutin",
                "rifampicin",
                "scleropyric acid",
                "streptomycin",
                "sulfamethazine",
                "sulfisoxazole",
                "telavancin",
                "telavancin hydrochloride",
                "tetracycline",
                "ticarcillin",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Doxycycline (DOX)",
            "Azithromycin (AZM)",
            "Vancomycin (VAN)",
            "Erythromycin (ERY)",
            "Clindamycin (CLI)",
            "Tetracycline (TET)",
            "Levofloxacin (LEV)",
            "Bacitracin (BAC)",
            "Ceftriaxone (CRO)",
            "Metronidazole (MTZ)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMZ)",
            "Rifampicin (RIF)",
            "Chloramphenicol (CHL)",
            "Gentamicin (GEN)",
            "Streptomycin (STR)",
            "Neomycin (NEO)",
            "Polymyxin B (PMB)",
            "Nitrofurantoin (NIT)",
            "Cefazolin (CFZ)",
            "Cefuroxime (CXM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Doxycycline (DOX)",
                "Azithromycin (AZM)",
                "Vancomycin (VAN)",
                "Tetracycline (TET)",
                "Levofloxacin (LEV)",
                "Ceftriaxone (CRO)",
                "Metronidazole (MTZ)",
                "Trimethoprim (TMP)",
                "Rifampicin (RIF)",
                "Chloramphenicol (CHL)",
                "Streptomycin (STR)",
                "Nitrofurantoin (NIT)",
                "Cefazolin (CFZ)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Bacitracin (BAC)",
                "Sulfamethoxazole (SMZ)",
                "Gentamicin (GEN)",
                "Neomycin (NEO)",
                "Polymyxin B (PMB)",
                "Cefuroxime (CXM)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefazolin",
                "cefdaloxime",
                "cefmetazole",
                "cefoperazone",
                "cefpodoxime",
                "ceftazidime",
                "ceftiolene",
                "ceftizoxime",
                "ceftriaxone",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "levofloxacin",
                "methicillin",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nafcillin",
                "neomycin sulfate",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "paromomycin",
                "paromomycin sulfate",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Vancomycin (VAN)",
            "Amoxicillin (AMX)",
            "Erythromycin (ERY)",
            "Gentamicin (GEN)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Azithromycin (AZI)",
            "Clindamycin (CLI)",
            "Levofloxacin (LEV)",
            "Methicillin (MET)",
            "Doxycycline (DOX)",
            "Ceftriaxone (CFT)",
            "Imipenem (IMP)",
            "Cefotaxime (CTX)",
            "Linezolid (LNZ)",
            "Rifampin (RIF)",
            "Mupirocin (MUP)",
            "Chloramphenicol (CHL)",
            "Nitrofurantoin (NIT)",
            "Colistin (COL)",
            "Daptomycin (DAP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Vancomycin (VAN)",
                "Amoxicillin (AMX)",
                "Azithromycin (AZI)",
                "Levofloxacin (LEV)",
                "Methicillin (MET)",
                "Doxycycline (DOX)",
                "Ceftriaxone (CFT)",
                "Imipenem (IMP)",
                "Cefotaxime (CTX)",
                "Linezolid (LNZ)",
                "Mupirocin (MUP)",
                "Chloramphenicol (CHL)",
                "Nitrofurantoin (NIT)",
                "Daptomycin (DAP)"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole (SMX)",
                "Trimethoprim (TMP)",
                "Clindamycin (CLI)",
                "Rifampin (RIF)",
                "Colistin (COL)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "biapenem",
                "brodimoprim",
                "cefepime",
                "cefixime",
                "cefotaxime",
                "ceftazidime",
                "ceftiolene",
                "ceftizoxime",
                "ceftriaxone",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clometocillin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "methacycline",
                "methicillin",
                "mezlocillin",
                "moxifloxacin",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "tilmicosin",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin G (Benzylpenicillin)",
            "Amoxicillin",
            "Tetracycline",
            "Ciprofloxacin",
            "Erythromycin",
            "Vancomycin",
            "Doxycycline",
            "Chloramphenicol",
            "Azithromycin",
            "Clindamycin",
            "Sulfamethoxazole",
            "Trimethoprim",
            "Cephalexin",
            "Gentamicin (GM)",
            "Metronidazole",
            "Rifampicin",
            "Mupirocin",
            "Linezolid",
            "Nitrofurantoin",
            "Bacitracin",
            "Fosfomycin",
            "Levofloxacin",
            "Imipenem",
            "Streptomycin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin",
                "Tetracycline",
                "Ciprofloxacin",
                "Vancomycin",
                "Doxycycline",
                "Chloramphenicol",
                "Azithromycin",
                "Trimethoprim",
                "Cephalexin",
                "Metronidazole",
                "Rifampicin",
                "Mupirocin",
                "Linezolid",
                "Nitrofurantoin",
                "Levofloxacin",
                "Imipenem",
                "Streptomycin"
            ],
            "mismatches": [
                "Penicillin G (Benzylpenicillin)",
                "Erythromycin",
                "Clindamycin",
                "Sulfamethoxazole",
                "Gentamicin (GM)",
                "Bacitracin",
                "Fosfomycin"
            ],
            "true_referents": [
                "Augmentin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefazolin",
                "cephalexin",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "ciprofloxacin",
                "clarithromycin",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "methacycline",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nafcillin",
                "nalidixic acid",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "ornidazole",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMOX)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Vancomycin (VAN)",
            "Gentamicin (GEN)",
            "Chloramphenicol (CHL)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Metronidazole (MTZ)",
            "Ceftriaxone (CRO)",
            "Azithromycin (AZM)",
            "Clindamycin (CLI)",
            "Doxycycline (DOX)",
            "Meropenem (MEM)",
            "Levofloxacin (LVX)",
            "Linezolid (LZD)",
            "Rifampicin (RIF)",
            "Nitrofurantoin (NIT)",
            "Colistin (CST)",
            "Triclosan",
            "Chlorhexidine",
            "Silver nanoparticles"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMOX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Vancomycin (VAN)",
                "Chloramphenicol (CHL)",
                "Trimethoprim (TMP)",
                "Metronidazole (MTZ)",
                "Ceftriaxone (CRO)",
                "Azithromycin (AZM)",
                "Doxycycline (DOX)",
                "Meropenem (MEM)",
                "Levofloxacin (LVX)",
                "Linezolid (LZD)",
                "Rifampicin (RIF)",
                "Nitrofurantoin (NIT)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole (SMX)",
                "Clindamycin (CLI)",
                "Colistin (CST)",
                "Triclosan",
                "Chlorhexidine",
                "Silver nanoparticles"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "arsphenamine",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefodizime",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clometocillin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "ertapenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "methicillin",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nalidixic acid",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "rifabutin",
                "rifampicin",
                "rosoxacin",
                "salicylhydroxamic acid",
                "silver(1+) sulfadiazinate",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMOX)",
            "Cephalexin (LEX)",
            "Ciprofloxacin (CIP)",
            "Levofloxacin (LEVO)",
            "Doxycycline (DOXY)",
            "Minocycline (MINO)",
            "Tetracycline (TCN)",
            "Erythromycin (ERY)",
            "Azithromycin (AZM)",
            "Clarithromycin (CLR)",
            "Clindamycin (CLI)",
            "Metronidazole (MTZ)",
            "Vancomycin (VAN)",
            "Gentamicin (GEN)",
            "Tobramycin (TOB)",
            "Amikacin (AMK)",
            "Kanamycin (KAN)",
            "Neomycin (NEO)",
            "Streptomycin (STR)",
            "Chloramphenicol (CHL)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMX)",
            "Nitrofurantoin (NIT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMOX)",
                "Cephalexin (LEX)",
                "Ciprofloxacin (CIP)",
                "Levofloxacin (LEVO)",
                "Doxycycline (DOXY)",
                "Minocycline (MINO)",
                "Tetracycline (TCN)",
                "Azithromycin (AZM)",
                "Clarithromycin (CLR)",
                "Metronidazole (MTZ)",
                "Vancomycin (VAN)",
                "Amikacin (AMK)",
                "Neomycin (NEO)",
                "Streptomycin (STR)",
                "Chloramphenicol (CHL)",
                "Trimethoprim (TMP)",
                "Nitrofurantoin (NIT)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Gentamicin (GEN)",
                "Tobramycin (TOB)",
                "Kanamycin (KAN)",
                "Sulfamethoxazole (SMX)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amikacin disulfate",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "kanamycin A sulfate",
                "levofloxacin",
                "methacycline",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "minocycline",
                "neomycin sulfate",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Erythromycin (ERY)",
            "Tetracycline (TET)",
            "Vancomycin (VAN)",
            "Gentamicin (GEN)",
            "Clindamycin (CLN)",
            "Metronidazole (MTZ)",
            "Trimethoprim-sulfamethoxazole (TMP-SMX)",
            "Ceftriaxone (CRO)",
            "Azithromycin (AZM)",
            "Chloramphenicol (CHL)",
            "Rifampicin (RIF)",
            "Nitrofurantoin (NIT)",
            "Mupirocin (MUP)",
            "Fosfomycin (FOS)",
            "Linezolid (LZD)",
            "Daptomycin (DAP)",
            "Tigecycline (TGC)",
            "Cefepime (FEP)",
            "Meropenem (MEM)",
            "Colistin (COL)",
            "Fidaxomicin (FDX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Vancomycin (VAN)",
                "Metronidazole (MTZ)",
                "Ceftriaxone (CRO)",
                "Azithromycin (AZM)",
                "Chloramphenicol (CHL)",
                "Rifampicin (RIF)",
                "Nitrofurantoin (NIT)",
                "Mupirocin (MUP)",
                "Linezolid (LZD)",
                "Daptomycin (DAP)",
                "Tigecycline (TGC)",
                "Cefepime (FEP)",
                "Fidaxomicin (FDX)",
                "Meropenem (MEM)"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Clindamycin (CLN)",
                "Trimethoprim-sulfamethoxazole (TMP-SMX)",
                "Fosfomycin (FOS)",
                "Colistin (COL)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "cefepime",
                "cefepime hydrochloride",
                "cefixime",
                "cefodizime",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clometocillin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "daptomycin",
                "difloxacin",
                "dihydrooroxylin A",
                "ertapenem",
                "fidaxomicin",
                "fleroxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "oxytetracycline",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "tigecycline",
                "tilmicosin",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Chlorhexidine (CHX)",
            "Triclosan (TRI)",
            "Hydrogen Peroxide (H2O2)",
            "Ethanol (EtOH)",
            "Silver Nanoparticles (AgNPs)",
            "Lysozyme (LYS)",
            "Nisin (NIS)",
            "Chitosan (CHI)",
            "Propolis (PRO)",
            "Oregano Essential Oil (OEO)",
            "Thymol (THY)",
            "Carvacrol (CAR)",
            "Allicin (ALL)",
            "Berberine (BER)",
            "Curcumin (CUR)",
            "Gallium (Ga)",
            "Bacteriophages (Phages)",
            "Lactoferrin (LF)",
            "Defensins (DEF)",
            "Cathelicidins (CAT)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin",
                "Ciprofloxacin",
                "Tetracycline"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Chlorhexidine (CHX)",
                "Triclosan (TRI)",
                "Hydrogen Peroxide (H2O2)",
                "Ethanol (EtOH)",
                "Silver Nanoparticles (AgNPs)",
                "Lysozyme (LYS)",
                "Nisin (NIS)",
                "Chitosan (CHI)",
                "Propolis (PRO)",
                "Oregano Essential Oil (OEO)",
                "Thymol (THY)",
                "Carvacrol (CAR)",
                "Allicin (ALL)",
                "Berberine (BER)",
                "Curcumin (CUR)",
                "Gallium (Ga)",
                "Bacteriophages (Phages)",
                "Lactoferrin (LF)",
                "Defensins (DEF)",
                "Cathelicidins (CAT)"
            ],
            "true_referents": [
                "(R)-N-trans-feruloyloctopamine",
                "(R)-chlorphenesin",
                "(S)-chlorphenesin",
                "(S)-iclaprim",
                "(S)-nadifloxacin",
                "4-aminosalicylic acid",
                "5alpha-epoxyalantolactone",
                "S-ethyl-L-cysteine",
                "amoxicillin",
                "ampicillin",
                "arsphenamine",
                "benzyl isothiocyanate",
                "carbenicillin",
                "caribenol A",
                "carumonam",
                "caseargrewiin B",
                "cefoxitin",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clavulanic acid",
                "cloxacillin",
                "cyclacillin",
                "dalfopristin",
                "difloxacin",
                "doxycycline",
                "durlobactam",
                "ergosterol peroxide",
                "ethambutol",
                "methicillin",
                "multiorthoquinone",
                "mupirocin calcium (anhydrous)",
                "nalidixic acid",
                "oxolinic acid",
                "oxytetracycline",
                "physalin D",
                "piperacillin",
                "pisonin B",
                "prontosil",
                "salicylhydroxamic acid",
                "silver(1+) sulfadiazinate",
                "streptomycin",
                "tetracycline",
                "tetrahydroxysqualene",
                "thalidomide",
                "trimethoprim",
                "undecanal",
                "vancomycin",
                "viomycin(3+)",
                "viridiflorol"
            ],
            "TP": 3,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (Pen)",
            "Tetracycline",
            "Metronidazole",
            "Vancomycin",
            "Ciprofloxacin",
            "Amoxicillin",
            "Augmentin",
            "Clindamycin",
            "Linezolid",
            "Rifampicin",
            "Streptomycin",
            "Chloramphenicol",
            "Neomycin",
            "Polymyxin B",
            "Colistin",
            "Tyrothricin",
            "Neosporin",
            "Oxytetracycline",
            "Minocycline",
            "Ofloxacin",
            "Cipro",
            "Levofloxacin",
            "Amikacin",
            "Moxifloxacin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tetracycline",
                "Metronidazole",
                "Vancomycin",
                "Ciprofloxacin",
                "Amoxicillin",
                "Augmentin",
                "Linezolid",
                "Rifampicin",
                "Streptomycin",
                "Chloramphenicol",
                "Oxytetracycline",
                "Minocycline",
                "Ofloxacin",
                "Levofloxacin",
                "Amikacin",
                "Moxifloxacin"
            ],
            "mismatches": [
                "Penicillin (Pen)",
                "Clindamycin",
                "Neomycin",
                "Polymyxin B",
                "Colistin",
                "Tyrothricin",
                "Neosporin",
                "Cipro"
            ],
            "true_referents": [
                "Augmentin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "cloxacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "levofloxacin",
                "linezolid",
                "methacycline",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "minocycline",
                "moxifloxacin",
                "nalidixic acid",
                "neomycin sulfate",
                "ofloxacin",
                "ornidazole",
                "oxytetracycline",
                "piperacillin",
                "rifampicin",
                "spectinomycin",
                "streptomycin",
                "teicoplanin",
                "tetracycline",
                "tilmicosin",
                "vancomycin",
                "viomycin"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin G (PCN)",
            "Ampicillin (AMP)",
            "Amoxicillin (AMX)",
            "Cephalexin (CEP)",
            "Ciprofloxacin (CIP)",
            "Gentamicin (GEN)",
            "Tetracycline (TET)",
            "Doxycycline (DOX)",
            "Metronidazole (MTZ)",
            "Vancomycin (VAN)",
            "Linezolid (LZD)",
            "Clindamycin (CLI)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Rifampicin (RIF)",
            "Isoniazid (INH)",
            "Ethambutol (EMB)",
            "Pyrazinamide (PZA)",
            "Streptomycin (STR)",
            "Chloramphenicol (CHL)",
            "Telithromycin (TEL)",
            "Meropenem (MER)",
            "Doripenem (DOR)",
            "Faropenem (FAR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ampicillin (AMP)",
                "Amoxicillin (AMX)",
                "Cephalexin (CEP)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Doxycycline (DOX)",
                "Metronidazole (MTZ)",
                "Vancomycin (VAN)",
                "Linezolid (LZD)",
                "Trimethoprim (TMP)",
                "Rifampicin (RIF)",
                "Isoniazid (INH)",
                "Ethambutol (EMB)",
                "Streptomycin (STR)",
                "Chloramphenicol (CHL)",
                "Meropenem (MER)"
            ],
            "mismatches": [
                "Penicillin G (PCN)",
                "Gentamicin (GEN)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole (SMX)",
                "Pyrazinamide (PZA)",
                "Telithromycin (TEL)",
                "Doripenem (DOR)",
                "Faropenem (FAR)"
            ],
            "true_referents": [
                "(R)-iclaprim",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "antimycobacterial drug",
                "antitubercular agent",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "biapenem",
                "brodimoprim",
                "cefodizime",
                "ceftazidime",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "ertapenem",
                "ethambutol",
                "ethambutol dihydrochloride",
                "imipenem",
                "isoniazide",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "oxytetracycline",
                "piperacillin",
                "pyrazine-2-carboxylic acid",
                "pyrazinecarboxamide",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Aminoglycoside (AMI)",
                "Canonical Name": "Aminoglycoside"
            },
            {
                "Referent": "Alcohol (ALC)",
                "Canonical Name": "Alcohol"
            },
            {
                "Referent": "Antibiotic (ABT)",
                "Canonical Name": "Antibiotic"
            },
            {
                "Referent": "Antifungal agent (AFG)",
                "Canonical Name": "Antifungal agent"
            },
            {
                "Referent": "Antimicrobial agent (AMT)",
                "Canonical Name": "Antimicrobial agent"
            },
            {
                "Referent": "Antiviral agent (AVG)",
                "Canonical Name": "Antiviral agent"
            },
            {
                "Referent": "Aureomycin (AUR)",
                "Canonical Name": "Aureomycin"
            },
            {
                "Referent": "Benzalkonium chloride (BZK)",
                "Canonical Name": "Benzalkonium chloride"
            },
            {
                "Referent": "Chlorhexidine (CHX)",
                "Canonical Name": "Chlorhexidine"
            },
            {
                "Referent": "Daptomycin (DAP)",
                "Canonical Name": "Daptomycin"
            },
            {
                "Referent": "Didecyldimethylammonium chloride (DDAC)",
                "Canonical Name": "Didecyldimethylammonium chloride"
            },
            {
                "Referent": "Dihydrostreptomycin (DHS)",
                "Canonical Name": "Dihydrostreptomycin"
            },
            {
                "Referent": "Diphenylcyclopropenone (DPCP)",
                "Canonical Name": "Diphenylcyclopropenone"
            },
            {
                "Referent": "Edetate disodium (EDTA)",
                "Canonical Name": "Edetate disodium"
            },
            {
                "Referent": "Erythromycin (ERY)",
                "Canonical Name": "Erythromycin"
            },
            {
                "Referent": "Fluoroquinolone (FLQ)",
                "Canonical Name": "Fluoroquinolone"
            },
            {
                "Referent": "Gentamicin (GEN)",
                "Canonical Name": "Gentamicin"
            },
            {
                "Referent": "Hexachlorophene (HCP)",
                "Canonical Name": "Hexachlorophene"
            },
            {
                "Referent": "Iodine (IOD)",
                "Canonical Name": "Iodine"
            },
            {
                "Referent": "Isoxazolyl penicillin (IPN)",
                "Canonical Name": "Isoxazolyl penicillin"
            },
            {
                "Referent": "Kanamycin (KAN)",
                "Canonical Name": "Kanamycin"
            },
            {
                "Referent": "Miconazole (MCZ)",
                "Canonical Name": "Miconazole"
            },
            {
                "Referent": "Neomycin (NEO)",
                "Canonical Name": "Neomycin"
            },
            {
                "Referent": "Penicillin (PEN)",
                "Canonical Name": "Penicillin"
            },
            {
                "Referent": "Phenol (PHE)",
                "Canonical Name": "Phenol"
            },
            {
                "Referent": "Polymyxin B (POL)",
                "Canonical Name": "Polymyxin B"
            },
            {
                "Referent": "Quaternary ammonium compound (QAC)",
                "Canonical Name": "Quaternary ammonium compound"
            },
            {
                "Referent": "Silver nitrate (SIL)",
                "Canonical Name": "Silver nitrate"
            },
            {
                "Referent": "Sulfadiazine (SDZ)",
                "Canonical Name": "Sulfadiazine"
            },
            {
                "Referent": "Sulfamethoxazole (SMX)",
                "Canonical Name": "Sulfamethoxazole"
            },
            {
                "Referent": "Thiostrepton (THI)",
                "Canonical Name": "Thiostrepton"
            },
            {
                "Referent": "Triclosan (TCL)",
                "Canonical Name": "Triclosan"
            },
            {
                "Referent": "Vancomycin (VAN)",
                "Canonical Name": "Vancomycin"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Daptomycin",
                "Vancomycin"
            ],
            "mismatches": [
                "Aminoglycoside",
                "Alcohol",
                "Antibiotic",
                "Antifungal agent",
                "Antimicrobial agent",
                "Antiviral agent",
                "Aureomycin",
                "Benzalkonium chloride",
                "Chlorhexidine",
                "Didecyldimethylammonium chloride",
                "Dihydrostreptomycin",
                "Diphenylcyclopropenone",
                "Edetate disodium",
                "Erythromycin",
                "Fluoroquinolone",
                "Gentamicin",
                "Hexachlorophene",
                "Iodine",
                "Isoxazolyl penicillin",
                "Kanamycin",
                "Miconazole",
                "Neomycin",
                "Penicillin",
                "Phenol",
                "Polymyxin B",
                "Quaternary ammonium compound",
                "Silver nitrate",
                "Sulfadiazine",
                "Sulfamethoxazole",
                "Thiostrepton",
                "Triclosan"
            ],
            "true_referents": [
                "(R)-chlorphenesin",
                "(R)-temafloxacin",
                "(S)-chlorphenesin",
                "(S)-nadifloxacin",
                "(S)-temafloxacin",
                "1-(2-hydroxy-4-methoxyphenyl)-3-(4-hydroxy-3-methoxyphenyl)propane",
                "3-nitropropanoic acid",
                "amikacin",
                "antitubercular agent",
                "apramycin",
                "arsphenamine",
                "benzylpenicillin",
                "cefotetan disodium",
                "daptomycin",
                "ethionamide",
                "fenticonazole",
                "isoconazole",
                "methicillin",
                "neomycin sulfate",
                "silver(1+) sulfadiazinate",
                "streptomycin",
                "undecanal",
                "vancomycin",
                "viomycin",
                "viomycin(3+)"
            ],
            "TP": 2,
            "FP": 31,
            "FN": 0
        }
    }
]