[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Tetracycline (TET)",
            "Ciprofloxacin (CIP)",
            "Amoxicillin (AMX)",
            "Clindamycin",
            "Erythromycin",
            "Vancomycin (VCM)",
            "Metronidazole (MTZ)",
            "Azithromycin",
            "Cephalexin",
            "Doxycycline",
            "Levofloxacin",
            "Nitrofurantoin",
            "Sulfamethoxazole-Trimethoprim (SMX-TMP)",
            "Chloramphenicol",
            "Fosfomycin",
            "Linezolid",
            "Moxifloxacin",
            "Quinupristin-Dalfopristin",
            "Tedizolid",
            "Meropenem",
            "Tigecycline",
            "Daptomycin",
            "Colistin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tetracycline (TET)",
                "Ciprofloxacin (CIP)",
                "Amoxicillin (AMX)",
                "Vancomycin (VCM)",
                "Metronidazole (MTZ)",
                "Azithromycin",
                "Cephalexin",
                "Doxycycline",
                "Levofloxacin",
                "Nitrofurantoin",
                "Chloramphenicol",
                "Linezolid",
                "Moxifloxacin",
                "Meropenem",
                "Tigecycline",
                "Daptomycin"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Clindamycin",
                "Erythromycin",
                "Sulfamethoxazole-Trimethoprim (SMX-TMP)",
                "Fosfomycin",
                "Quinupristin-Dalfopristin",
                "Tedizolid",
                "Colistin"
            ],
            "true_referents": [
                "(R)-nadifloxacin",
                "Augmentin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "cefazolin",
                "cefodizime",
                "cephalexin",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "dalbavancin",
                "dalfopristin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "furazolidone",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "methicillin",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nalidixic acid",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "rifabutin",
                "streptomycin",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "tigecycline",
                "tilmicosin",
                "trimethoprim",
                "vancomycin",
                "viomycin",
                "viomycin(3+)"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (Penicillin G)",
            "Tetracycline (Tetracycline HCl)",
            "Ciprofloxacin (Ciprofloxacin HCl)",
            "Erythromycin (Erythromycin Stearate)",
            "Amoxicillin (Amoxicillin Trihydrate)",
            "Vancomycin (Vancomycin Hydrochloride)",
            "Doxycycline (Doxycycline Hyclate)",
            "Clindamycin (Clindamycin Phosphate)",
            "Azithromycin (Azithromycin Trihydrate)",
            "Cephalexin (Cephalexin Monohydrate)",
            "Metronidazole (Metronidazole Hydrochloride)",
            "Gentamicin (Gentamicin Sulfate)",
            "Trimethoprim (Trimethoprim)",
            "Sulfamethoxazole (Sulfamethoxazole)",
            "Meropenem (Meropenem Trihydrate)",
            "Linezolid (Linezolid)",
            "Daptomycin (Daptomycin)",
            "Rifampin (Rifampicin)",
            "Moxifloxacin (Moxifloxacin Hydrochloride)",
            "Levofloxacin (Levofloxacin)",
            "Clarithromycin (Clarithromycin)",
            "Tigecycline (Tigecycline)",
            "Fosfomycin (Fosfomycin Trometamol)",
            "Nitrofurantoin (Nitrofurantoin Monohydrate)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ciprofloxacin (Ciprofloxacin HCl)",
                "Amoxicillin (Amoxicillin Trihydrate)",
                "Doxycycline (Doxycycline Hyclate)",
                "Cephalexin (Cephalexin Monohydrate)",
                "Metronidazole (Metronidazole Hydrochloride)",
                "Trimethoprim (Trimethoprim)",
                "Meropenem (Meropenem Trihydrate)",
                "Linezolid (Linezolid)",
                "Daptomycin (Daptomycin)",
                "Moxifloxacin (Moxifloxacin Hydrochloride)",
                "Levofloxacin (Levofloxacin)",
                "Clarithromycin (Clarithromycin)",
                "Tigecycline (Tigecycline)",
                "Nitrofurantoin (Nitrofurantoin Monohydrate)"
            ],
            "mismatches": [
                "Penicillin (Penicillin G)",
                "Tetracycline (Tetracycline HCl)",
                "Erythromycin (Erythromycin Stearate)",
                "Vancomycin (Vancomycin Hydrochloride)",
                "Clindamycin (Clindamycin Phosphate)",
                "Azithromycin (Azithromycin Trihydrate)",
                "Gentamicin (Gentamicin Sulfate)",
                "Sulfamethoxazole (Sulfamethoxazole)",
                "Rifampin (Rifampicin)",
                "Fosfomycin (Fosfomycin Trometamol)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "amoxicillin trihydrate",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "brodimoprim",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "cloxacillin",
                "co-trimoxazole",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "methacycline",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "moxifloxacin hydrochloride",
                "nalidixic acid",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "ornidazole",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "rosoxacin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "tigecycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Ampicillin",
            "Amoxicillin (AMX)",
            "Cefalexin (CEF)",
            "Cephalosporin (CEP)",
            "Erythromycin (ERY)",
            "Tetracycline (TCN)",
            "Doxycycline (DOX)",
            "Minocycline (MINO)",
            "Vancomycin (VAN)",
            "Ciprofloxacin (CIP)",
            "Levofloxacin (LEV)",
            "Azithromycin (AZI)",
            "Clindamycin (CLI)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMX)",
            "Metronidazole (MET)",
            "Gentamicin (GEN)",
            "Tobramycin (TOB)",
            "Streptomycin (STR)",
            "Chloramphenicol (CHL)",
            "Nitrofurantoin (NFT)",
            "Fusidic Acid (FUS)",
            "Linezolid (LNZ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ampicillin",
                "Vancomycin",
                "Ciprofloxacin",
                "Levofloxacin",
                "Azithromycin",
                "Trimethoprim",
                "Metronidazole",
                "Streptomycin",
                "Chloramphenicol",
                "Nitrofurantoin",
                "Linezolid"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Amoxicillin (AMX)",
                "Cefalexin (CEF)",
                "Cephalosporin (CEP)",
                "Erythromycin (ERY)",
                "Tetracycline (TCN)",
                "Doxycycline (DOX)",
                "Minocycline (MINO)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole (SMX)",
                "Gentamicin (GEN)",
                "Tobramycin (TOB)",
                "Fusidic Acid (FUS)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefadroxil",
                "cefalotin",
                "cefazolin",
                "cefoperazone",
                "ceftizoxime",
                "cephalexin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "levofloxacin",
                "linezolid",
                "methacycline",
                "metronidazole",
                "metronidazole hydrochloride",
                "mezlocillin",
                "minocycline",
                "moxifloxacin",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "ornidazole",
                "pipemidic acid",
                "piromidic acid",
                "rifabutin",
                "scleropyric acid",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin G (PenG)",
            "Amoxicillin (Amox)",
            "Tetracycline (Tetr)",
            "Erythromycin (Eryth)",
            "Ciprofloxacin (Cipro)",
            "Azithromycin (Azith)",
            "Vancomycin (Vanc)",
            "Gentamicin (Gent)",
            "Streptomycin (Strep)",
            "Chloramphenicol (Chl)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Clindamycin (Clinda)",
            "Metronidazole (Metro)",
            "Daptomycin (Dapt)",
            "Linezolid (Linez)",
            "Polymyxin B (PolB)",
            "Bacitracin (Bact)",
            "Neomycin (Neo)",
            "Nitrofurantoin (Nitro)",
            "Fosfomycin (Fos)",
            "Tigecycline (Tige)",
            "Moxifloxacin (Moxi)",
            "Levofloxacin (Lev)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (Amox)",
                "Tetracycline (Tetr)",
                "Ciprofloxacin (Cipro)",
                "Azithromycin (Azith)",
                "Vancomycin (Vanc)",
                "Streptomycin (Strep)",
                "Chloramphenicol (Chl)",
                "Trimethoprim (TMP)",
                "Metronidazole (Metro)",
                "Daptomycin (Dapt)",
                "Linezolid (Linez)",
                "Nitrofurantoin (Nitro)",
                "Tigecycline (Tige)",
                "Moxifloxacin (Moxi)",
                "Levofloxacin (Lev)"
            ],
            "mismatches": [
                "Penicillin G (PenG)",
                "Erythromycin (Eryth)",
                "Gentamicin (Gent)",
                "Sulfamethoxazole (SMX)",
                "Clindamycin (Clinda)",
                "Polymyxin B (PolB)",
                "Bacitracin (Bact)",
                "Neomycin (Neo)",
                "Fosfomycin (Fos)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "2-nitroimidazole",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "ceftazidime",
                "ceftizoxime",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "levofloxacin",
                "linezolid",
                "methicillin",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "moxifloxacin hydrochloride",
                "nalidixic acid",
                "neomycin sulfate",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "piperacillin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "tigecycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Erythromycin (ERY)",
            "Tetracycline (TET)",
            "Doxycycline (DOX)",
            "Azithromycin (AZI)",
            "Clindamycin (CLI)",
            "Vancomycin (VAN)",
            "Gentamicin (GEN)",
            "Cephalexin (CEF)",
            "Metronidazole (MTZ)",
            "Levofloxacin (LVX)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMX)",
            "Rifampicin (RIF)",
            "Chloramphenicol (CHL)",
            "Nitrofurantoin (NIT)",
            "Linezolid (LZD)",
            "Meropenem (MEM)",
            "Imipenem (IMI)",
            "Tigecycline (TGC)",
            "Piperacillin (PIP)",
            "Ceftriaxone (CRO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Doxycycline (DOX)",
                "Azithromycin (AZI)",
                "Vancomycin (VAN)",
                "Cephalexin (CEF)",
                "Metronidazole (MTZ)",
                "Levofloxacin (LVX)",
                "Trimethoprim (TMP)",
                "Rifampicin (RIF)",
                "Chloramphenicol (CHL)",
                "Nitrofurantoin (NIT)",
                "Linezolid (LZD)",
                "Meropenem (MEM)",
                "Imipenem (IMI)",
                "Tigecycline (TGC)",
                "Piperacillin (PIP)",
                "Ceftriaxone (CRO)"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole (SMX)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "brodimoprim",
                "cefazolin",
                "cefixime",
                "cefodizime",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephalexin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "ertapenem",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "tigecycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Vancomycin (VAN)",
            "Gentamicin (GEN)",
            "Clindamycin (CLI)",
            "Metronidazole (MET)",
            "Doxycycline (DOX)",
            "Azithromycin (AZI)",
            "Rifampicin (RIF)",
            "Streptomycin (STR)",
            "Chloramphenicol (CHL)",
            "Fidaxomicin (FID)",
            "Moxifloxacin (MOX)",
            "Sulfamethoxazole/Trimethoprim (SXT)",
            "Nitrofurantoin (NIT)",
            "Ceftriaxone (CEF)",
            "Nafcillin (NAF)",
            "Linezolid (LIN)",
            "Tobramycin (TOB)",
            "Colistin (COL)",
            "Bacitracin (BAC)",
            "Clarithromycin (CLA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Vancomycin (VAN)",
                "Metronidazole (MET)",
                "Doxycycline (DOX)",
                "Azithromycin (AZI)",
                "Rifampicin (RIF)",
                "Streptomycin (STR)",
                "Chloramphenicol (CHL)",
                "Fidaxomicin (FID)",
                "Moxifloxacin (MOX)",
                "Nitrofurantoin (NIT)",
                "Ceftriaxone (CEF)",
                "Nafcillin (NAF)",
                "Linezolid (LIN)",
                "Clarithromycin (CLA)"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole/Trimethoprim (SXT)",
                "Tobramycin (TOB)",
                "Colistin (COL)",
                "Bacitracin (BAC)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clometocillin",
                "clomocycline",
                "cloxacillin",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "fidaxomicin",
                "flucloxacillin",
                "linezolid",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "moxifloxacin hydrochloride",
                "nafcillin",
                "nalidixic acid",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ornidazole",
                "oxytetracycline",
                "physalin D",
                "piperacillin",
                "piromidic acid",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfamethazine",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "tilmicosin",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 17,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMX)",
            "Ciprofloxacin (CIP)",
            "Vancomycin (VAN)",
            "Tetracycline (TET)",
            "Doxycycline (DOX)",
            "Erythromycin (ERY)",
            "Clindamycin (CLI)",
            "Metronidazole (MET)",
            "Chloramphenicol (CHL)",
            "Streptomycin (STR)",
            "Rifampicin (RIF)",
            "Trimethoprim (TMP)",
            "Sulfamethoxazole (SMX)",
            "Minocycline (MIN)",
            "Levofloxacin (LEV)",
            "Moxifloxacin (MOX)",
            "Linezolid (LZD)",
            "Cephalexin (CEX)",
            "Ceftriaxone (CTR)",
            "Meropenem (MER)",
            "Daptomycin (DAP)",
            "Gentamicin (GEN)",
            "Amikacin (AMK)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMX)",
                "Ciprofloxacin (CIP)",
                "Vancomycin (VAN)",
                "Tetracycline (TET)",
                "Doxycycline (DOX)",
                "Chloramphenicol (CHL)",
                "Streptomycin (STR)",
                "Rifampicin (RIF)",
                "Trimethoprim (TMP)",
                "Minocycline (MIN)",
                "Levofloxacin (LEV)",
                "Moxifloxacin (MOX)",
                "Linezolid (LZD)",
                "Cephalexin (CEX)",
                "Ceftriaxone (CTR)",
                "Meropenem (MER)",
                "Daptomycin (DAP)",
                "Amikacin (AMK)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Metronidazole (MET)",
                "Sulfamethoxazole (SMX)",
                "Gentamicin (GEN)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "amikacin",
                "amikacin disulfate",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefditoren",
                "cefodizime",
                "cefoxitin",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephalexin",
                "cephalexin monohydrate",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "methacycline",
                "metronidazole",
                "metronidazole hydrochloride",
                "minocycline",
                "moxifloxacin",
                "moxifloxacin hydrochloride",
                "ofloxacin",
                "ornidazole",
                "oxytetracycline",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin",
            "Ciprofloxacin",
            "Amoxicillin",
            "Tetracycline",
            "Erythromycin",
            "Vancomycin",
            "Gentamicin",
            "Ceftriaxone",
            "Trimethoprim-sulfamethoxazole",
            "Clindamycin",
            "Azithromycin",
            "Levofloxacin",
            "Methicillin",
            "Doxycycline",
            "Metronidazole",
            "Cephalosporin",
            "Linezolid",
            "Ampicillin",
            "Chloramphenicol",
            "Rifampin",
            "Sulfamethoxazole",
            "Isoniazid",
            "Streptomycin",
            "Gatifloxacin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Ciprofloxacin",
                "Amoxicillin",
                "Tetracycline",
                "Vancomycin",
                "Ceftriaxone",
                "Azithromycin",
                "Levofloxacin",
                "Methicillin",
                "Doxycycline",
                "Metronidazole",
                "Linezolid",
                "Ampicillin",
                "Chloramphenicol",
                "Streptomycin"
            ],
            "mismatches": [
                "Penicillin",
                "Erythromycin",
                "Gentamicin",
                "Trimethoprim-sulfamethoxazole",
                "Clindamycin",
                "Cephalosporin",
                "Rifampin",
                "Sulfamethoxazole",
                "Isoniazid",
                "Gatifloxacin"
            ],
            "true_referents": [
                "Augmentin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "antimycobacterial drug",
                "antitubercular agent",
                "apramycin",
                "azithromycin",
                "cefalotin",
                "cefazolin",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "ciprofloxacin",
                "clarithromycin",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "isoniazide",
                "levofloxacin",
                "linezolid",
                "methacycline",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nalidixic acid",
                "ofloxacin",
                "ornidazole",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin G (PenG)",
            "Amoxicillin (Amox)",
            "Tetracycline",
            "Erythromycin",
            "Ciprofloxacin (Cipro)",
            "Chloramphenicol",
            "Vancomycin",
            "Gentamicin",
            "Streptomycin",
            "Doxycycline",
            "Clindamycin",
            "Metronidazole",
            "Azithromycin",
            "Sulfamethoxazole",
            "Rifampin",
            "Linezolid",
            "Tobramycin",
            "Nitrofurantoin",
            "Trimethoprim",
            "Bacitracin",
            "Neomycin",
            "Fosfomycin",
            "Colistin",
            "Mupirocin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (Amox)",
                "Tetracycline",
                "Ciprofloxacin (Cipro)",
                "Chloramphenicol",
                "Vancomycin",
                "Streptomycin",
                "Doxycycline",
                "Metronidazole",
                "Azithromycin",
                "Linezolid",
                "Nitrofurantoin",
                "Trimethoprim",
                "Neomycin",
                "Mupirocin"
            ],
            "mismatches": [
                "Penicillin G (PenG)",
                "Erythromycin",
                "Gentamicin",
                "Clindamycin",
                "Sulfamethoxazole",
                "Rifampin",
                "Tobramycin",
                "Bacitracin",
                "Fosfomycin",
                "Colistin"
            ],
            "true_referents": [
                "Augmentin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cethromycin",
                "chloramphenicol",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "linezolid",
                "methacycline",
                "methicillin",
                "metronidazole",
                "metronidazole hydrochloride",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nafcillin",
                "nalidixic acid",
                "neomycin sulfate",
                "nitrofurantoin",
                "nitrofurazone",
                "ornidazole",
                "piperacillin",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "tilmicosin",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMOX)",
            "Ciprofloxacin (CIP)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Gentamicin (GEN)",
            "Vancomycin (VAN)",
            "Ceftriaxone (CRO)",
            "Azithromycin (AZM)",
            "Doxycycline (DOX)",
            "Metronidazole (MTZ)",
            "Clindamycin (CLI)",
            "Trimethoprim-sulfamethoxazole (TMP-SMX)",
            "Levofloxacin (LVX)",
            "Meropenem (MEM)",
            "Cephalexin (LEX)",
            "Chloramphenicol (CHL)",
            "Rifampicin (RIF)",
            "Clarithromycin (CLR)",
            "Ampicillin (AMP)",
            "Streptomycin (STR)",
            "Linezolid (LZD)",
            "Nitrofurantoin (NIT)",
            "Polymyxin B (PMB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMOX)",
                "Ciprofloxacin (CIP)",
                "Tetracycline (TET)",
                "Vancomycin (VAN)",
                "Ceftriaxone (CRO)",
                "Azithromycin (AZM)",
                "Doxycycline (DOX)",
                "Metronidazole (MTZ)",
                "Levofloxacin (LVX)",
                "Meropenem (MEM)",
                "Cephalexin (LEX)",
                "Chloramphenicol (CHL)",
                "Rifampicin (RIF)",
                "Clarithromycin (CLR)",
                "Ampicillin (AMP)",
                "Streptomycin (STR)",
                "Linezolid (LZD)",
                "Nitrofurantoin (NIT)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Clindamycin (CLI)",
                "Trimethoprim-sulfamethoxazole (TMP-SMX)",
                "Polymyxin B (PMB)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "cefodizime",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "ertapenem",
                "levofloxacin",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ofloxacin",
                "oxytetracycline",
                "paromomycin",
                "paromomycin sulfate",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PCN)",
            "Amoxicillin (AMOX)",
            "Ciprofloxacin (CIP)",
            "Doxycycline (DOXY)",
            "Erythromycin (ERY)",
            "Tetracycline (TET)",
            "Gentamicin (GEN)",
            "Vancomycin (VAN)",
            "Cephalexin (CEX)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Clindamycin (CLI)",
            "Azithromycin (AZM)",
            "Metronidazole (MTZ)",
            "Nitrofurantoin (NFT)",
            "Chloramphenicol (CAP)",
            "Rifampin (RIF)",
            "Mupirocin (MUP)",
            "Linezolid (LZD)",
            "Quinupristin/Dalfopristin (Q/D)",
            "Daptomycin (DAP)",
            "Tigecycline (TGC)",
            "Fosfomycin (FOS)",
            "Fusidic Acid (FA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amoxicillin (AMOX)",
                "Ciprofloxacin (CIP)",
                "Doxycycline (DOXY)",
                "Tetracycline (TET)",
                "Vancomycin (VAN)",
                "Cephalexin (CEX)",
                "Trimethoprim (TMP)",
                "Azithromycin (AZM)",
                "Metronidazole (MTZ)",
                "Nitrofurantoin (NFT)",
                "Chloramphenicol (CAP)",
                "Mupirocin (MUP)",
                "Linezolid (LZD)",
                "Daptomycin (DAP)",
                "Tigecycline (TGC)"
            ],
            "mismatches": [
                "Penicillin (PCN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole (SMX)",
                "Clindamycin (CLI)",
                "Rifampin (RIF)",
                "Quinupristin/Dalfopristin (Q/D)",
                "Fosfomycin (FOS)",
                "Fusidic Acid (FA)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(R)-nadifloxacin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefodizime",
                "cefoxitin",
                "ceftazidime",
                "cephalexin",
                "cephalexin monohydrate",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "dalfopristin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "linezolid",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nitrofurantoin",
                "nitrofurazone",
                "oxytetracycline",
                "pipemidic acid",
                "piperacillin",
                "piromidic acid",
                "rifabutin",
                "rifampicin",
                "scleropyric acid",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "tigecycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Streptomycin (STR)",
            "Tetracycline (TET)",
            "Erythromycin (ERY)",
            "Chloramphenicol (CHL)",
            "Ciprofloxacin (CIP)",
            "Gentamicin (GEN)",
            "Vancomycin (VAN)",
            "Ampicillin (AMP)",
            "Amoxicillin (AMX)",
            "Cephalexin (CEX)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Nitrofurantoin (NIT)",
            "Metronidazole (MTZ)",
            "Clindamycin (CLN)",
            "Rifampin (RIF)",
            "Isoniazid (INH)",
            "Pyrazinamide (PZA)",
            "Ethambutol (EMB)",
            "Triclosan",
            "Chlorhexidine",
            "Hydrogen Peroxide (H2O2)",
            "Ethanol (EtOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Streptomycin",
                "Tetracycline",
                "Chloramphenicol",
                "Ciprofloxacin",
                "Vancomycin",
                "Ampicillin",
                "Amoxicillin",
                "Cephalexin",
                "Trimethoprim",
                "Nitrofurantoin",
                "Metronidazole",
                "Isoniazid",
                "Ethambutol"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Sulfamethoxazole (SMX)",
                "Clindamycin (CLN)",
                "Rifampin (RIF)",
                "Pyrazinamide (PZA)",
                "Triclosan",
                "Chlorhexidine",
                "Hydrogen Peroxide (H2O2)",
                "Ethanol (EtOH)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "S-ethyl-L-cysteine",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "antimycobacterial drug",
                "antitubercular agent",
                "apramycin",
                "arsphenamine",
                "brodimoprim",
                "cefoxitin",
                "ceftazidime",
                "cephalexin",
                "cephalexin monohydrate",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "daptomycin",
                "difloxacin",
                "ergosterol peroxide",
                "ethambutol",
                "ethambutol dihydrochloride",
                "isoniazide",
                "methicillin",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "nalidixic acid",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "oxytetracycline",
                "piperacillin",
                "pyrazine-2-carboxylic acid",
                "pyrazinecarboxamide",
                "rifabutin",
                "rifampicin",
                "rosoxacin",
                "salicylhydroxamic acid",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "teicoplanin",
                "tetracycline",
                "trimethoprim",
                "undecanal",
                "vancomycin",
                "viomycin"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin (PEN)",
            "Tetracycline (TET)",
            "Streptomycin (STR)",
            "Erythromycin (ERY)",
            "Vancomycin (VAN)",
            "Ciprofloxacin (CIP)",
            "Gentamicin (GEN)",
            "Ampicillin (AMP)",
            "Cephalexin (CEP)",
            "Amoxicillin (AMX)",
            "Clindamycin (CLI)",
            "Doxycycline (DOX)",
            "Azithromycin (AZI)",
            "Ceftriaxone (CEF)",
            "Metronidazole (MET)",
            "Chloramphenicol (CHL)",
            "Sulfamethoxazole (SUL)",
            "Trimethoprim (TRI)",
            "Linezolid (LIN)",
            "Meropenem (MER)",
            "Tigecycline (TIG)",
            "Fosfomycin (FOS)",
            "Nitrofurantoin (NIT)",
            "Mupirocin (MUP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tetracycline (TET)",
                "Streptomycin (STR)",
                "Vancomycin (VAN)",
                "Ciprofloxacin (CIP)",
                "Ampicillin (AMP)",
                "Cephalexin (CEP)",
                "Amoxicillin (AMX)",
                "Doxycycline (DOX)",
                "Azithromycin (AZI)",
                "Ceftriaxone (CEF)",
                "Metronidazole (MET)",
                "Chloramphenicol (CHL)",
                "Trimethoprim (TRI)",
                "Linezolid (LIN)",
                "Meropenem (MER)",
                "Tigecycline (TIG)",
                "Nitrofurantoin (NIT)",
                "Mupirocin (MUP)"
            ],
            "mismatches": [
                "Penicillin (PEN)",
                "Erythromycin (ERY)",
                "Gentamicin (GEN)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole (SUL)",
                "Fosfomycin (FOS)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "brodimoprim",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "imipenem",
                "linezolid",
                "meropenem",
                "meropenem trihydrate",
                "metronidazole",
                "metronidazole hydrochloride",
                "mupirocin",
                "mupirocin calcium (anhydrous)",
                "mupirocin calcium hydrate",
                "nalidixic acid",
                "nifurtoinol",
                "nitrofurantoin",
                "nitrofurazone",
                "ornidazole",
                "oxytetracycline",
                "piperacillin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "tigecycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Antibiotic (Penicillin)",
            "Antibiotic (Tetracycline)",
            "Antibiotic (Erythromycin)",
            "Antibiotic (Ciprofloxacin)",
            "Antibiotic (Amoxicillin)",
            "Antibiotic (Metronidazole)",
            "Antibiotic (Cephalexin)",
            "Antibiotic (Azithromycin)",
            "Antibiotic (Clindamycin)",
            "Antibiotic (Gentamicin)",
            "Antibiotic (Ciprofloxacin)",
            "Antibiotic (Sulfamethoxazole)",
            "Antibiotic (Trimethoprim)",
            "Antibiotic (Vancomycin)",
            "Antibiotic (Ceftriaxone)",
            "Antibiotic (Cefotaxime)",
            "Antibiotic (Cefepime)",
            "Antibiotic (Meropenem)",
            "Antibiotic (Imipenem)",
            "Antibiotic (Piperacillin)",
            "Antibiotic (Tobramycin)",
            "Antibiotic (Ciprofloxacin)",
            "Antibiotic (Ofloxacin)",
            "Antibiotic (Norfloxacin)",
            "Antibiotic (Ciprofloxacin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Tetracycline",
                "Ciprofloxacin",
                "Amoxicillin",
                "Metronidazole",
                "Cephalexin",
                "Azithromycin",
                "Trimethoprim",
                "Vancomycin",
                "Ceftriaxone",
                "Cefotaxime",
                "Cefepime",
                "Meropenem",
                "Imipenem",
                "Piperacillin",
                "Ofloxacin",
                "Norfloxacin"
            ],
            "mismatches": [
                "Penicillin",
                "Erythromycin",
                "Clindamycin",
                "Gentamicin",
                "Sulfamethoxazole",
                "Tobramycin"
            ],
            "true_referents": [
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "apramycin",
                "azithromycin",
                "cefazolin",
                "cefepime",
                "cefixime",
                "cefotaxime",
                "ceftazidime",
                "ceftizoxime",
                "ceftriaxone",
                "cephalexin",
                "cephapirin",
                "cethromycin",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "cloxacillin",
                "cyclacillin",
                "difloxacin",
                "imipenem",
                "levofloxacin",
                "meropenem",
                "methacycline",
                "metronidazole",
                "metronidazole hydrochloride",
                "moxifloxacin",
                "nalidixic acid",
                "norfloxacin",
                "ofloxacin",
                "ornidazole",
                "piperacillin",
                "streptomycin",
                "sulfamethazine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin"
            ],
            "TP": 16,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            "Penicillin G (PCG)",
            "Azithromycin (ZIT)",
            "Ciprofloxacin (CPR)",
            "Gentamicin (GEN)",
            "Vancomycin (VAN)",
            "Streptomycin (STR)",
            "Tetracycline (TET)",
            "Doxycycline (DOX)",
            "Chloramphenicol (CHL)",
            "Erythromycin (ERY)",
            "Clindamycin (CLI)",
            "Metronidazole (MTZ)",
            "Amoxicillin (AMX)",
            "Ampicillin (AMP)",
            "Ceftriaxone (CEF)",
            "Cefotaxime (CEF)",
            "Cephalexin (CEP)",
            "Sulfamethoxazole (SMX)",
            "Trimethoprim (TMP)",
            "Rifampicin (RIF)",
            "Isoniazid (INH)",
            "Pyrazinamide (PZA)",
            "Ethambutol (EMB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Azithromycin (ZIT)",
                "Ciprofloxacin (CPR)",
                "Vancomycin (VAN)",
                "Streptomycin (STR)",
                "Tetracycline (TET)",
                "Doxycycline (DOX)",
                "Chloramphenicol (CHL)",
                "Metronidazole (MTZ)",
                "Amoxicillin (AMX)",
                "Ampicillin (AMP)",
                "Ceftriaxone (CEF)",
                "Cefotaxime (CEF)",
                "Cephalexin (CEP)",
                "Trimethoprim (TMP)",
                "Rifampicin (RIF)",
                "Isoniazid (INH)",
                "Ethambutol (EMB)"
            ],
            "mismatches": [
                "Penicillin G (PCG)",
                "Gentamicin (GEN)",
                "Erythromycin (ERY)",
                "Clindamycin (CLI)",
                "Sulfamethoxazole (SMX)",
                "Pyrazinamide (PZA)"
            ],
            "true_referents": [
                "(E)-roxithromycin",
                "(Z)-roxithromycin",
                "amikacin",
                "amoxicillin",
                "ampicillin",
                "antimycobacterial drug",
                "antitubercular agent",
                "apramycin",
                "azithromycin",
                "benzylpenicillin",
                "brodimoprim",
                "cefixime",
                "cefmenoxime",
                "cefotaxime",
                "ceftazidime",
                "ceftiolene",
                "ceftriaxone",
                "cephalexin",
                "cephalexin monohydrate",
                "cephapirin",
                "cethromycin",
                "chloramphenicol",
                "chlortetracycline",
                "ciprofloxacin",
                "ciprofloxacin hydrochloride (anhydrous)",
                "clarithromycin",
                "clomocycline",
                "cloxacillin",
                "co-trimoxazole",
                "cyclacillin",
                "daptomycin",
                "difloxacin",
                "doxycycline",
                "doxycycline hyclate",
                "ethambutol",
                "ethambutol dihydrochloride",
                "isoniazide",
                "metronidazole",
                "metronidazole benzoate",
                "metronidazole hydrochloride",
                "oxytetracycline",
                "piperacillin",
                "pyrazine-2-carboxylic acid",
                "pyrazinecarboxamide",
                "rifabutin",
                "rifampicin",
                "streptomycin",
                "sulfadoxine",
                "sulfaphenazole",
                "sulfisoxazole",
                "tetracycline",
                "trimethoprim",
                "vancomycin",
                "viomycin"
            ],
            "TP": 17,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "antibacterial agent",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Acarbose",
                "Canonical name": "Acarbose"
            },
            {
                "Referent": "Acetic acid",
                "Canonical name": "Acetic acid"
            },
            {
                "Referent": "Acetic anhydride",
                "Canonical name": "Acetic anhydride"
            },
            {
                "Referent": "Acetic acid, sodium salt",
                "Canonical name": "Acetic acid, sodium salt"
            },
            {
                "Referent": "Acetic acid, sodium salt (2:1)",
                "Canonical name": "Acetic acid, sodium salt (2:1)"
            },
            {
                "Referent": "Acetic acid, sodium salt (1:1)",
                "Canonical name": "Acetic acid, sodium salt (1:1)"
            },
            {
                "Referent": "Acetic acid, calcium salt",
                "Canonical name": "Acetic acid, calcium salt"
            },
            {
                "Referent": "Acetic acid, potassium salt",
                "Canonical name": "Acetic acid, potassium salt"
            },
            {
                "Referent": "Acetic acid, ammonium salt",
                "Canonical name": "Acetic acid, ammonium salt"
            },
            {
                "Referent": "Acetic acid, magnesium salt",
                "Canonical name": "Acetic acid, magnesium salt"
            },
            {
                "Referent": "Acetic acid, zinc salt",
                "Canonical name": "Acetic acid, zinc salt"
            },
            {
                "Referent": "Acetic acid, aluminum salt",
                "Canonical name": "Acetic acid, aluminum salt"
            },
            {
                "Referent": "Acetic acid, ammonium chloride",
                "Canonical name": "Acetic acid, ammonium chloride"
            },
            {
                "Referent": "Acetic acid, ammonium acetate",
                "Canonical name": "Acetic acid, ammonium acetate"
            },
            {
                "Referent": "Acetic acid, ammonium formate",
                "Canonical name": "Acetic acid, ammonium formate"
            },
            {
                "Referent": "Acetic acid, ammonium nitrate",
                "Canonical name": "Acetic acid, ammonium nitrate"
            },
            {
                "Referent": "Acetic acid, ammonium phosphate",
                "Canonical name": "Acetic acid, ammonium phosphate"
            },
            {
                "Referent": "Acetic acid, ammonium sulfate",
                "Canonical name": "Acetic acid, ammonium sulfate"
            },
            {
                "Referent": "Acetic acid, sodium acetate",
                "Canonical name": "Acetic acid, sodium acetate"
            },
            {
                "Referent": "Acetic acid, sodium benzoate",
                "Canonical name": "Acetic acid, sodium benzoate"
            },
            {
                "Referent": "Acetic acid, sodium butyrate",
                "Canonical name": "Acetic acid, sodium butyrate"
            },
            {
                "Referent": "Acetic acid, sodium citrate",
                "Canonical name": "Acetic acid, sodium citrate"
            },
            {
                "Referent": "Acetic acid, sodium formate",
                "Canonical name": "Acetic acid, sodium formate"
            },
            {
                "Referent": "Acetic acid, sodium lactate",
                "Canonical name": "Acetic acid, sodium lactate"
            },
            {
                "Referent": "Acetic acid, sodium malonate",
                "Canonical name": "Acetic acid, sodium malonate"
            },
            {
                "Referent": "Acetic acid, sodium propionate",
                "Canonical name": "Acetic acid, sodium propionate"
            },
            {
                "Referent": "Acetic acid, sodium succinate",
                "Canonical name": "Acetic acid, sodium succinate"
            },
            {
                "Referent": "Acetic acid, sodium tartrate",
                "Canonical name": "Acetic acid, sodium tartrate"
            },
            {
                "Referent": "Acetic acid, sodium acetate (1:1)",
                "Canonical name": "Acetic acid, sodium acetate (1:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (2:1)",
                "Canonical name": "Acetic acid, sodium acetate (2:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (3:1)",
                "Canonical name": "Acetic acid, sodium acetate (3:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (4:1)",
                "Canonical name": "Acetic acid, sodium acetate (4:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (5:1)",
                "Canonical name": "Acetic acid, sodium acetate (5:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (6:1)",
                "Canonical name": "Acetic acid, sodium acetate (6:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (7:1)",
                "Canonical name": "Acetic acid, sodium acetate (7:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (8:1)",
                "Canonical name": "Acetic acid, sodium acetate (8:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (9:1)",
                "Canonical name": "Acetic acid, sodium acetate (9:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (10:1)",
                "Canonical name": "Acetic acid, sodium acetate (10:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (11:1)",
                "Canonical name": "Acetic acid, sodium acetate (11:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (12:1)",
                "Canonical name": "Acetic acid, sodium acetate (12:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (13:1)",
                "Canonical name": "Acetic acid, sodium acetate (13:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (14:1)",
                "Canonical name": "Acetic acid, sodium acetate (14:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (15:1)",
                "Canonical name": "Acetic acid, sodium acetate (15:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (16:1)",
                "Canonical name": "Acetic acid, sodium acetate (16:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (17:1)",
                "Canonical name": "Acetic acid, sodium acetate (17:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (18:1)",
                "Canonical name": "Acetic acid, sodium acetate (18:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (19:1)",
                "Canonical name": "Acetic acid, sodium acetate (19:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (20:1)",
                "Canonical name": "Acetic acid, sodium acetate (20:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (21:1)",
                "Canonical name": "Acetic acid, sodium acetate (21:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (22:1)",
                "Canonical name": "Acetic acid, sodium acetate (22:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (23:1)",
                "Canonical name": "Acetic acid, sodium acetate (23:1)"
            },
            {
                "Referent": "Acetic acid, sodium acetate (24:1)",
                "Canonical name": "Acetic acid, sodium acetate (24:1)"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Acarbose",
                "Acetic acid",
                "Acetic anhydride",
                "Acetic acid, sodium salt",
                "Acetic acid, sodium salt (2:1)",
                "Acetic acid, sodium salt (1:1)",
                "Acetic acid, calcium salt",
                "Acetic acid, potassium salt",
                "Acetic acid, ammonium salt",
                "Acetic acid, magnesium salt",
                "Acetic acid, zinc salt",
                "Acetic acid, aluminum salt",
                "Acetic acid, ammonium chloride",
                "Acetic acid, ammonium acetate",
                "Acetic acid, ammonium formate",
                "Acetic acid, ammonium nitrate",
                "Acetic acid, ammonium phosphate",
                "Acetic acid, ammonium sulfate",
                "Acetic acid, sodium acetate",
                "Acetic acid, sodium benzoate",
                "Acetic acid, sodium butyrate",
                "Acetic acid, sodium citrate",
                "Acetic acid, sodium formate",
                "Acetic acid, sodium lactate",
                "Acetic acid, sodium malonate",
                "Acetic acid, sodium propionate",
                "Acetic acid, sodium succinate",
                "Acetic acid, sodium tartrate",
                "Acetic acid, sodium acetate (1:1)",
                "Acetic acid, sodium acetate (2:1)",
                "Acetic acid, sodium acetate (3:1)",
                "Acetic acid, sodium acetate (4:1)",
                "Acetic acid, sodium acetate (5:1)",
                "Acetic acid, sodium acetate (6:1)",
                "Acetic acid, sodium acetate (7:1)",
                "Acetic acid, sodium acetate (8:1)",
                "Acetic acid, sodium acetate (9:1)",
                "Acetic acid, sodium acetate (10:1)",
                "Acetic acid, sodium acetate (11:1)",
                "Acetic acid, sodium acetate (12:1)",
                "Acetic acid, sodium acetate (13:1)",
                "Acetic acid, sodium acetate (14:1)",
                "Acetic acid, sodium acetate (15:1)",
                "Acetic acid, sodium acetate (16:1)",
                "Acetic acid, sodium acetate (17:1)",
                "Acetic acid, sodium acetate (18:1)",
                "Acetic acid, sodium acetate (19:1)",
                "Acetic acid, sodium acetate (20:1)",
                "Acetic acid, sodium acetate (21:1)",
                "Acetic acid, sodium acetate (22:1)",
                "Acetic acid, sodium acetate (23:1)",
                "Acetic acid, sodium acetate (24:1)"
            ],
            "true_referents": [
                "(S)-nadifloxacin",
                "(S)-temafloxacin",
                "2-nitroimidazole",
                "3-nitropropanoic acid",
                "D-cycloserine",
                "arsphenamine",
                "desacetylpyramidaglain D",
                "malachite green cation",
                "pipemidic acid",
                "piromidic acid",
                "salicylhydroxamic acid",
                "scleropyric acid",
                "silver(1+) sulfadiazinate",
                "streptomycin",
                "viomycin(3+)"
            ],
            "TP": 0,
            "FP": 52,
            "FN": 0
        }
    }
]