[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli)",
            "Klebsiella pneumoniae",
            "Pseudomonas aeruginosa",
            "Acinetobacter baumannii",
            "Salmonella enterica",
            "Neisseria gonorrhoeae",
            "Haemophilus influenzae",
            "Moraxella catarrhalis",
            "Legionella pneumophila",
            "Vibrio cholerae",
            "Yersinia pestis",
            "Francisella tularensis",
            "Chlamydia trachomatis",
            "Brucella abortus",
            "Campylobacter jejuni",
            "Bordetella pertussis",
            "Morganella morganii",
            "Serratia marcescens",
            "Proteus mirabilis",
            "Enterobacter cloacae",
            "Citrobacter freundii",
            "Erwinia amylovora",
            "Helicobacter pylori",
            "Pasteurella multocida"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Klebsiella Infections",
                "Pseudomonas Infections",
                "Acinetobacter Infections",
                "Salmonella Infections",
                "Neisseriaceae Infections",
                "Haemophilus Infections",
                "Moraxellaceae Infections",
                "Legionellosis",
                "Vibrio Infections",
                "Yersinia Infections",
                "Tularemia",
                "Chlamydia Infections",
                "Brucellosis",
                "Campylobacter Infections",
                "Bordetella Infections",
                "Serratia Infections",
                "Proteus Infections",
                "Helicobacter Infections",
                "Pasteurella Infections"
            ],
            "mismatches": [
                "Escherichia coli (E. coli)",
                "Morganella morganii",
                "Enterobacter cloacae",
                "Citrobacter freundii",
                "Erwinia amylovora"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Leptospirosis",
                "Melioidosis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Pneumonic Pasteurellosis",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Q Fever",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Scrub Typhus",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Pseudomonas aeruginosa infection",
            "Klebsiella pneumoniae infection",
            "Acinetobacter baumannii infection",
            "Neisseria meningitidis infection",
            "Salmonella enterica infection",
            "Haemophilus influenzae infection",
            "Moraxella catarrhalis infection",
            "Chromobacterium violaceum infection",
            "Legionella pneumophila infection",
            "Burkholderia cepacia complex infection",
            "Neisseria gonorrhoeae infection",
            "Helicobacter pylori infection",
            "Bordetella pertussis infection",
            "Vibrio cholerae infection",
            "Shigella spp. infection",
            "Aeromonas hydrophila infection",
            "Proteus mirabilis infection",
            "Serratia marcescens infection",
            "Yersinia pestis infection",
            "Pasteurella multocida infection",
            "Francisella tularensis infection",
            "Brucella spp. infection",
            "Campylobacter jejuni infection",
            "Mycobacterium tuberculosis infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli (E. coli) infection",
                "Pseudomonas aeruginosa infection",
                "Klebsiella pneumoniae infection",
                "Acinetobacter baumannii infection",
                "Neisseria meningitidis infection",
                "Salmonella enterica infection",
                "Haemophilus influenzae infection",
                "Burkholderia cepacia complex infection",
                "Helicobacter pylori infection",
                "Bordetella pertussis infection",
                "Vibrio cholerae infection",
                "Proteus mirabilis infection",
                "Serratia marcescens infection",
                "Yersinia pestis infection",
                "Pasteurella multocida infection",
                "Francisella tularensis infection",
                "Brucella spp. infection",
                "Campylobacter jejuni infection"
            ],
            "mismatches": [
                "Moraxella catarrhalis infection",
                "Chromobacterium violaceum infection",
                "Legionella pneumophila infection",
                "Neisseria gonorrhoeae infection",
                "Shigella spp. infection",
                "Aeromonas hydrophila infection",
                "Mycobacterium tuberculosis infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Desulfovibrionaceae Infections",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Pneumonic Pasteurellosis",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 18,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Salmonella infection",
            "Shigella infection",
            "Yersinia pestis (plague) infection",
            "Helicobacter pylori infection",
            "Neisseria gonorrhoeae (gonorrhea) infection",
            "Neisseria meningitidis (meningococcal) infection",
            "Klebsiella pneumoniae infection",
            "Pseudomonas aeruginosa infection",
            "Legionella pneumophila (legionnaires' disease) infection",
            "Campylobacter jejuni infection",
            "Vibrio cholerae (cholera) infection",
            "Francisella tularensis (tularemia) infection",
            "Haemophilus influenzae infection",
            "Bordetella pertussis (whooping cough) infection",
            "Brucella spp. (brucellosis) infection",
            "Bartonella henselae (cat-scratch disease) infection",
            "Bacteroides fragilis infection",
            "Fusobacterium nucleatum infection",
            "Prevotella spp. infection",
            "Acinetobacter baumannii infection",
            "Serratia marcescens infection",
            "Proteus mirabilis infection",
            "Morganella morganii infection",
            "Citrobacter spp. infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli Infections",
                "Salmonella Infections",
                "Plague",
                "Helicobacter Infections",
                "Gonorrhea",
                "Meningococcal Infections",
                "Klebsiella Infections",
                "Pseudomonas Infections",
                "Legionnaires' Disease",
                "Campylobacter Infections",
                "Cholera",
                "Tularemia",
                "Haemophilus Infections",
                "Whooping Cough",
                "Brucellosis",
                "Cat-Scratch Disease",
                "Bacteroides Infections",
                "Fusobacterium Infections",
                "Acinetobacter Infections",
                "Serratia Infections",
                "Proteus Infections"
            ],
            "mismatches": [
                "Shigella infection",
                "Klebsiella pneumoniae infection",
                "Brucella spp. (brucellosis) infection",
                "Prevotella spp. infection",
                "Morganella morganii infection",
                "Citrobacter spp. infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacteroidaceae Infections",
                "Bacteroides Infections",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Cat-Scratch Disease",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 21,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli Urinary Tract Infection (E. coli UTI)",
            "Salmonella Gastroenteritis (Salmonella spp.)",
            "Shigella Dysentery (Shigella dysenteriae)",
            "Klebsiella pneumoniae Pneumonia (K. pneumoniae)",
            "Pseudomonas aeruginosa Wound Infection (P. aeruginosa)",
            "Neisseria gonorrhoeae Gonorrhea (N. gonorrhoeae)",
            "Neisseria meningitidis Meningitis (N. meningitidis)",
            "Haemophilus influenzae Meningitis (H. influenzae)",
            "Helicobacter pylori Gastritis (H. pylori)",
            "Vibrio cholerae Cholera (V. cholerae)",
            "Yersinia pestis Plague (Y. pestis)",
            "Legionella pneumophila Legionnaires' Disease (L. pneumophila)",
            "Bordetella pertussis Whooping Cough (B. pertussis)",
            "Proteus mirabilis Catheter-Associated UTI (P. mirabilis)",
            "Enterobacter cloacae Bacteremia (E. cloacae)",
            "Serratia marcescens Pneumonia (S. marcescens)",
            "Acinetobacter baumannii Nosocomial Pneumonia (A. baumannii)",
            "Morganella morganii Wound Infection (M. morganii)",
            "Citrobacter freundii Sepsis (C. freundii)",
            "Campylobacter jejuni Diarrhea (C. jejuni)",
            "Francisella tularensis Tularemia (F. tularensis)",
            "Brucella abortus Brucellosis (B. abortus)",
            "Pasteurella multocida Soft Tissue Infection (P. multocida)",
            "Edwardsiella tarda Wound Infection (E. tarda)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Klebsiella Infections",
                "Pseudomonas Infections",
                "Gonorrhea",
                "Meningococcal Meningitis",
                "Haemophilus Meningitis",
                "Cholera",
                "Plague",
                "Legionnaires' Disease",
                "Whooping Cough",
                "Proteus Infections",
                "Serratia Infections",
                "Acinetobacter Infections",
                "Tularemia",
                "Brucellosis",
                "Pasteurella Infections",
                "Campylobacter Infections"
            ],
            "mismatches": [
                "Escherichia coli Urinary Tract Infection (E. coli UTI)",
                "Salmonella Gastroenteritis (Salmonella spp.)",
                "Shigella Dysentery (Shigella dysenteriae)",
                "Helicobacter pylori Gastritis (H. pylori)",
                "Enterobacter cloacae Bacteremia (E. cloacae)",
                "Morganella morganii Wound Infection (M. morganii)",
                "Citrobacter freundii Sepsis (C. freundii)",
                "Edwardsiella tarda Wound Infection (E. tarda)"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Actinobacillus Infections",
                "Bacillary Dysentery",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydial Pneumonia",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Leptospirosis",
                "Lymphogranuloma Venereum",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Pneumonic Pasteurellosis",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Q Fever",
                "Rickettsial Pneumonia",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Scrub Typhus",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli)",
            "Salmonella enterica",
            "Pseudomonas aeruginosa",
            "Neisseria meningitidis",
            "Neisseria gonorrhoeae",
            "Haemophilus influenzae",
            "Klebsiella pneumoniae",
            "Legionella pneumophila",
            "Bordetella pertussis",
            "Shigella dysenteriae",
            "Vibrio cholerae",
            "Campylobacter jejuni",
            "Helicobacter pylori",
            "Acinetobacter baumannii",
            "Proteus mirabilis",
            "Yersinia pestis",
            "Francisella tularensis",
            "Brucella abortus",
            "Burkholderia cepacia",
            "Moraxella catarrhalis",
            "Serratia marcescens",
            "Enterobacter cloacae",
            "Bacteroides fragilis",
            "Fusobacterium nucleatum"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Salmonella Infections",
                "Pseudomonas Infections",
                "Meningococcal Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Bordetella Infections",
                "Bacillary Dysentery",
                "Cholera",
                "Campylobacter Infections",
                "Helicobacter Infections",
                "Acinetobacter Infections",
                "Proteus Infections",
                "Yersinia Infections",
                "Tularemia",
                "Brucellosis",
                "Burkholderia Infections",
                "Moraxellaceae Infections",
                "Serratia Infections",
                "Bacteroides Infections",
                "Fusobacterium Infections"
            ],
            "mismatches": [
                "Escherichia coli (E. coli)",
                "Francisella tularensis",
                "Enterobacter cloacae"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Bacillary Dysentery",
                "Bacteroidaceae Infections",
                "Bacteroides Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydial Pneumonia",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Leptospirosis",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Plague",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Q Fever",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Scrub Typhus",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections"
            ],
            "TP": 22,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli)",
            "Klebsiella pneumoniae (K. pneumoniae)",
            "Pseudomonas aeruginosa (P. aeruginosa)",
            "Salmonella enterica (S. enterica)",
            "Neisseria gonorrhoeae (N. gonorrhoeae)",
            "Haemophilus influenzae (H. influenzae)",
            "Shigella dysenteriae (S. dysenteriae)",
            "Vibrio cholerae (V. cholerae)",
            "Campylobacter jejuni (C. jejuni)",
            "Acinetobacter baumannii (A. baumannii)",
            "Proteus mirabilis (P. mirabilis)",
            "Serratia marcescens (S. marcescens)",
            "Burkholderia cepacia (B. cepacia)",
            "Legionella pneumophila (L. pneumophila)",
            "Yersinia pestis (Y. pestis)",
            "Francisella tularensis (F. tularensis)",
            "Brucella spp. (Brucella)",
            "Corynebacterium diphtheriae (C. diphtheriae)",
            "Enterobacter cloacae (E. cloacae)",
            "Citrobacter freundii (C. freundii)",
            "Bordetella pertussis (B. pertussis)",
            "Rickettsia rickettsii (R. rickettsii)",
            "Chlamydia trachomatis (C. trachomatis)",
            "Helicobacter pylori (H. pylori)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Klebsiella pneumoniae (K. pneumoniae)",
                "Pseudomonas aeruginosa (P. aeruginosa)",
                "Salmonella enterica (S. enterica)",
                "Neisseria gonorrhoeae (N. gonorrhoeae)",
                "Haemophilus influenzae (H. influenzae)",
                "Shigella dysenteriae (S. dysenteriae)",
                "Vibrio cholerae (V. cholerae)",
                "Campylobacter jejuni (C. jejuni)",
                "Acinetobacter baumannii (A. baumannii)",
                "Proteus mirabilis (P. mirabilis)",
                "Serratia marcescens (S. marcescens)",
                "Burkholderia cepacia (B. cepacia)",
                "Legionella pneumophila (L. pneumophila)",
                "Yersinia pestis (Y. pestis)",
                "Francisella tularensis (F. tularensis)",
                "Brucella spp. (Brucella)",
                "Bordetella pertussis (B. pertussis)",
                "Rickettsia rickettsii (R. rickettsii)",
                "Helicobacter pylori (H. pylori)"
            ],
            "mismatches": [
                "Escherichia coli (E. coli)",
                "Corynebacterium diphtheriae (C. diphtheriae)",
                "Enterobacter cloacae (E. cloacae)",
                "Citrobacter freundii (C. freundii)",
                "Chlamydia trachomatis (C. trachomatis)"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Actinobacillus Infections",
                "Bacillary Dysentery",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chancroid",
                "Chlamydial Pneumonia",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Leptospirosis",
                "Melioidosis",
                "Neisseriaceae Infections",
                "Plague",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Q Fever",
                "Rickettsia Infections",
                "Rickettsiaceae Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Scrub Typhus",
                "Serratia Infections",
                "Spotted Fever Group Rickettsiosis",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Gonorrhea (Neisseria gonorrhoeae)",
            "Cholera (Vibrio cholerae)",
            "Salmonellosis (Salmonella enterica)",
            "Shigellosis (Shigella spp.)",
            "Whooping cough (Bordetella pertussis)",
            "Legionnaires' disease (Legionella pneumophila)",
            "Escherichia coli infection (E. coli)",
            "Pseudomonas aeruginosa infection (P. aeruginosa)",
            "Helicobacter pylori infection (H. pylori)",
            "Campylobacteriosis (Campylobacter jejuni)",
            "Haemophilus influenzae infection (H. influenzae)",
            "Klebsiella pneumoniae infection (K. pneumoniae)",
            "Yersiniosis (Yersinia enterocolitica)",
            "Peptic ulcer disease (Helicobacter pylori)",
            "Typhoid fever (Salmonella Typhi)",
            "Plague (Yersinia pestis)",
            "Brucellosis (Brucella spp.)",
            "Leptospirosis (Leptospira interrogans)",
            "Tularemia (Francisella tularensis)",
            "Meliodosis (Burkholderia pseudomallei)",
            "Pertussis (Bordetella pertussis)",
            "Cat Scratch Disease (Bartonella henselae)",
            "Chancroid (Haemophilus ducreyi)",
            "Syphilis (Treponema pallidum)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Gonorrhea",
                "Cholera",
                "Whooping Cough",
                "Legionnaires' Disease",
                "Escherichia coli Infections",
                "Pseudomonas Infections",
                "Helicobacter Infections",
                "Campylobacter Infections",
                "Haemophilus Infections",
                "Klebsiella Infections",
                "Typhoid Fever",
                "Plague",
                "Brucellosis",
                "Leptospirosis",
                "Tularemia",
                "Cat-Scratch Disease",
                "Chancroid",
                "Syphilis"
            ],
            "mismatches": [
                "Salmonellosis (Salmonella enterica)",
                "Shigellosis (Shigella spp.)",
                "Yersiniosis (Yersinia enterocolitica)",
                "Peptic ulcer disease (Helicobacter pylori)",
                "Meliodosis (Burkholderia pseudomallei)"
            ],
            "true_referents": [
                "Actinobacillosis",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Cat-Scratch Disease",
                "Chancre",
                "Chancroid",
                "Chlamydial Pneumonia",
                "Cholera",
                "Ehrlichiosis",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Latent Syphilis",
                "Legionellosis",
                "Legionnaires' Disease",
                "Lemierre Syndrome",
                "Leptospirosis",
                "Melioidosis",
                "Paratyphoid Fever",
                "Plague",
                "Pseudomonas Infections",
                "Q Fever",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Scrub Typhus",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 18,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli infection",
            "Pseudomonas aeruginosa infection",
            "Klebsiella pneumoniae infection",
            "Acinetobacter baumannii infection",
            "Salmonella infection",
            "Shigella infection",
            "Neisseria meningitidis infection",
            "Helicobacter pylori infection",
            "Legionella pneumophila infection",
            "Moraxella catarrhalis infection",
            "Campylobacter jejuni infection",
            "Bordetella pertussis infection",
            "Haemophilus influenzae infection",
            "Yersinia pestis infection",
            "Vibrio cholerae infection",
            "Francisella tularensis infection",
            "Burkholderia cepacia infection",
            "Brucella infection",
            "Rickettsia prowazekii infection",
            "Treponema pallidum infection",
            "Chlamydia trachomatis infection",
            "Bacteroides fragilis infection",
            "Fusobacterium nucleatum infection",
            "Prevotella intermedia infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli infection",
                "Pseudomonas aeruginosa infection",
                "Klebsiella pneumoniae infection",
                "Acinetobacter baumannii infection",
                "Salmonella infection",
                "Neisseria meningitidis infection",
                "Helicobacter pylori infection",
                "Legionella pneumophila infection",
                "Campylobacter jejuni infection",
                "Bordetella pertussis infection",
                "Haemophilus influenzae infection",
                "Yersinia pestis infection",
                "Vibrio cholerae infection",
                "Francisella tularensis infection",
                "Burkholderia cepacia infection",
                "Brucella infection",
                "Rickettsia prowazekii infection",
                "Treponema pallidum infection",
                "Chlamydia trachomatis infection",
                "Bacteroides fragilis infection",
                "Fusobacterium nucleatum infection"
            ],
            "mismatches": [
                "Shigella infection",
                "Moraxella catarrhalis infection",
                "Prevotella intermedia infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacteroidaceae Infections",
                "Bacteroides Infections",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Desulfovibrionaceae Infections",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Plague",
                "Pseudomonas Infections",
                "Rickettsia Infections",
                "Rickettsiaceae Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Spotted Fever Group Rickettsiosis",
                "Syphilis",
                "Treponemal Infections",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Pseudomonas aeruginosa (P. aeruginosa) infection",
            "Klebsiella pneumoniae (K. pneumoniae) infection",
            "Salmonella enterica infection",
            "Shigella dysenteriae infection",
            "Neisseria gonorrhoeae (N. gonorrhoeae) infection",
            "Neisseria meningitidis (N. meningitidis) infection",
            "Haemophilus influenzae (H. influenzae) infection",
            "Proteus mirabilis infection",
            "Enterobacter cloacae infection",
            "Serratia marcescens infection",
            "Acinetobacter baumannii infection",
            "Vibrio cholerae infection",
            "Legionella pneumophila infection",
            "Yersinia enterocolitica infection",
            "Campylobacter jejuni infection",
            "Bordetella pertussis infection",
            "Francisella tularensis infection",
            "Burkholderia cepacia infection",
            "Aggregatibacter actinomycetemcomitans infection",
            "Bacteroides fragilis infection",
            "Citrobacter freundii infection",
            "Morganella morganii infection",
            "Ralstonia pickettii infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli (E. coli) infection",
                "Pseudomonas aeruginosa (P. aeruginosa) infection",
                "Klebsiella pneumoniae (K. pneumoniae) infection",
                "Neisseria gonorrhoeae (N. gonorrhoeae) infection",
                "Neisseria meningitidis (N. meningitidis) infection",
                "Haemophilus influenzae (H. influenzae) infection",
                "Proteus mirabilis infection",
                "Serratia marcescens infection",
                "Acinetobacter baumannii infection",
                "Vibrio cholerae infection",
                "Legionella pneumophila infection",
                "Yersinia enterocolitica infection",
                "Campylobacter jejuni infection",
                "Bordetella pertussis infection",
                "Francisella tularensis infection",
                "Burkholderia cepacia infection",
                "Bacteroides fragilis infection"
            ],
            "mismatches": [
                "Salmonella enterica infection",
                "Shigella dysenteriae infection",
                "Enterobacter cloacae infection",
                "Aggregatibacter actinomycetemcomitans infection",
                "Citrobacter freundii infection",
                "Morganella morganii infection",
                "Ralstonia pickettii infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacillary Dysentery",
                "Bacteroidaceae Infections",
                "Bacteroides Infections",
                "Bartonella Infections",
                "Bordetella Infections",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Piscirickettsiaceae Infections",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Rocky Mountain Spotted Fever",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Salmonella enterica infection",
            "Klebsiella pneumoniae infection",
            "Pseudomonas aeruginosa infection",
            "Neisseria meningitidis infection",
            "Haemophilus influenzae infection",
            "Legionella pneumophila infection",
            "Vibrio cholerae infection",
            "Helicobacter pylori infection",
            "Campylobacter jejuni infection",
            "Shigella dysenteriae infection",
            "Yersinia pestis infection",
            "Bordetella pertussis infection",
            "Acinetobacter baumannii infection",
            "Proteus mirabilis infection",
            "Serratia marcescens infection",
            "Enterobacter cloacae infection",
            "Citrobacter freundii infection",
            "Moraxella catarrhalis infection",
            "Burkholderia cepacia infection",
            "Francisella tularensis infection",
            "Brucella melitensis infection",
            "Stenotrophomonas maltophilia infection",
            "Providencia stuartii infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli (E. coli) infection",
                "Klebsiella pneumoniae infection",
                "Pseudomonas aeruginosa infection",
                "Neisseria meningitidis infection",
                "Haemophilus influenzae infection",
                "Vibrio cholerae infection",
                "Helicobacter pylori infection",
                "Campylobacter jejuni infection",
                "Shigella dysenteriae infection",
                "Yersinia pestis infection",
                "Bordetella pertussis infection",
                "Acinetobacter baumannii infection",
                "Proteus mirabilis infection",
                "Serratia marcescens infection",
                "Burkholderia cepacia infection",
                "Francisella tularensis infection",
                "Brucella melitensis infection"
            ],
            "mismatches": [
                "Salmonella enterica infection",
                "Legionella pneumophila infection",
                "Enterobacter cloacae infection",
                "Citrobacter freundii infection",
                "Moraxella catarrhalis infection",
                "Stenotrophomonas maltophilia infection",
                "Providencia stuartii infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacillary Dysentery",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Spirochaetales Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Salmonella enterica infection",
            "Klebsiella pneumoniae infection",
            "Pseudomonas aeruginosa infection",
            "Neisseria gonorrhoeae infection",
            "Haemophilus influenzae infection",
            "Legionella pneumophila infection",
            "Campylobacter jejuni infection",
            "Vibrio cholerae infection",
            "Helicobacter pylori infection",
            "Shigella dysenteriae infection",
            "Yersinia pestis infection",
            "Acinetobacter baumannii infection",
            "Bordetella pertussis infection",
            "Brucella abortus infection",
            "Burkholderia cepacia infection",
            "Chlamydia trachomatis infection",
            "Citrobacter freundii infection",
            "Enterobacter cloacae infection",
            "Francisella tularensis infection",
            "Moraxella catarrhalis infection",
            "Proteus mirabilis infection",
            "Serratia marcescens infection",
            "Stenotrophomonas maltophilia infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli Infections",
                "Klebsiella Infections",
                "Pseudomonas Infections",
                "Neisseriaceae Infections",
                "Haemophilus Infections",
                "Legionellosis",
                "Campylobacter Infections",
                "Vibrio Infections",
                "Helicobacter Infections",
                "Bacillary Dysentery",
                "Yersinia Infections",
                "Acinetobacter Infections",
                "Bordetella Infections",
                "Brucellosis",
                "Burkholderia Infections",
                "Chlamydia Infections",
                "Tularemia",
                "Moraxellaceae Infections",
                "Proteus Infections",
                "Serratia Infections"
            ],
            "mismatches": [
                "Salmonella enterica infection",
                "Citrobacter freundii infection",
                "Enterobacter cloacae infection",
                "Stenotrophomonas maltophilia infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacillary Dysentery",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Salmonella enterica infection",
            "Pseudomonas aeruginosa infection",
            "Klebsiella pneumoniae infection",
            "Acinetobacter baumannii infection",
            "Helicobacter pylori infection",
            "Legionella pneumophila infection",
            "Neisseria gonorrhoeae infection",
            "Haemophilus influenzae infection",
            "Shigella dysenteriae infection",
            "Yersinia pestis infection",
            "Vibrio cholerae infection",
            "Campylobacter jejuni infection",
            "Bordetella pertussis infection",
            "Brucella abortus infection",
            "Francisella tularensis infection",
            "Burkholderia cepacia infection",
            "Stenotrophomonas maltophilia infection",
            "Aeromonas hydrophila infection",
            "Proteus mirabilis infection",
            "Serratia marcescens infection",
            "Enterobacter cloacae infection",
            "Citrobacter freundii infection",
            "Morganella morganii infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli (E. coli) infection",
                "Pseudomonas aeruginosa infection",
                "Klebsiella pneumoniae infection",
                "Acinetobacter baumannii infection",
                "Helicobacter pylori infection",
                "Legionella pneumophila infection",
                "Neisseria gonorrhoeae infection",
                "Haemophilus influenzae infection",
                "Shigella dysenteriae infection",
                "Yersinia pestis infection",
                "Vibrio cholerae infection",
                "Campylobacter jejuni infection",
                "Bordetella pertussis infection",
                "Brucella abortus infection",
                "Francisella tularensis infection",
                "Burkholderia cepacia infection",
                "Proteus mirabilis infection",
                "Serratia marcescens infection"
            ],
            "mismatches": [
                "Salmonella enterica infection",
                "Stenotrophomonas maltophilia infection",
                "Aeromonas hydrophila infection",
                "Enterobacter cloacae infection",
                "Citrobacter freundii infection",
                "Morganella morganii infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacillary Dysentery",
                "Bartonella Infections",
                "Bordetella Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Plague",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Whooping Cough",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) Infection",
            "Salmonella Typhimurium Infection",
            "Pseudomonas aeruginosa Infection",
            "Klebsiella pneumoniae Infection",
            "Acinetobacter baumannii Infection",
            "Neisseria gonorrhoeae Infection",
            "Helicobacter pylori Infection",
            "Shigella dysenteriae Infection",
            "Legionella pneumophila Infection",
            "Campylobacter jejuni Infection",
            "Burkholderia cepacia Infection",
            "Haemophilus influenzae Infection",
            "Vibrio cholerae Infection",
            "Proteus mirabilis Infection",
            "Serratia marcescens Infection",
            "Enterobacter cloacae Infection",
            "Stenotrophomonas maltophilia Infection",
            "Citrobacter freundii Infection",
            "Morganella morganii Infection",
            "Providencia stuartii Infection",
            "Yersinia enterocolitica Infection",
            "Pasteurella multocida Infection",
            "Moraxella catarrhalis Infection",
            "Eikenella corrodens Infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli (E. coli) Infection",
                "Pseudomonas aeruginosa Infection",
                "Klebsiella pneumoniae Infection",
                "Acinetobacter baumannii Infection",
                "Helicobacter pylori Infection",
                "Legionella pneumophila Infection",
                "Campylobacter jejuni Infection",
                "Burkholderia cepacia Infection",
                "Haemophilus influenzae Infection",
                "Vibrio cholerae Infection",
                "Proteus mirabilis Infection",
                "Serratia marcescens Infection",
                "Pasteurella multocida Infection"
            ],
            "mismatches": [
                "Salmonella Typhimurium Infection",
                "Neisseria gonorrhoeae Infection",
                "Shigella dysenteriae Infection",
                "Enterobacter cloacae Infection",
                "Stenotrophomonas maltophilia Infection",
                "Citrobacter freundii Infection",
                "Morganella morganii Infection",
                "Providencia stuartii Infection",
                "Yersinia enterocolitica Infection",
                "Moraxella catarrhalis Infection",
                "Eikenella corrodens Infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Bacillary Dysentery",
                "Bartonella Infections",
                "Bartonellaceae Infections",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Fusobacterium Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Pasteurella Infections",
                "Pasteurellaceae Infections",
                "Pneumonic Pasteurellosis",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Spirochaetales Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) urinary tract infection",
            "Salmonella typhi typhoid fever",
            "Pseudomonas aeruginosa pneumonia",
            "Klebsiella pneumoniae septicemia",
            "Haemophilus influenzae meningitis",
            "Neisseria meningitidis meningitis",
            "Francisella tularensis tularemia",
            "Yersinia pestis plague",
            "Legionella pneumophila Legionnaires' disease",
            "Burkholderia pseudomallei melioidosis",
            "Acinetobacter baumannii nosocomial infection",
            "Enterobacter cloacae septicemia",
            "Proteus mirabilis urinary tract infection",
            "Vibrio vulnificus wound infection",
            "Francisella novicida Francisella-like agent",
            "Brucella suis brucellosis",
            "Brucella melitensis brucellosis",
            "Francisella philomiragia Francisella-like agent",
            "Acinetobacter calcoaceticus-Acinetobacter baumannii complex nosocomial infection",
            "Burkholderia mallei melioidosis",
            "Klebsiella oxytoca urinary tract infection",
            "Pseudomonas fluorescens wound infection",
            "Haemophilus parainfluenzae otitis media",
            "Neisseria gonorrhoeae gonorrhea",
            "Francisella tularensis subspecies novicida tularemia"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Brucellosis",
                "Gonorrhea",
                "Haemophilus Meningitis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Plague",
                "Tularemia",
                "Typhoid Fever"
            ],
            "mismatches": [
                "Escherichia coli (E. coli) urinary tract infection",
                "Salmonella typhi typhoid fever",
                "Pseudomonas aeruginosa pneumonia",
                "Klebsiella pneumoniae septicemia",
                "Francisella tularensis tularemia",
                "Yersinia pestis plague",
                "Burkholderia pseudomallei melioidosis",
                "Acinetobacter baumannii nosocomial infection",
                "Enterobacter cloacae septicemia",
                "Proteus mirabilis urinary tract infection",
                "Vibrio vulnificus wound infection",
                "Francisella novicida Francisella-like agent",
                "Francisella philomiragia Francisella-like agent",
                "Acinetobacter calcoaceticus-Acinetobacter baumannii complex nosocomial infection",
                "Burkholderia mallei melioidosis",
                "Klebsiella oxytoca urinary tract infection",
                "Pseudomonas fluorescens wound infection",
                "Haemophilus parainfluenzae otitis media",
                "Neisseria gonorrhoeae gonorrhea",
                "Francisella tularensis subspecies novicida tularemia"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Actinobacillus Infections",
                "Aliivibrio Infections",
                "Bartonellaceae Infections",
                "Bovine Brucellosis",
                "Brucellosis",
                "Burkholderia Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Desulfovibrionaceae Infections",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacteriaceae Infections",
                "Gonorrhea",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Hemorrhagic Septicemia",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Lymphogranuloma Venereum",
                "Melioidosis",
                "Meningococcal Infections",
                "Meningococcal Meningitis",
                "Moraxellaceae Infections",
                "Neisseriaceae Infections",
                "Paratyphoid Fever",
                "Plague",
                "Pneumonic Pasteurellosis",
                "Proteus Infections",
                "Pseudomonas Infections",
                "Salmonella Infections",
                "Serratia Infections",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 8,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            "Escherichia coli (E. coli) infection",
            "Pseudomonas aeruginosa infection",
            "Klebsiella pneumoniae infection",
            "Acinetobacter baumannii infection",
            "Haemophilus influenzae infection",
            "Salmonella enterica infection",
            "Shigella flexneri infection",
            "Francisella tularensis infection",
            "Vibrio cholerae infection",
            "Campylobacter jejuni infection",
            "Helicobacter pylori infection",
            "Legionella pneumophila infection",
            "Bacteroides fragilis infection",
            "Porphyromonas gingivitis infection",
            "Prevotella intermedia infection",
            "Capnocytophaga canimorsus infection",
            "Chromobacterium violaceum infection",
            "Yersinia pestis infection",
            "Aeromonas hydrophila infection",
            "Edwardsiella tarda infection",
            "Stenotrophomonas maltophilia infection",
            "Burkholderia pseudomallei infection",
            "Burkholderia mallei infection",
            "Ralstonia pickettii infection"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Escherichia coli (E. coli) infection",
                "Pseudomonas aeruginosa infection",
                "Klebsiella pneumoniae infection",
                "Acinetobacter baumannii infection",
                "Haemophilus influenzae infection",
                "Salmonella enterica infection",
                "Vibrio cholerae infection",
                "Campylobacter jejuni infection",
                "Helicobacter pylori infection",
                "Legionella pneumophila infection",
                "Bacteroides fragilis infection",
                "Yersinia pestis infection",
                "Burkholderia pseudomallei infection"
            ],
            "mismatches": [
                "Shigella flexneri infection",
                "Francisella tularensis infection",
                "Porphyromonas gingivitis infection",
                "Prevotella intermedia infection",
                "Capnocytophaga canimorsus infection",
                "Chromobacterium violaceum infection",
                "Aeromonas hydrophila infection",
                "Edwardsiella tarda infection",
                "Stenotrophomonas maltophilia infection",
                "Burkholderia mallei infection",
                "Ralstonia pickettii infection"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillus Infections",
                "Animal Salmonella Infections",
                "Bacteroidaceae Infections",
                "Bacteroides Infections",
                "Bartonella Infections",
                "Burkholderia Infections",
                "Campylobacter Infections",
                "Chlamydial Pneumonia",
                "Chlamydophila Infections",
                "Cholera",
                "Cytophagaceae Infections",
                "Desulfovibrionaceae Infections",
                "Enterobacteriaceae Infections",
                "Escherichia coli Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Fusobacterium Infections",
                "Haemophilus Infections",
                "Haemophilus Meningitis",
                "Helicobacter Infections",
                "Klebsiella Infections",
                "Legionellosis",
                "Legionnaires' Disease",
                "Melioidosis",
                "Moraxellaceae Infections",
                "Necrotizing Ulcerative Gingivitis",
                "Piscirickettsiaceae Infections",
                "Plague",
                "Pseudomonas Infections",
                "Rocky Mountain Spotted Fever",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Syphilis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Yersinia Infections",
                "Yersinia pseudotuberculosis Infections"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "Gram-negative bacterial infection",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Acinetobacter baumannii (AB)",
                "Canonical Name": "Acinetobacter baumannii"
            },
            {
                "Referent": "Burkholderia cepacia (BC)",
                "Canonical Name": "Burkholderia cepacia"
            },
            {
                "Referent": "Burkholderia pseudomallei (BP)",
                "Canonical Name": "Burkholderia pseudomallei"
            },
            {
                "Referent": "Chromobacterium violaceum (CV)",
                "Canonical Name": "Chromobacterium violaceum"
            },
            {
                "Referent": "Enterobacter aerogenes (EA)",
                "Canonical Name": "Enterobacter aerogenes"
            },
            {
                "Referent": "Escherichia coli (EC)",
                "Canonical Name": "Escherichia coli"
            },
            {
                "Referent": "Klebsiella pneumoniae (KP)",
                "Canonical Name": "Klebsiella pneumoniae"
            },
            {
                "Referent": "Pseudomonas aeruginosa (PA)",
                "Canonical Name": "Pseudomonas aeruginosa"
            },
            {
                "Referent": "Salmonella enterica (SE)",
                "Canonical Name": "Salmonella enterica"
            },
            {
                "Referent": "Serratia marcescens (SM)",
                "Canonical Name": "Serratia marcescens"
            },
            {
                "Referent": "Vibrio cholerae (VC)",
                "Canonical Name": "Vibrio cholerae"
            },
            {
                "Referent": "Xanthomonas campestris (XC)",
                "Canonical Name": "Xanthomonas campestris"
            },
            {
                "Referent": "Yersinia enterocolitica (YE)",
                "Canonical Name": "Yersinia enterocolitica"
            },
            {
                "Referent": "Acinetobacter baumannii (AB)",
                "Canonical Name": "Acinetobacter baumannii"
            },
            {
                "Referent": "Burkholderia cepacia (BC)",
                "Canonical Name": "Burkholderia cepacia"
            },
            {
                "Referent": "Burkholderia pseudomallei (BP)",
                "Canonical Name": "Burkholderia pseudomallei"
            },
            {
                "Referent": "Chromobacterium violaceum (CV)",
                "Canonical Name": "Chromobacterium violaceum"
            },
            {
                "Referent": "Enterobacter aerogenes (EA)",
                "Canonical Name": "Enterobacter aerogenes"
            },
            {
                "Referent": "Escherichia coli (EC)",
                "Canonical Name": "Escherichia coli"
            },
            {
                "Referent": "Klebsiella pneumoniae (KP)",
                "Canonical Name": "Klebsiella pneumoniae"
            },
            {
                "Referent": "Pseudomonas aeruginosa (PA)",
                "Canonical Name": "Pseudomonas aeruginosa"
            },
            {
                "Referent": "Salmonella enterica (SE)",
                "Canonical Name": "Salmonella enterica"
            },
            {
                "Referent": "Serratia marcescens (SM)",
                "Canonical Name": "Serratia marcescens"
            },
            {
                "Referent": "Vibrio cholerae (VC)",
                "Canonical Name": "Vibrio cholerae"
            },
            {
                "Referent": "Xanthomonas campestris (XC)",
                "Canonical Name": "Xanthomonas campestris"
            },
            {
                "Referent": "Yersinia enterocolitica (YE)",
                "Canonical Name": "Yersinia enterocolitica"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Acinetobacter baumannii",
                "Burkholderia cepacia",
                "Burkholderia pseudomallei",
                "Chromobacterium violaceum",
                "Enterobacter aerogenes",
                "Escherichia coli",
                "Klebsiella pneumoniae",
                "Pseudomonas aeruginosa",
                "Salmonella enterica",
                "Serratia marcescens",
                "Vibrio cholerae",
                "Xanthomonas campestris",
                "Yersinia enterocolitica"
            ],
            "true_referents": [
                "Acinetobacter Infections",
                "Actinobacillosis",
                "Burkholderia Infections",
                "Chancre",
                "Chlamydial Pneumonia",
                "Cholera",
                "Enterobacteriaceae Infections",
                "Escherichia coli Meningitis",
                "Flavobacteriaceae Infections",
                "Gonorrhea",
                "Klebsiella Infections",
                "Leptospirosis",
                "Melioidosis",
                "Moraxellaceae Infections",
                "Pseudomonas Infections",
                "Salmonella Food Poisoning",
                "Salmonella Infections",
                "Serratia Infections",
                "Syphilis",
                "Tabes Dorsalis",
                "Tularemia",
                "Typhoid Fever",
                "Vibrio Infections",
                "Yersinia Infections"
            ],
            "TP": 0,
            "FP": 13,
            "FN": 0
        }
    }
]