[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Herpes Simplex Virus (HSV)",
            "Human Papillomavirus (HPV)",
            "Adenovirus",
            "Smallpox Virus (Variola virus)",
            "Epstein-Barr Virus (EBV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
            "Cytomegalovirus (CMV)",
            "Varicella-Zoster Virus (VZV)",
            "Adeno-Associated Virus (AAV)",
            "Bovine Papillomavirus",
            "Polyomavirus",
            "Simian Virus 40 (SV40)",
            "Molluscum Contagiosum Virus (MCV)",
            "Murine Cytomegalovirus (MCMV)",
            "Pseudorabies Virus (PRV)",
            "Baculovirus",
            "Autographa californica Multiple Nucleopolyhedrovirus (AcMNPV)",
            "Deerpox Virus",
            "Ovine Pulmonary Adenocarcinoma Virus (OPAV)",
            "Canine Herpesvirus (CHV)",
            "Beak and Feather Disease Virus (BFDV)",
            "Avian Sarcoma Leukosis Virus (ASLV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Human Herpesvirus 6 (HHV-6)",
                "Human Herpesvirus 7 (HHV-7)",
                "Cytomegalovirus (CMV)",
                "Polyomavirus",
                "Simian Virus 40 (SV40)",
                "Molluscum Contagiosum Virus (MCV)"
            ],
            "mismatches": [
                "Herpes Simplex Virus (HSV)",
                "Human Papillomavirus (HPV)",
                "Adenovirus",
                "Smallpox Virus (Variola virus)",
                "Epstein-Barr Virus (EBV)",
                "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
                "Varicella-Zoster Virus (VZV)",
                "Adeno-Associated Virus (AAV)",
                "Bovine Papillomavirus",
                "Murine Cytomegalovirus (MCMV)",
                "Pseudorabies Virus (PRV)",
                "Baculovirus",
                "Autographa californica Multiple Nucleopolyhedrovirus (AcMNPV)",
                "Deerpox Virus",
                "Ovine Pulmonary Adenocarcinoma Virus (OPAV)",
                "Canine Herpesvirus (CHV)",
                "Beak and Feather Disease Virus (BFDV)",
                "Avian Sarcoma Leukosis Virus (ASLV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "Aviadenovirus",
                "Avihepadnavirus",
                "Baculoviridae",
                "Betapapillomavirus",
                "Bocavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canid Herpesvirus 1",
                "Canine Parvovirus",
                "Chicken anemia virus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Fowl adenovirus A",
                "Gallid Herpesvirus 1",
                "Geminiviridae",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human papillomavirus 16",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Nucleopolyhedroviruses",
                "Orthopoxvirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Poxviridae",
                "Pseudocowpox Virus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Human Cytomegalovirus (HCMV)",
            "Papillomavirus (HPV)",
            "Polyomavirus (PyV)",
            "Baculovirus",
            "Parvovirus B19",
            "Hepadnavirus (HBV)",
            "Poxvirus",
            "Anellovirus",
            "Circovirus",
            "Geminivirus",
            "Bacteriophage T4",
            "Bacteriophage Lambda",
            "Bacteriophage M13",
            "Bacteriophage T7",
            "Bacteriophage P1",
            "Bacteriophage T3",
            "Bacteriophage T5",
            "Bacteriophage Mu"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bacteriophage T4",
                "Bacteriophage M13",
                "Bacteriophage T7",
                "Bacteriophage P1",
                "Bacteriophage T3",
                "Bacteriophage mu",
                "Bacteriophage lambda"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Cytomegalovirus (HCMV)",
                "Papillomavirus (HPV)",
                "Polyomavirus (PyV)",
                "Baculovirus",
                "Parvovirus B19",
                "Hepadnavirus (HBV)",
                "Poxvirus",
                "Anellovirus",
                "Circovirus",
                "Geminivirus",
                "Bacteriophage T5"
            ],
            "true_referents": [
                "Adenoviridae",
                "Anelloviridae",
                "Ascoviridae",
                "Bacteriophage IKe",
                "Bacteriophage M13",
                "Bacteriophage N4",
                "Bacteriophage P1",
                "Bacteriophage P2",
                "Bacteriophage Pf1",
                "Bacteriophage T3",
                "Bacteriophage T4",
                "Bacteriophage T7",
                "Bacteriophage lambda",
                "Bacteriophage mu",
                "Baculoviridae",
                "Begomovirus",
                "Circoviridae",
                "Circovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Geminiviridae",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Roseolovirus",
                "Vaccinia virus",
                "Varicellovirus"
            ],
            "TP": 7,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Kaposi's Sarcoma-Associated Herpesvirus (KSHV)",
            "Human Herpesvirus 8 (HHV-8)",
            "Poxvirus",
            "Molluscum Contagiosum Virus (MCV)",
            "Parvovirus B19",
            "Papillomavirus",
            "Human Papillomavirus (HPV)",
            "Adeno-associated Virus (AAV)",
            "Hepatitis B Virus (HBV)",
            "Polyomavirus",
            "Simian Virus 40 (SV40)",
            "Baculovirus",
            "African Swine Fever Virus (ASFV)",
            "Pseudorabies Virus (PRV)",
            "Mimivirus",
            "Pithovirus",
            "Asfivirus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus (CMV)",
                "Human Herpesvirus 6 (HHV-6)",
                "Human Herpesvirus 7 (HHV-7)",
                "Human Herpesvirus 8 (HHV-8)",
                "Molluscum Contagiosum Virus (MCV)",
                "Parvovirus B19",
                "Polyomavirus",
                "Simian Virus 40 (SV40)",
                "African Swine Fever Virus (ASFV)"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Kaposi's Sarcoma-Associated Herpesvirus (KSHV)",
                "Poxvirus",
                "Papillomavirus",
                "Human Papillomavirus (HPV)",
                "Adeno-associated Virus (AAV)",
                "Hepatitis B Virus (HBV)",
                "Baculovirus",
                "Pseudorabies Virus (PRV)",
                "Mimivirus",
                "Pithovirus",
                "Asfivirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "Baculoviridae",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fowl adenovirus A",
                "Geminiviridae",
                "Granulovirus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Mimiviridae",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Orf virus",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Pseudocowpox Virus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Siphoviridae",
                "Vaccinia virus",
                "Varicellovirus",
                "Woodchuck Hepatitis B Virus",
                "Xipapillomavirus"
            ],
            "TP": 9,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Papillomavirus (HPV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Human Herpesvirus 8 (HHV-8)",
            "Poxviridae family viruses (Poxviridae)",
            "Baculoviruses (Bac)",
            "Asfarviridae family viruses (Asfarviridae)",
            "Iridoviruses (Iri)",
            "Polyomavirus (Poly)",
            "Merkel Cell Polyomavirus (MCPyV)",
            "JC Virus (JCV)",
            "BK Virus (BKV)",
            "African swine fever virus (ASFV)",
            "Feline herpesvirus 1 (FHV-1)",
            "Bovine herpesvirus 1 (BHV-1)",
            "Equine herpesvirus 1 (EHV-1)",
            "Molluscipoxvirus (MPV)",
            "Yaba monkey tumor virus (YMTV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Polyomavirus",
                "Merkel cell polyomavirus",
                "JC Virus",
                "BK Virus",
                "Bovine Herpesvirus 1",
                "Equid Herpesvirus 1",
                "Molluscipoxvirus",
                "Yaba monkey tumor virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Papillomavirus (HPV)",
                "Poxviridae family viruses (Poxviridae)",
                "Baculoviruses (Bac)",
                "Asfarviridae family viruses (Asfarviridae)",
                "Iridoviruses (Iri)",
                "African swine fever virus (ASFV)",
                "Feline herpesvirus 1 (FHV-1)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Ascoviridae",
                "Asfarviridae",
                "BK Virus",
                "Baculoviridae",
                "Bovine Herpesvirus 1",
                "Bovine Herpesvirus 5",
                "Circoviridae",
                "Cytomegalovirus",
                "Equid Herpesvirus 1",
                "Equid Herpesvirus 3",
                "Equid Herpesvirus 4",
                "Geminiviridae",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human papillomavirus 16",
                "Inovirus",
                "Iridoviridae",
                "Iridovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nucleopolyhedroviruses",
                "Orf virus",
                "Polyomaviridae",
                "Polyomavirus",
                "Poxviridae",
                "Rudiviridae",
                "Vaccinia virus",
                "Varicellovirus",
                "Yaba monkey tumor virus",
                "Yatapoxvirus"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus (HSV)",
            "Varicella Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Papillomavirus (HPV)",
            "Parvovirus B19",
            "Hepatitis B Virus (HBV)",
            "Molluscum Contagiosum Virus (MCV)",
            "Simian Virus 40 (SV40)",
            "Baculovirus",
            "Polyomavirus",
            "Torque Teno Virus (TTV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
            "Merkel Cell Polyomavirus (MCPyV)",
            "Human Cytomegalovirus (HCMV)",
            "Bovine Papillomavirus (BPV)",
            "Canine Adenovirus",
            "Feline Herpesvirus",
            "Equine Herpesvirus",
            "Porcine Circovirus",
            "African Swine Fever Virus (ASFV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Merkel cell polyomavirus",
                "Simian virus 40",
                "Polyomavirus",
                "Torque teno virus",
                "Human papillomavirus 16",
                "Human Parvovirus B19",
                "Hepatitis B virus",
                "Molluscum contagiosum virus",
                "African Swine Fever Virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus (HSV)",
                "Varicella Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Cytomegalovirus (HCMV)",
                "Bovine Papillomavirus (BPV)",
                "Canine Adenovirus",
                "Feline Herpesvirus",
                "Equine Herpesvirus",
                "Porcine Circovirus",
                "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
                "Baculovirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "Baculoviridae",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Adenoviruses",
                "Canine Parvovirus",
                "Circoviridae",
                "Circovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Equid Herpesvirus 1",
                "Equid Herpesvirus 3",
                "Equid Herpesvirus 4",
                "Fowl adenovirus A",
                "Geminiviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Orf virus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Torque teno virus",
                "Vaccinia virus",
                "Varicellovirus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes simplex virus (HSV)",
            "Varicella-zoster virus (VZV)",
            "Human papillomavirus (HPV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Poxvirus (e.g., Variola virus)",
            "Adeno-associated virus (AAV)",
            "Bacillus Calmette-Gu\u00e9rin (BCG) virus",
            "African swine fever virus (ASFV)",
            "Molluscum contagiosum virus (MCV)",
            "Human adenovirus C (HAdV-C)",
            "Canine adenovirus (CAV)",
            "Fowlpox virus (FPV)",
            "Lymphocytic choriomeningitis virus (LCMV)",
            "Bovine papillomavirus (BPV)",
            "Simian virus 40 (SV40)",
            "Porcine circovirus (PCV)",
            "Human herpesvirus 6 (HHV-6)",
            "Rhesus monkey rhadinovirus (RRV)",
            "Caprine arthritis encephalitis virus (CAEV)",
            "Feline herpesvirus (FHV)",
            "Equine herpesvirus (EHV)",
            "Avian leukosis virus (ALV)",
            "Infectious bursal disease virus (IBDV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Varicella-zoster virus (VZV)",
                "Cytomegalovirus (CMV)",
                "African swine fever virus (ASFV)",
                "Molluscum contagiosum virus (MCV)",
                "Canine adenovirus (CAV)",
                "Fowlpox virus (FPV)",
                "Simian virus 40 (SV40)",
                "Human herpesvirus 6 (HHV-6)"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes simplex virus (HSV)",
                "Human papillomavirus (HPV)",
                "Epstein-Barr virus (EBV)",
                "Poxvirus (e.g., Variola virus)",
                "Adeno-associated virus (AAV)",
                "Bacillus Calmette-Gu\u00e9rin (BCG) virus",
                "Human adenovirus C (HAdV-C)",
                "Lymphocytic choriomeningitis virus (LCMV)",
                "Bovine papillomavirus (BPV)",
                "Porcine circovirus (PCV)",
                "Rhesus monkey rhadinovirus (RRV)",
                "Caprine arthritis encephalitis virus (CAEV)",
                "Feline herpesvirus (FHV)",
                "Equine herpesvirus (EHV)",
                "Avian leukosis virus (ALV)",
                "Infectious bursal disease virus (IBDV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "Avipoxvirus",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Adenoviruses",
                "Canine Parvovirus",
                "Capripoxvirus",
                "Chicken anemia virus",
                "Circoviridae",
                "Circovirus",
                "Cytomegalovirus",
                "Equid Herpesvirus 1",
                "Equid Herpesvirus 3",
                "Equid Herpesvirus 4",
                "Fowl adenovirus A",
                "Fowlpox virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human papillomavirus 16",
                "Inovirus",
                "Lymphocryptovirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Ranid Herpesvirus 1",
                "Rhadinovirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus"
            ],
            "TP": 8,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Baculovirus (BV)",
            "Epstein-Barr virus (EBV)",
            "Herpes simplex virus (HSV)",
            "Varicella zoster virus (VZV)",
            "Cytomegalovirus (CMV)",
            "Human herpesvirus 6 (HHV-6)",
            "Human herpesvirus 7 (HHV-7)",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Human herpesvirus 8 (HHV-8)",
            "Molluscum contagiosum virus (MCV)",
            "Orf virus (ORFV)",
            "Parvovirus B19 (B19V)",
            "Human papillomavirus (HPV)",
            "Hepatitis B virus (HBV)",
            "Polyomavirus (PyV)",
            "Simian Virus 40 (SV40)",
            "JC virus (JCV)",
            "Monkeypox virus (MPXV)",
            "Cowpox virus (CPXV)",
            "Vaccinia virus (VV)",
            "Canarypox virus (CNPV)",
            "Fowlpox virus (FPV)",
            "Swinepox virus (SPV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Molluscum contagiosum virus",
                "Orf virus",
                "Human Parvovirus B19",
                "Hepatitis B virus",
                "Polyomavirus",
                "Simian virus 40",
                "JC Virus",
                "Monkeypox virus",
                "Cowpox virus",
                "Vaccinia virus",
                "Canarypox virus",
                "Fowlpox virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Baculovirus (BV)",
                "Epstein-Barr virus (EBV)",
                "Herpes simplex virus (HSV)",
                "Varicella zoster virus (VZV)",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Human papillomavirus (HPV)",
                "Swinepox virus (SPV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "Avipoxvirus",
                "BK Virus",
                "Baculoviridae",
                "Begomovirus",
                "Canarypox virus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fowl adenovirus A",
                "Fowlpox virus",
                "Geminiviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Orthopoxvirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Suipoxvirus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Influenza virus (FLU)",
            "Herpes simplex virus (HSV)",
            "Human immunodeficiency virus (HIV)",
            "Hepatitis B virus (HBV)",
            "Varicella-zoster virus (VZV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Papillomavirus (HPV)",
            "Adenovirus (AdV)",
            "Rotavirus (RV)",
            "Measles virus (MV)",
            "Mumps virus (MuV)",
            "Rubella virus (RV)",
            "Poliovirus (PV)",
            "Rhinovirus (RV)",
            "Coronavirus (CoV)",
            "Ebola virus (EBOV)",
            "Zika virus (ZIKV)",
            "Dengue virus (DENV)",
            "West Nile virus (WNV)",
            "Hantavirus (HantV)",
            "Rabies virus (RABV)",
            "Norovirus (NoV)",
            "SARS-CoV-2"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis B virus",
                "Cytomegalovirus"
            ],
            "mismatches": [
                "Influenza virus (FLU)",
                "Herpes simplex virus (HSV)",
                "Human immunodeficiency virus (HIV)",
                "Varicella-zoster virus (VZV)",
                "Epstein-Barr virus (EBV)",
                "Papillomavirus (HPV)",
                "Adenovirus (AdV)",
                "Rotavirus (RV)",
                "Measles virus (MV)",
                "Mumps virus (MuV)",
                "Rubella virus (RV)",
                "Poliovirus (PV)",
                "Rhinovirus (RV)",
                "Coronavirus (CoV)",
                "Ebola virus (EBOV)",
                "Zika virus (ZIKV)",
                "Dengue virus (DENV)",
                "West Nile virus (WNV)",
                "Hantavirus (HantV)",
                "Rabies virus (RABV)",
                "Norovirus (NoV)",
                "SARS-CoV-2"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "BK Virus",
                "Badnavirus",
                "Bocavirus",
                "Cytomegalovirus",
                "Densovirus",
                "Duck Hepatitis B Virus",
                "Gyrovirus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human papillomavirus 16",
                "Inoviridae",
                "Inovirus",
                "Mardivirus",
                "Microvirus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nudiviridae",
                "Orf virus",
                "Papillomaviridae",
                "Parvovirus",
                "Polyomavirus",
                "Rudiviridae",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes simplex virus type 1 (HSV-1)",
            "Herpes simplex virus type 2 (HSV-2)",
            "Varicella-zoster virus (VZV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human papillomavirus (HPV)",
            "Hepatitis B virus (HBV)",
            "JC virus (Human polyomavirus JC)",
            "BK virus (Human polyomavirus BK)",
            "Parvovirus B19",
            "Vaccinia virus",
            "Variola virus",
            "Monkeypox virus",
            "Molluscum contagiosum virus",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Marek's disease virus",
            "Bovine papillomavirus",
            "Simian virus 40 (SV40)",
            "Duck hepatitis B virus",
            "Torque teno virus (TTV)",
            "Canine parvovirus",
            "Feline panleukopenia virus",
            "Pseudorabies virus (PRV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Hepatitis B virus",
                "JC Virus",
                "BK Virus",
                "Vaccinia virus",
                "Variola virus",
                "Monkeypox virus",
                "Molluscum contagiosum virus",
                "Simian virus 40",
                "Duck Hepatitis B Virus",
                "Torque teno virus",
                "Canine Parvovirus",
                "Feline Panleukopenia Virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes simplex virus type 1 (HSV-1)",
                "Herpes simplex virus type 2 (HSV-2)",
                "Varicella-zoster virus (VZV)",
                "Epstein-Barr virus (EBV)",
                "Human papillomavirus (HPV)",
                "Parvovirus B19",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Marek's disease virus",
                "Bovine papillomavirus",
                "Pseudorabies virus (PRV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "BK Virus",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Parvovirus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Feline Panleukopenia Virus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "JC Virus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Pseudocowpox Virus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Torque teno virus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes simplex virus (HSV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Varicella-zoster virus (VZV)",
            "Human papillomavirus (HPV)",
            "Hepatitis B virus (HBV)",
            "Poxvirus",
            "Polyomavirus",
            "Papillomavirus",
            "Hepadnavirus",
            "Baculovirus",
            "Mimivirus",
            "Chlorovirus",
            "Pandoravirus",
            "Pithovirus",
            "Marseillevirus",
            "Iridovirus",
            "Ascoviridae",
            "Polydnavirus",
            "Asfarvirus",
            "Phycodnaviridae",
            "Herpesviridae",
            "Parvovirus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Iridovirus",
                "Parvovirus",
                "Phycodnaviridae",
                "Polyomavirus",
                "Ascoviridae"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes simplex virus (HSV)",
                "Epstein-Barr virus (EBV)",
                "Varicella-zoster virus (VZV)",
                "Human papillomavirus (HPV)",
                "Poxvirus",
                "Papillomavirus",
                "Hepadnavirus",
                "Baculovirus",
                "Mimivirus",
                "Chlorovirus",
                "Pandoravirus",
                "Pithovirus",
                "Marseillevirus",
                "Polydnavirus",
                "Asfarvirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Alphaherpesvirinae",
                "Ascoviridae",
                "Asfarviridae",
                "Baculoviridae",
                "Canine Parvovirus",
                "Circoviridae",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fuselloviridae",
                "Geminiviridae",
                "Granulovirus",
                "Gyrovirus",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human papillomavirus 16",
                "Inoviridae",
                "Inovirus",
                "Iridoviridae",
                "Iridovirus",
                "Mardivirus",
                "Merkel cell polyomavirus",
                "Microviridae",
                "Microvirus",
                "Mimiviridae",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Orf virus",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Phycodnaviridae",
                "Polydnaviridae",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Rudiviridae",
                "Siphoviridae",
                "Vaccinia virus",
                "Varicellovirus",
                "Woodchuck Hepatitis B Virus",
                "Xipapillomavirus"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus",
            "African swine fever virus (ASFV)",
            "BK polyomavirus (BKPyV)",
            "Bovine papillomavirus (BPV)",
            "Canine parvovirus (CPV)",
            "Cytomegalovirus (CMV)",
            "Epstein-Barr virus (EBV)",
            "Feline panleukopenia virus (FPV)",
            "Herpes simplex virus 1 (HSV-1)",
            "Herpes simplex virus 2 (HSV-2)",
            "Human papillomavirus (HPV)",
            "JC polyomavirus (JCPyV)",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Merkel cell polyomavirus (MCPyV)",
            "Molluscum contagiosum virus (MCV)",
            "Monkeypox virus (MPXV)",
            "Orf virus",
            "Poxvirus",
            "Pseudorabies virus (PRV)",
            "Simian virus 40 (SV40)",
            "Smallpox virus (Variola virus)",
            "Vaccinia virus (VACV)",
            "Varicella-zoster virus (VZV)",
            "White spot syndrome virus (WSSV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "BK Virus",
                "Canine Parvovirus",
                "Cytomegalovirus",
                "Feline Panleukopenia Virus",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 8",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Orf virus",
                "Simian virus 40",
                "Vaccinia virus",
                "Variola virus",
                "White spot syndrome virus 1"
            ],
            "mismatches": [
                "Adenovirus",
                "African swine fever virus (ASFV)",
                "Bovine papillomavirus (BPV)",
                "Epstein-Barr virus (EBV)",
                "Human papillomavirus (HPV)",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Poxvirus",
                "Pseudorabies virus (PRV)",
                "Varicella-zoster virus (VZV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "BK Virus",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Parvovirus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Feline Panleukopenia Virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 8",
                "Human papillomavirus 16",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Orthopoxvirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Pseudocowpox Virus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Simplexvirus",
                "Suid Herpesvirus 1",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "White spot syndrome virus 1"
            ],
            "TP": 16,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Herpes simplex virus (HSV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Hepatitis B virus (HBV)",
            "Varicella-zoster virus (VZV)",
            "Adenovirus",
            "Parvovirus B19",
            "Human papillomavirus (HPV)",
            "Polyomavirus",
            "Hepatitis C virus (HCV)",
            "Human immunodeficiency virus (HIV)",
            "Molluscum contagiosum virus",
            "Poxvirus",
            "Mimivirus",
            "Pandoravirus",
            "Pithovirus",
            "Marseillevirus",
            "Megavirus chilensis",
            "Cafeteria roenbergensis virus",
            "Klosneuvirus",
            "Tupanvirus",
            "Mollivirus sibericum",
            "Cedratvirus",
            "Orpheovirus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Hepatitis B virus",
                "Parvovirus",
                "Polyomavirus",
                "Molluscum contagiosum virus"
            ],
            "mismatches": [
                "Herpes simplex virus (HSV)",
                "Epstein-Barr virus (EBV)",
                "Varicella-zoster virus (VZV)",
                "Adenovirus",
                "Parvovirus B19",
                "Human papillomavirus (HPV)",
                "Hepatitis C virus (HCV)",
                "Human immunodeficiency virus (HIV)",
                "Poxvirus",
                "Mimivirus",
                "Pandoravirus",
                "Pithovirus",
                "Marseillevirus",
                "Megavirus chilensis",
                "Cafeteria roenbergensis virus",
                "Klosneuvirus",
                "Tupanvirus",
                "Mollivirus sibericum",
                "Cedratvirus",
                "Orpheovirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "Atadenovirus",
                "Badnavirus",
                "Caulimovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fuselloviridae",
                "Giant Viruses",
                "Granulovirus",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Mardivirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Mimiviridae",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Nimaviridae",
                "Orf virus",
                "Orthohepadnavirus",
                "Orthopoxvirus",
                "Parapoxvirus",
                "Parvovirus",
                "Plectrovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Siphoviridae",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 5,
            "FP": 20,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (ADV)",
            "Herpes Simplex Virus (HSV)",
            "Hepatitis B Virus (HBV)",
            "Epstein-Barr Virus (EBV)",
            "Varicella-Zoster Virus (VZV)",
            "Cytomegalovirus (CMV)",
            "Parvovirus B19 (B19V)",
            "Polyomavirus (PyV)",
            "Papillomavirus (HPV)",
            "Molluscum Contagiosum Virus (MCV)",
            "Human Immunodeficiency Virus (HIV)",
            "Hepatitis D Virus (HDV)",
            "Hepatitis C Virus (HCV)",
            "Influenza Virus (Flu)",
            "Coronavirus (CoV)",
            "Rhinovirus (RV)",
            "Respiratory Syncytial Virus (RSV)",
            "Rotavirus (RoV)",
            "Norovirus (NoV)",
            "Enterovirus (EV)",
            "Poxvirus (POXV)",
            "Monkeypox Virus (MPXV)",
            "Variola Virus (VARV)",
            "Vaccinia Virus (VACV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Polyomavirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Variola virus",
                "Vaccinia virus"
            ],
            "mismatches": [
                "Adenovirus (ADV)",
                "Herpes Simplex Virus (HSV)",
                "Hepatitis B Virus (HBV)",
                "Epstein-Barr Virus (EBV)",
                "Varicella-Zoster Virus (VZV)",
                "Parvovirus B19 (B19V)",
                "Papillomavirus (HPV)",
                "Human Immunodeficiency Virus (HIV)",
                "Hepatitis D Virus (HDV)",
                "Hepatitis C Virus (HCV)",
                "Influenza Virus (Flu)",
                "Coronavirus (CoV)",
                "Rhinovirus (RV)",
                "Respiratory Syncytial Virus (RSV)",
                "Rotavirus (RoV)",
                "Norovirus (NoV)",
                "Enterovirus (EV)",
                "Poxvirus (POXV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "Bocavirus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Gyrovirus",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inoviridae",
                "Inovirus",
                "Mardivirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Roseolovirus",
                "Simplexvirus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Epstein-Barr virus (EBV)",
            "Human papillomavirus (HPV)",
            "Herpes simplex virus 1 (HSV-1)",
            "Herpes simplex virus 2 (HSV-2)",
            "Human immunodeficiency virus 1 (HIV-1)",
            "Human immunodeficiency virus 2 (HIV-2)",
            "Cytomegalovirus (CMV)",
            "Varicella-zoster virus (VZV)",
            "Human T-lymphotropic virus 1 (HTLV-1)",
            "Human T-lymphotropic virus 2 (HTLV-2)",
            "Simian immunodeficiency virus (SIV)",
            "Feline immunodeficiency virus (FIV)",
            "Bovine leukemia virus (BLV)",
            "Simian virus 40 (SV40)",
            "Rous sarcoma virus (RSV)",
            "Avian leukosis virus (ALV)",
            "Murine leukemia virus (MLV)",
            "Rabies virus (RABV)",
            "Influenza A virus",
            "Influenza B virus",
            "Influenza C virus",
            "Influenza D virus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Simian virus 40"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Epstein-Barr virus (EBV)",
                "Human papillomavirus (HPV)",
                "Herpes simplex virus 1 (HSV-1)",
                "Herpes simplex virus 2 (HSV-2)",
                "Human immunodeficiency virus 1 (HIV-1)",
                "Human immunodeficiency virus 2 (HIV-2)",
                "Varicella-zoster virus (VZV)",
                "Human T-lymphotropic virus 1 (HTLV-1)",
                "Human T-lymphotropic virus 2 (HTLV-2)",
                "Simian immunodeficiency virus (SIV)",
                "Feline immunodeficiency virus (FIV)",
                "Bovine leukemia virus (BLV)",
                "Rous sarcoma virus (RSV)",
                "Avian leukosis virus (ALV)",
                "Murine leukemia virus (MLV)",
                "Rabies virus (RABV)",
                "Influenza A virus",
                "Influenza B virus",
                "Influenza C virus",
                "Influenza D virus"
            ],
            "true_referents": [
                "Adenoviridae",
                "Bocavirus",
                "Bovine Herpesvirus 1",
                "Bovine Herpesvirus 2",
                "Bovine papillomavirus 1",
                "Chicken anemia virus",
                "Cytomegalovirus",
                "Densovirus",
                "Gyrovirus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human bocavirus",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Lymphocryptovirus",
                "Microvirus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Parvovirus",
                "Polyomavirus",
                "Ranid Herpesvirus 1",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus"
            ],
            "TP": 2,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Human papillomavirus (HPV)",
            "Adenovirus",
            "Herpes simplex virus 1 (HSV-1)",
            "Herpes simplex virus 2 (HSV-2)",
            "Human cytomegalovirus (HCMV)",
            "Varicella-zoster virus (VZV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "JC virus",
            "BK virus",
            "Simian virus 40 (SV40)",
            "Murine polyomavirus",
            "Bovine papillomavirus (BPV)",
            "Yaba monkey tumor virus",
            "Frog virus 3",
            "Human endogenous retrovirus K (HERV-K)",
            "Torque teno virus (TTV)",
            "Merkel cell polyomavirus (MCPyV)",
            "Trichodysplasia spinulosa polyomavirus (TSPyV)",
            "Human polyomavirus 6 (HPyV6)",
            "Human polyomavirus 7 (HPyV7)",
            "Human polyomavirus 9 (HPyV9)",
            "Lymphocryptovirus (EBV-like)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "JC virus",
                "BK virus",
                "Yaba monkey tumor virus",
                "Torque teno virus",
                "Merkel cell polyomavirus",
                "Lymphocryptovirus"
            ],
            "mismatches": [
                "Human papillomavirus (HPV)",
                "Adenovirus",
                "Herpes simplex virus 1 (HSV-1)",
                "Herpes simplex virus 2 (HSV-2)",
                "Human cytomegalovirus (HCMV)",
                "Varicella-zoster virus (VZV)",
                "Epstein-Barr virus (EBV)",
                "Cytomegalovirus (CMV)",
                "Simian virus 40 (SV40)",
                "Murine polyomavirus",
                "Bovine papillomavirus (BPV)",
                "Frog virus 3",
                "Human endogenous retrovirus K (HERV-K)",
                "Trichodysplasia spinulosa polyomavirus (TSPyV)",
                "Human polyomavirus 6 (HPyV6)",
                "Human polyomavirus 7 (HPyV7)",
                "Human polyomavirus 9 (HPyV9)"
            ],
            "true_referents": [
                "Adenoviridae",
                "BK Virus",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Cytomegalovirus",
                "Equid Herpesvirus 3",
                "Gallid Herpesvirus 3",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Papillomavirus Viruses",
                "Human papillomavirus 16",
                "Human papillomavirus 18",
                "Human papillomavirus 6",
                "Iltovirus",
                "Inovirus",
                "JC Virus",
                "Lymphocryptovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Polydnaviridae",
                "Polyomaviridae",
                "Polyomavirus",
                "Ranavirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Torque teno virus",
                "Vaccinia virus",
                "Varicellovirus",
                "Yaba monkey tumor virus",
                "Yatapoxvirus"
            ],
            "TP": 6,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]