[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus (HSV)",
            "Papillomavirus (HPV)",
            "Hepatitis B Virus (HBV)",
            "Epstein-Barr Virus (EBV)",
            "Herpesvirus saimiri (HVS)",
            "Varicella-Zoster Virus (VZV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Cytomegalovirus (CMV)",
            "Kaposi's Sarcoma-Associated Herpesvirus (KSHV)",
            "Molluscum Contagiosum Virus (MCV)",
            "Polyomavirus (PyV)",
            "Simian Virus 40 (SV40)",
            "Adeno-Associated Virus (AAV)",
            "Baculovirus (BacV)",
            "Autographa californica M nucleopolyhedrovirus (AcMNPV)",
            "Rhabdovirus (RHDV)",
            "Measles Virus (MV)",
            "Mumps Virus (MuV)",
            "Respirovirus (RSV)",
            "Parainfluenza Virus (PIV)",
            "Influenza Virus (IFV)",
            "Poxvirus (PV)",
            "Molluscum Contagiosum Poxvirus (MCV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Molluscum contagiosum virus",
                "Polyomavirus",
                "Simian virus 40"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus (HSV)",
                "Papillomavirus (HPV)",
                "Hepatitis B Virus (HBV)",
                "Epstein-Barr Virus (EBV)",
                "Herpesvirus saimiri (HVS)",
                "Varicella-Zoster Virus (VZV)",
                "Kaposi's Sarcoma-Associated Herpesvirus (KSHV)",
                "Adeno-Associated Virus (AAV)",
                "Baculovirus (BacV)",
                "Autographa californica M nucleopolyhedrovirus (AcMNPV)",
                "Rhabdovirus (RHDV)",
                "Measles Virus (MV)",
                "Mumps Virus (MuV)",
                "Respirovirus (RSV)",
                "Parainfluenza Virus (PIV)",
                "Influenza Virus (IFV)",
                "Poxvirus (PV)",
                "Molluscum Contagiosum Poxvirus (MCV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "Baculoviridae",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Erythrovirus",
                "Fowl adenovirus A",
                "Geminiviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 8",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Nimaviridae",
                "Nucleopolyhedroviruses",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Rhadinovirus",
                "Rudiviridae",
                "Saimiriine Herpesvirus 2",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Suid Herpesvirus 1",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Papillomavirus (HPV)",
            "Hepatitis B Virus (HBV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Parvovirus B19",
            "Poxvirus (e.g., Variola Virus)",
            "Polyomavirus (e.g., JC Virus)",
            "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
            "Human T-lymphotropic Virus 1 (HTLV-1)",
            "Human T-lymphotropic Virus 2 (HTLV-2)",
            "Adeno-associated Virus (AAV)",
            "Simian Virus 40 (SV40)",
            "Baculovirus",
            "Papillomavirus (e.g., Bovine Papillomavirus)",
            "Molluscum Contagiosum Virus (MCV)",
            "Papillomavirus (e.g., Cottontail Rabbit Papillomavirus)",
            "Anellovirus (e.g., TTV - Torque Teno Virus)",
            "Boca Virus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Hepatitis B Virus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Simian Virus 40",
                "Baculovirus",
                "Molluscum Contagiosum Virus",
                "Anellovirus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Papillomavirus (HPV)",
                "Parvovirus B19",
                "Poxvirus (e.g., Variola Virus)",
                "Polyomavirus (e.g., JC Virus)",
                "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
                "Human T-lymphotropic Virus 1 (HTLV-1)",
                "Human T-lymphotropic Virus 2 (HTLV-2)",
                "Adeno-associated Virus (AAV)",
                "Papillomavirus (e.g., Bovine Papillomavirus)",
                "Papillomavirus (e.g., Cottontail Rabbit Papillomavirus)",
                "Boca Virus"
            ],
            "true_referents": [
                "Adenoviridae",
                "Anelloviridae",
                "BK Virus",
                "Baculoviridae",
                "Bocavirus",
                "Bovine Herpesvirus 2",
                "Bovine papillomavirus 1",
                "Cottontail rabbit papillomavirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fowl adenovirus A",
                "Geminiviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human bocavirus",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "JC Virus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Papillomaviridae",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Torque teno virus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Human Herpesvirus 8 (HHV-8)",
            "Papillomavirus",
            "Polyomavirus",
            "Parvovirus B19",
            "Hepatitis B Virus (HBV)",
            "Poxvirus",
            "Smallpox Virus (Variola)",
            "Vaccinia Virus",
            "Molluscum Contagiosum Virus",
            "Simian Virus 40 (SV40)",
            "JC Virus (JCV)",
            "BK Virus (BKV)",
            "Mercaptoethanolsulfonic acid (MES)",
            "Adeno-associated Virus (AAV)",
            "Adenovirus serotype 5 (Ad5)",
            "Adenovirus serotype 26 (Ad26)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Parvovirus",
                "Papillomavirus",
                "Polyomavirus",
                "Hepatitis B Virus",
                "Vaccinia Virus",
                "Molluscum Contagiosum Virus",
                "Simian Virus 40",
                "JC Virus",
                "BK Virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Poxvirus",
                "Smallpox Virus (Variola)",
                "Mercaptoethanolsulfonic acid (MES)",
                "Adeno-associated Virus (AAV)",
                "Adenovirus serotype 5 (Ad5)",
                "Adenovirus serotype 26 (Ad26)"
            ],
            "true_referents": [
                "Adenoviridae",
                "BK Virus",
                "Bacteriophage M13",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fowl adenovirus A",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus",
                "Xipapillomavirus"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Papillomavirus (HPV)",
            "Human Polyomavirus JC (JCV)",
            "Human Polyomavirus BK (BKV)",
            "Merkel Cell Polyomavirus (MCPyV)",
            "Parvovirus B19",
            "Human Adenovirus C (HAdV-C)",
            "Kaposi's Sarcoma-Associated Herpesvirus (KSHV/HHV-8)",
            "Human Herpesvirus 6 (HHV-6A)",
            "Human Herpesvirus 7 (HHV-7)",
            "Bovine Herpesvirus 1 (BHV-1)",
            "Canine Adenovirus 2 (CAV-2)",
            "Feline Herpesvirus 1 (FHV-1)",
            "Simian Virus 40 (SV40)",
            "Hepatitis B Virus (HBV)",
            "African Swine Fever Virus (ASFV)",
            "Poxviridae family (e.g., Vaccinia Virus)",
            "Ringtail Possum Adenovirus (RPAdV)",
            "Human Bocavirus (HBoV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Bovine Herpesvirus 1",
                "Simian virus 40",
                "Hepatitis B virus",
                "African Swine Fever Virus",
                "Poxviridae",
                "Human bocavirus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Papillomavirus (HPV)",
                "Human Polyomavirus JC (JCV)",
                "Human Polyomavirus BK (BKV)",
                "Merkel Cell Polyomavirus (MCPyV)",
                "Parvovirus B19",
                "Human Adenovirus C (HAdV-C)",
                "Kaposi's Sarcoma-Associated Herpesvirus (KSHV/HHV-8)",
                "Canine Adenovirus 2 (CAV-2)",
                "Feline Herpesvirus 1 (FHV-1)",
                "Ringtail Possum Adenovirus (RPAdV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "BK Virus",
                "Bocavirus",
                "Bovine Herpesvirus 1",
                "Bovine Herpesvirus 5",
                "Canine Adenoviruses",
                "Canine Parvovirus",
                "Cottontail rabbit papillomavirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Equid Herpesvirus 1",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human bocavirus",
                "Human papillomavirus 16",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Parvovirus",
                "Podoviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 10,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus (HSV)",
            "Varicella Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Papillomavirus (HPV)",
            "Hepatitis B Virus (HBV)",
            "Smallpox Virus (Variola)",
            "Vaccinia Virus",
            "Molluscum Contagiosum Virus (MCV)",
            "Parvovirus B19",
            "BK Virus",
            "JC Virus",
            "Merkel Cell Polyomavirus (MCV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Human Herpesvirus 8 (HHV-8)",
            "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
            "Orf Virus",
            "Bovine Papillomavirus (BPV)",
            "Simian Virus 40 (SV40)",
            "Canine Adenovirus",
            "Equine Herpesvirus",
            "African Swine Fever Virus (ASFV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "BK Virus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Orf virus",
                "Vaccinia virus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "African Swine Fever Virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus (HSV)",
                "Varicella Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Papillomavirus (HPV)",
                "Hepatitis B Virus (HBV)",
                "Smallpox Virus (Variola)",
                "Molluscum Contagiosum Virus (MCV)",
                "Parvovirus B19",
                "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
                "Bovine Papillomavirus (BPV)",
                "Simian Virus 40 (SV40)",
                "Canine Adenovirus",
                "Equine Herpesvirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "BK Virus",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Adenoviruses",
                "Canine Parvovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Equid Herpesvirus 1",
                "Equid Herpesvirus 3",
                "Equid Herpesvirus 4",
                "Fowl adenovirus A",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Orthopoxvirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus (HSV)",
            "Human Papillomavirus (HPV)",
            "Hepatitis B Virus (HBV)",
            "Epstein-Barr Virus (EBV)",
            "Varicella-Zoster Virus (VZV)",
            "Cytomegalovirus (CMV)",
            "Poxvirus (PV)",
            "Parvovirus B19 (B19V)",
            "Molluscum Contagiosum Virus (MCV)",
            "Canine Parvovirus (CPV)",
            "Feline Panleukopenia Virus (FPV)",
            "Simian Virus 40 (SV40)",
            "Kaposi's Sarcoma-Associated Herpesvirus (KSHV)",
            "Bovine Papillomavirus (BPV)",
            "Porcine Parvovirus (PPV)",
            "Avian Adenovirus (AAvV)",
            "Human Adenovirus (HAdV)",
            "Lymphocytic Choriomeningitis Virus (LCMV)",
            "African Swine Fever Virus (ASFV)",
            "Baculovirus (Bac)",
            "Infectious Bursal Disease Virus (IBDV)",
            "Lymphoma-associated Virus (Mason-Pfizer Monkey Virus, MPMV)",
            "Tocopherol-Associated Virus (TAV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Canine Parvovirus",
                "Feline Panleukopenia Virus",
                "Simian virus 40",
                "Porcine Parvovirus",
                "African Swine Fever Virus",
                "Baculoviridae",
                "Human Adenoviruses"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus (HSV)",
                "Human Papillomavirus (HPV)",
                "Hepatitis B Virus (HBV)",
                "Epstein-Barr Virus (EBV)",
                "Varicella-Zoster Virus (VZV)",
                "Poxvirus (PV)",
                "Parvovirus B19 (B19V)",
                "Molluscum Contagiosum Virus (MCV)",
                "Kaposi's Sarcoma-Associated Herpesvirus (KSHV)",
                "Bovine Papillomavirus (BPV)",
                "Avian Adenovirus (AAvV)",
                "Lymphocytic Choriomeningitis Virus (LCMV)",
                "Infectious Bursal Disease Virus (IBDV)",
                "Lymphoma-associated Virus (Mason-Pfizer Monkey Virus, MPMV)",
                "Tocopherol-Associated Virus (TAV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "Atadenovirus",
                "Aviadenovirus",
                "Baculoviridae",
                "Badnavirus",
                "Betapapillomavirus",
                "Bocavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Parvovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Feline Panleukopenia Virus",
                "Fowl adenovirus A",
                "Geminiviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Inovirus",
                "Lymphocryptovirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Hepatitis B Virus (HBV)",
            "Human Papillomavirus (HPV)",
            "Herpes Simplex Virus (HSV)",
            "Epstein-Barr Virus (EBV)",
            "Varicella-Zoster Virus (VZV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
            "Cytomegalovirus (CMV)",
            "Polyomavirus (PyV)",
            "Parvovirus B19 (B19V)",
            "Human T-lymphotropic virus (HTLV)",
            "Monkeypox Virus (MPXV)",
            "Canine Parvovirus (CPV)",
            "Bovine Papillomavirus (BPV)",
            "Simian Virus 40 (SV40)",
            "Chicken Anemia Virus (CAV)",
            "African Swine Fever Virus (ASFV)",
            "Porcine Circovirus (PCV)",
            "Banana Bunchy Top Virus (BBTV)",
            "Bean Yellow Dwarf Virus (BeYDV)",
            "Tomato Yellow Leaf Curl Virus (TYLCV)",
            "Wheat Dwarf Virus (WDV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hepatitis B Virus (HBV)",
                "Human Herpesvirus 6 (HHV-6)",
                "Human Herpesvirus 7 (HHV-7)",
                "Cytomegalovirus (CMV)",
                "Polyomavirus (PyV)",
                "Parvovirus B19 (B19V)",
                "Monkeypox Virus (MPXV)",
                "Canine Parvovirus (CPV)",
                "Chicken Anemia Virus (CAV)",
                "African Swine Fever Virus (ASFV)",
                "Simian Virus 40 (SV40)"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Human Papillomavirus (HPV)",
                "Herpes Simplex Virus (HSV)",
                "Epstein-Barr Virus (EBV)",
                "Varicella-Zoster Virus (VZV)",
                "Kaposi's Sarcoma-associated Herpesvirus (KSHV)",
                "Human T-lymphotropic virus (HTLV)",
                "Bovine Papillomavirus (BPV)",
                "Porcine Circovirus (PCV)",
                "Banana Bunchy Top Virus (BBTV)",
                "Bean Yellow Dwarf Virus (BeYDV)",
                "Tomato Yellow Leaf Curl Virus (TYLCV)",
                "Wheat Dwarf Virus (WDV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "BK Virus",
                "Begomovirus",
                "Betapapillomavirus",
                "Bocavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Parvovirus",
                "Chicken anemia virus",
                "Circoviridae",
                "Circovirus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Geminiviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Parapoxvirus",
                "Parvovirus",
                "Plectrovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Tungrovirus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Herpes simplex virus (HSV)",
            "Varicella-zoster virus (VZV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human papillomavirus (HPV)",
            "Adenovirus",
            "Hepatitis B virus (HBV)",
            "Human immunodeficiency virus (HIV)",
            "Poxvirus",
            "Human T-lymphotropic virus (HTLV)",
            "Polyomavirus",
            "Molluscum contagiosum virus",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Human herpesvirus 6 (HHV-6)",
            "Human herpesvirus 7 (HHV-7)",
            "Human herpesvirus 8 (HHV-8)",
            "Simian virus 40 (SV40)",
            "Bovine papillomavirus (BPV)",
            "Canine parvovirus",
            "Feline panleukopenia virus (FPV)",
            "Porcine circovirus",
            "Avian influenza virus",
            "Rabbit hemorrhagic disease virus (RHDV)",
            "West Nile virus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human papillomavirus",
                "Hepatitis B virus",
                "Polyomavirus",
                "Molluscum contagiosum virus",
                "Human herpesvirus 6",
                "Human herpesvirus 7",
                "Human herpesvirus 8",
                "Simian virus 40",
                "Canine parvovirus",
                "Feline panleukopenia virus"
            ],
            "mismatches": [
                "Herpes simplex virus (HSV)",
                "Varicella-zoster virus (VZV)",
                "Epstein-Barr virus (EBV)",
                "Adenovirus",
                "Human immunodeficiency virus (HIV)",
                "Poxvirus",
                "Human T-lymphotropic virus (HTLV)",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Bovine papillomavirus (BPV)",
                "Porcine circovirus",
                "Avian influenza virus",
                "Rabbit hemorrhagic disease virus (RHDV)",
                "West Nile virus"
            ],
            "true_referents": [
                "Adenoviridae",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Parvovirus",
                "Circoviridae",
                "Circovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Feline Panleukopenia Virus",
                "Fowl adenovirus A",
                "Fowlpox virus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Rabbit Fibroma Virus",
                "Rhadinovirus",
                "Rudiviridae",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Tungrovirus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes Simplex Virus 1 (HSV-1)",
            "Herpes Simplex Virus 2 (HSV-2)",
            "Varicella-Zoster Virus (VZV)",
            "Epstein-Barr Virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Human Herpesvirus 6 (HHV-6)",
            "Human Herpesvirus 7 (HHV-7)",
            "Human Herpesvirus 8 (HHV-8)",
            "Human Papillomavirus (HPV)",
            "Merkel Cell Polyomavirus (MCPyV)",
            "JC Virus (JCV)",
            "BK Virus (BKV)",
            "Vaccinia Virus (VACV)",
            "Variola Virus (Smallpox Virus)",
            "Molluscum Contagiosum Virus (MCV)",
            "Pseudorabies Virus (PRV)",
            "African Swine Fever Virus (ASFV)",
            "Parvovirus B19",
            "Hepatitis B Virus (HBV)",
            "Torque Teno Virus (TTV)",
            "Adeno-associated Virus (AAV)",
            "Bovine Papillomavirus (BPV)",
            "Canine Parvovirus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Merkel cell polyomavirus",
                "JC Virus",
                "BK Virus",
                "Vaccinia virus",
                "Variola virus",
                "Molluscum contagiosum virus",
                "African Swine Fever Virus",
                "Hepatitis B virus",
                "Torque teno virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes Simplex Virus 1 (HSV-1)",
                "Herpes Simplex Virus 2 (HSV-2)",
                "Varicella-Zoster Virus (VZV)",
                "Epstein-Barr Virus (EBV)",
                "Human Papillomavirus (HPV)",
                "Pseudorabies Virus (PRV)",
                "Parvovirus B19",
                "Adeno-associated Virus (AAV)",
                "Bovine Papillomavirus (BPV)",
                "Canine Parvovirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "BK Virus",
                "Betapapillomavirus",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Canine Parvovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Fowl adenovirus A",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Orf virus",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Pseudocowpox Virus",
                "Torque teno virus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes simplex virus 1 (HSV-1)",
            "Human papillomavirus (HPV)",
            "Hepatitis B virus (HBV)",
            "Epstein-Barr virus (EBV)",
            "Varicella-zoster virus (VZV)",
            "Cytomegalovirus (CMV)",
            "Parvovirus B19",
            "Human polyomavirus (HPyV)",
            "Variola virus",
            "Molluscum contagiosum virus (MCV)",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Human bocavirus (HBoV)",
            "Torque teno virus (TTV)",
            "Mimivirus",
            "Poxvirus",
            "Baculovirus",
            "Chlorella virus",
            "African swine fever virus (ASFV)",
            "Cauliflower mosaic virus (CaMV)",
            "Hepadnavirus",
            "Circovirus",
            "Iridovirus",
            "Papillomavirus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Variola virus",
                "Molluscum contagiosum virus",
                "Human bocavirus",
                "Torque teno virus",
                "African swine fever virus",
                "Circovirus",
                "Iridovirus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes simplex virus 1 (HSV-1)",
                "Human papillomavirus (HPV)",
                "Hepatitis B virus (HBV)",
                "Epstein-Barr virus (EBV)",
                "Varicella-zoster virus (VZV)",
                "Cytomegalovirus (CMV)",
                "Parvovirus B19",
                "Human polyomavirus (HPyV)",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Mimivirus",
                "Poxvirus",
                "Baculovirus",
                "Chlorella virus",
                "Cauliflower mosaic virus (CaMV)",
                "Hepadnavirus",
                "Papillomavirus"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Ascoviridae",
                "Asfarviridae",
                "Baculoviridae",
                "Bocavirus",
                "Caulimoviridae",
                "Caulimovirus",
                "Circoviridae",
                "Circovirus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Ectromelia virus",
                "Geminiviridae",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 8",
                "Human Papillomavirus Viruses",
                "Human Parvovirus B19",
                "Human bocavirus",
                "Human papillomavirus 16",
                "Human papillomavirus 18",
                "Iltovirus",
                "Inovirus",
                "Iridoviridae",
                "Iridovirus",
                "Microvirus",
                "Mimiviridae",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Nanovirus",
                "Orf virus",
                "Papillomaviridae",
                "Parapoxvirus",
                "Parvovirus",
                "Plectrovirus",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Poxviridae",
                "Rudiviridae",
                "Torque teno virus",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus",
                "Xipapillomavirus"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Human papillomavirus (HPV)",
            "Adenovirus (AdV)",
            "Herpes simplex virus 1 (HSV-1)",
            "Herpes simplex virus 2 (HSV-2)",
            "Varicella-zoster virus (VZV)",
            "Epstein-Barr virus (EBV)",
            "Cytomegalovirus (CMV)",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Hepatitis B virus (HBV)",
            "Parvovirus B19",
            "JC virus (JCV)",
            "BK virus (BKV)",
            "Merkel cell polyomavirus (MCPyV)",
            "Human bocavirus (HBoV)",
            "Molluscum contagiosum virus (MCV)",
            "Vaccinia virus (VACV)",
            "Cowpox virus (CPV)",
            "Monkeypox virus (MPV)",
            "Orf virus (ORFV)",
            "African swine fever virus (ASFV)",
            "Feline panleukopenia virus (FPV)",
            "Canine parvovirus (CPV)",
            "Simian virus 40 (SV40)",
            "Polyomavirus BK (BKPyV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Hepatitis B virus",
                "JC Virus",
                "BK Virus",
                "Merkel cell polyomavirus",
                "Human bocavirus",
                "Molluscum contagiosum virus",
                "Vaccinia virus",
                "Cowpox virus",
                "Monkeypox virus",
                "Orf virus",
                "African Swine Fever Virus",
                "Feline Panleukopenia Virus",
                "Canine Parvovirus",
                "Simian virus 40"
            ],
            "mismatches": [
                "Human papillomavirus (HPV)",
                "Adenovirus (AdV)",
                "Herpes simplex virus 1 (HSV-1)",
                "Herpes simplex virus 2 (HSV-2)",
                "Varicella-zoster virus (VZV)",
                "Epstein-Barr virus (EBV)",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Parvovirus B19",
                "Polyomavirus BK (BKPyV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Asfarviridae",
                "BK Virus",
                "Bocavirus",
                "Canine Parvovirus",
                "Cowpox virus",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Feline Panleukopenia Virus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 8",
                "Human Parvovirus B19",
                "Human bocavirus",
                "Human papillomavirus 16",
                "Inovirus",
                "JC Virus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Molluscipoxvirus",
                "Molluscum contagiosum virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Orthopoxvirus",
                "Parapoxvirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Porcine Parvovirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus",
                "Variola virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenoviridae (AdV)",
            "Papillomaviridae (PV)",
            "Polyomaviridae (PyV)",
            "Parvoviridae (PaV)",
            "Herpesviridae (HHV)",
            "Poxviridae (POXV)",
            "Hepadnaviridae (HBV)",
            "Caudovirales (Caudovirales)",
            "Iridoviridae (IIV)",
            "Asfarviridae (ASFV)",
            "Baculoviridae (BV)",
            "Nimaviridae (NIMV)",
            "Plasmaviridae (PlasmaV)",
            "Genomoviridae (GemV)",
            "Circoviridae (CV)",
            "Anelloviridae (AnelloV)",
            "Bacilliadnaviridae (BdnV)",
            "Ampullaviridae (AmpullaV)",
            "Lipothrixviridae (LipothrixV)",
            "Rudiviridae (RudivV)",
            "Salterprovirus (SalterproV)",
            "Phycodnaviridae (PhycoDNAV)",
            "Marseilleviridae (MarseilleV)",
            "Pithoviridae (PithoV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adenoviridae",
                "Papillomaviridae",
                "Polyomaviridae",
                "Parvoviridae",
                "Herpesviridae",
                "Poxviridae",
                "Hepadnaviridae",
                "Caudovirales",
                "Iridoviridae",
                "Asfarviridae",
                "Baculoviridae",
                "Nimaviridae",
                "Circoviridae",
                "Anelloviridae",
                "Lipothrixviridae",
                "Rudiviridae",
                "Phycodnaviridae"
            ],
            "mismatches": [
                "Plasmaviridae",
                "Genomoviridae",
                "Bacilliadnaviridae",
                "Ampullaviridae",
                "Salterprovirus",
                "Marseilleviridae",
                "Pithoviridae"
            ],
            "true_referents": [
                "Adenoviridae",
                "Anelloviridae",
                "Ascoviridae",
                "Asfarviridae",
                "Baculoviridae",
                "Caudovirales",
                "Caulimoviridae",
                "Circoviridae",
                "Circovirus",
                "Duck Hepatitis B Virus",
                "Fuselloviridae",
                "Gammaherpesvirinae",
                "Geminiviridae",
                "Guttaviridae",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Herpesvirus 1",
                "Human Papillomavirus Viruses",
                "Inoviridae",
                "Iridoviridae",
                "Iridovirus",
                "Lipothrixviridae",
                "Microviridae",
                "Microvirus",
                "Mimiviridae",
                "Molluscipoxvirus",
                "Mupapillomavirus",
                "Myoviridae",
                "Nanoviridae",
                "Nanovirus",
                "Nimaviridae",
                "Nudiviridae",
                "Papillomaviridae",
                "Parvoviridae",
                "Parvovirinae",
                "Parvovirus",
                "Phycodnaviridae",
                "Plectrovirus",
                "Podoviridae",
                "Polydnaviridae",
                "Polyomaviridae",
                "Polyomavirus",
                "Poxviridae",
                "Rudiviridae",
                "Simplexvirus",
                "Siphoviridae",
                "Tectiviridae"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Anelloviridae",
            "Baculoviridae",
            "Circoviridae",
            "Coccolithoviridae",
            "Corticoviridae",
            "Fuselloviridae",
            "Geminiviridae",
            "Herpesviridae",
            "Inoviridae",
            "Lipothrixviridae",
            "Microviridae",
            "Myoviridae",
            "Nimaviridae",
            "Papillomaviridae",
            "Parvoviridae",
            "Phycodnaviridae",
            "Podoviridae",
            "Polydnaviridae",
            "Poxviridae",
            "Rudiviridae",
            "Tectiviridae",
            "Tombusviridae",
            "Totiviridae"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Anelloviridae",
                "Baculoviridae",
                "Circoviridae",
                "Fuselloviridae",
                "Geminiviridae",
                "Herpesviridae",
                "Inoviridae",
                "Lipothrixviridae",
                "Microviridae",
                "Myoviridae",
                "Nimaviridae",
                "Papillomaviridae",
                "Parvoviridae",
                "Phycodnaviridae",
                "Podoviridae",
                "Polydnaviridae",
                "Poxviridae",
                "Rudiviridae",
                "Tectiviridae"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Coccolithoviridae",
                "Corticoviridae",
                "Tombusviridae",
                "Totiviridae"
            ],
            "true_referents": [
                "Adenoviridae",
                "Alphaherpesvirinae",
                "Anelloviridae",
                "Ascoviridae",
                "Baculoviridae",
                "Circoviridae",
                "Circovirus",
                "Fuselloviridae",
                "Geminiviridae",
                "Guttaviridae",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Papillomavirus Viruses",
                "Inoviridae",
                "Inovirus",
                "Lipothrixviridae",
                "Microviridae",
                "Molluscipoxvirus",
                "Mupapillomavirus",
                "Myoviridae",
                "Nanoviridae",
                "Nimaviridae",
                "Nudiviridae",
                "Papillomaviridae",
                "Parvoviridae",
                "Parvovirinae",
                "Parvovirus",
                "Phycodnaviridae",
                "Podoviridae",
                "Polydnaviridae",
                "Polyomaviridae",
                "Poxviridae",
                "Rudiviridae",
                "Siphoviridae",
                "Tectiviridae"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Human Papillomavirus (HPV)",
            "Adenovirus",
            "Herpes Simplex Virus",
            "Epstein-Barr Virus (EBV)",
            "Hepatitis B Virus (HBV)",
            "Hepatitis C Virus (HCV)",
            "Human Immunodeficiency Virus (HIV)",
            "Cytomegalovirus (CMV)",
            "Varicella-Zoster Virus (VZV)",
            "Human T-Lymphotropic Virus (HTLV)",
            "Papovavirus",
            "Polyomavirus",
            "Adenovirus 5",
            "Herpes Simplex Virus 2",
            "Epstein-Barr Virus",
            "Human T-Lymphotropic Virus 1",
            "Human T-Lymphotropic Virus 2",
            "Hepatitis A Virus",
            "Hepatitis E Virus",
            "Human Herpesvirus 6",
            "Human Herpesvirus 8",
            "Simian Virus 40",
            "Bovine Papillomavirus",
            "Feline Leukemia Virus"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cytomegalovirus",
                "Human Herpesvirus 6",
                "Human Herpesvirus 8",
                "Polyomavirus",
                "Simian Virus 40"
            ],
            "mismatches": [
                "Human Papillomavirus (HPV)",
                "Adenovirus",
                "Herpes Simplex Virus",
                "Epstein-Barr Virus (EBV)",
                "Hepatitis B Virus (HBV)",
                "Hepatitis C Virus (HCV)",
                "Human Immunodeficiency Virus (HIV)",
                "Varicella-Zoster Virus (VZV)",
                "Human T-Lymphotropic Virus (HTLV)",
                "Papovavirus",
                "Adenovirus 5",
                "Herpes Simplex Virus 2",
                "Epstein-Barr Virus",
                "Human T-Lymphotropic Virus 1",
                "Human T-Lymphotropic Virus 2",
                "Hepatitis A Virus",
                "Hepatitis E Virus",
                "Bovine Papillomavirus",
                "Feline Leukemia Virus"
            ],
            "true_referents": [
                "Adenoviridae",
                "Alphapapillomavirus",
                "Betapapillomavirus",
                "Bovine Herpesvirus 2",
                "Bovine papillomavirus 1",
                "Bovine papillomavirus 4",
                "Cytomegalovirus",
                "Duck Hepatitis B Virus",
                "Feline Panleukopenia Virus",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 8",
                "Human Papillomavirus Viruses",
                "Human papillomavirus 16",
                "Iltovirus",
                "Inovirus",
                "Lymphocryptovirus",
                "Merkel cell polyomavirus",
                "Microvirus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Parvovirus",
                "Polyomaviridae",
                "Polyomavirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Simplexvirus",
                "Vaccinia virus",
                "Varicellovirus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            "Adenovirus (AdV)",
            "Herpes simplex virus 1 (HSV-1)",
            "Human cytomegalovirus (HCMV)",
            "Epstein-Barr virus (EBV)",
            "Human papillomavirus (HPV)",
            "Simian virus 40 (SV40)",
            "JC virus",
            "BK virus",
            "Varicella-zoster virus (VZV)",
            "Human herpesvirus 6 (HHV-6)",
            "Human herpesvirus 7 (HHV-7)",
            "Kaposi's sarcoma-associated herpesvirus (KSHV)",
            "Murine cytomegalovirus (MCMV)",
            "Rhesus cytomegalovirus (RhCMV)",
            "African swine fever virus",
            "Porcine circovirus",
            "Feline calicivirus (FCV)",
            "Canine adenovirus (CAV-1)",
            "Avian adenovirus",
            "Human endogenous retrovirus K (HERV-K)",
            "Bovine adenovirus (BAdV-3)",
            "Ovine adenovirus (OAdV)",
            "Caprine adenovirus (CApAdV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "JC virus",
                "BK virus",
                "Simian virus 40",
                "Human herpesvirus 6 (HHV-6)",
                "Human herpesvirus 7 (HHV-7)",
                "African swine fever virus"
            ],
            "mismatches": [
                "Adenovirus (AdV)",
                "Herpes simplex virus 1 (HSV-1)",
                "Human cytomegalovirus (HCMV)",
                "Epstein-Barr virus (EBV)",
                "Human papillomavirus (HPV)",
                "Varicella-zoster virus (VZV)",
                "Kaposi's sarcoma-associated herpesvirus (KSHV)",
                "Murine cytomegalovirus (MCMV)",
                "Rhesus cytomegalovirus (RhCMV)",
                "Porcine circovirus",
                "Feline calicivirus (FCV)",
                "Canine adenovirus (CAV-1)",
                "Avian adenovirus",
                "Human endogenous retrovirus K (HERV-K)",
                "Bovine adenovirus (BAdV-3)",
                "Ovine adenovirus (OAdV)",
                "Caprine adenovirus (CApAdV)"
            ],
            "true_referents": [
                "Adenoviridae",
                "African Swine Fever Virus",
                "Aviadenovirus",
                "BK Virus",
                "Bovine Herpesvirus 1",
                "Bovine Herpesvirus 5",
                "Canid Herpesvirus 1",
                "Canine Adenoviruses",
                "Canine Parvovirus",
                "Capripoxvirus",
                "Circoviridae",
                "Circovirus",
                "Cytomegalovirus",
                "Fowl adenovirus A",
                "Herpesviridae",
                "Human Adenoviruses",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Herpesvirus 3",
                "Human Herpesvirus 6",
                "Human Herpesvirus 7",
                "Human Herpesvirus 8",
                "Human papillomavirus 16",
                "Inovirus",
                "JC Virus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Muromegalovirus",
                "Orf virus",
                "Parvovirus",
                "Polyomavirus",
                "Porcine Adenoviruses",
                "Porcine Parvovirus",
                "Simian Adenoviruses",
                "Simian virus 40",
                "Vaccinia virus",
                "Varicellovirus"
            ],
            "TP": 6,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "DNA virus",
        "domain": "medicine",
        "response": [
            {
                "Referent": "Adenoviridae",
                "Canonical name": "Adenoviridae"
            },
            {
                "Referent": "Adenovirus",
                "Canonical name": "Adenovirus"
            },
            {
                "Referent": "Baculoviridae",
                "Canonical name": "Baculoviridae"
            },
            {
                "Referent": "Baculovirus",
                "Canonical name": "Baculovirus"
            },
            {
                "Referent": "Herpesviridae",
                "Canonical name": "Herpesviridae"
            },
            {
                "Referent": "Herpes simplex virus 1",
                "Canonical name": "Herpes simplex virus 1"
            },
            {
                "Referent": "Herpes simplex virus 2",
                "Canonical name": "Herpes simplex virus 2"
            },
            {
                "Referent": "Papillomaviridae",
                "Canonical name": "Papillomaviridae"
            },
            {
                "Referent": "Papillomavirus",
                "Canonical name": "Papillomavirus"
            },
            {
                "Referent": "Poxviridae",
                "Canonical name": "Poxviridae"
            },
            {
                "Referent": "Poxvirus",
                "Canonical name": "Poxvirus"
            },
            {
                "Referent": "Polyomaviridae",
                "Canonical name": "Polyomaviridae"
            },
            {
                "Referent": "Polyomavirus",
                "Canonical name": "Polyomavirus"
            },
            {
                "Referent": "Parvoviridae",
                "Canonical name": "Parvoviridae"
            },
            {
                "Referent": "Parvovirus",
                "Canonical name": "Parvovirus"
            },
            {
                "Referent": "Picornaviridae",
                "Canonical name": "Picornaviridae"
            },
            {
                "Referent": "Picornavirus",
                "Canonical name": "Picornavirus"
            },
            {
                "Referent": "Reoviridae",
                "Canonical name": "Reoviridae"
            },
            {
                "Referent": "Reovirus",
                "Canonical name": "Reovirus"
            },
            {
                "Referent": "Togaviridae",
                "Canonical name": "Togaviridae"
            },
            {
                "Referent": "Togavirus",
                "Canonical name": "Togavirus"
            },
            {
                "Referent": "Hepadnaviridae",
                "Canonical name": "Hapadnaviridae"
            },
            {
                "Referent": "Hepatitis B virus",
                "Canonical name": "Hepatitis B virus"
            },
            {
                "Referent": "Hepatitis E virus",
                "Canonical name": "Hepatitis E virus"
            },
            {
                "Referent": "Hepatitis G virus",
                "Canonical name": "Hepatitis G virus"
            },
            {
                "Referent": "Hepatitis C virus",
                "Canonical name": "Hepatitis C virus"
            },
            {
                "Referent": "Hepatitis D virus",
                "Canonical name": "Hepatitis D virus"
            },
            {
                "Referent": "Hepatitis F virus",
                "Canonical name": "Hepatitis F virus"
            },
            {
                "Referent": "Hepatitis G virus",
                "Canonical name": "Hepatitis G virus"
            },
            {
                "Referent": "Hepatitis H virus",
                "Canonical name": "Hepatitis H virus"
            },
            {
                "Referent": "Hepatitis I virus",
                "Canonical name": "Hepatitis I virus"
            },
            {
                "Referent": "Hepatitis J virus",
                "Canonical name": "Hepatitis J virus"
            },
            {
                "Referent": "Hepatitis K virus",
                "Canonical name": "Hepatitis K virus"
            },
            {
                "Referent": "Hepatitis M virus",
                "Canonical name": "Hepatitis M virus"
            },
            {
                "Referent": "Hepatitis N virus",
                "Canonical name": "Hepatitis N virus"
            },
            {
                "Referent": "Hepatitis O virus",
                "Canonical name": "Hepatitis O virus"
            },
            {
                "Referent": "Hepatitis P virus",
                "Canonical name": "Hepatitis P virus"
            },
            {
                "Referent": "Hepatitis R virus",
                "Canonical name": "Hepatitis R virus"
            },
            {
                "Referent": "Hepatitis T virus",
                "Canonical name": "Hepatitis T virus"
            },
            {
                "Referent": "Hepatitis V virus",
                "Canonical name": "Hepatitis V virus"
            },
            {
                "Referent": "Hepatitis X virus",
                "Canonical name": "Hepatitis X virus"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Adenoviridae",
                "Baculoviridae",
                "Herpesviridae",
                "Papillomaviridae",
                "Poxviridae",
                "Polyomaviridae",
                "Parvoviridae",
                "Hepadnaviridae",
                "Hepatitis B virus"
            ],
            "mismatches": [
                "Adenovirus",
                "Baculovirus",
                "Herpes simplex virus 1",
                "Herpes simplex virus 2",
                "Papillomavirus",
                "Poxvirus",
                "Picornaviridae",
                "Picornavirus",
                "Reoviridae",
                "Reovirus",
                "Togaviridae",
                "Togavirus",
                "Hepatitis E virus",
                "Hepatitis G virus",
                "Hepatitis C virus",
                "Hepatitis D virus",
                "Hepatitis F virus",
                "Hepatitis H virus",
                "Hepatitis I virus",
                "Hepatitis J virus",
                "Hepatitis K virus",
                "Hepatitis M virus",
                "Hepatitis N virus",
                "Hepatitis O virus",
                "Hepatitis P virus",
                "Hepatitis R virus",
                "Hepatitis T virus",
                "Hepatitis V virus",
                "Hepatitis X virus"
            ],
            "true_referents": [
                "Adenoviridae",
                "Alphaherpesvirinae",
                "BK Virus",
                "Baculoviridae",
                "Canine Parvovirus",
                "Cytomegalovirus",
                "Entomopoxvirinae",
                "Geminiviridae",
                "Hepadnaviridae",
                "Hepatitis B virus",
                "Herpesviridae",
                "Human Herpesvirus 1",
                "Human Herpesvirus 2",
                "Human Papillomavirus Viruses",
                "Inoviridae",
                "Inovirus",
                "Monkeypox virus",
                "Mupapillomavirus",
                "Myoviridae",
                "Nimaviridae",
                "Papillomaviridae",
                "Parvoviridae",
                "Parvovirinae",
                "Parvovirus",
                "Plectrovirus",
                "Podoviridae",
                "Polydnaviridae",
                "Polyomaviridae",
                "Polyomavirus",
                "Poxviridae",
                "Rudiviridae",
                "Tectiviridae",
                "Vaccinia virus",
                "Woodchuck Hepatitis B Virus"
            ],
            "TP": 9,
            "FP": 29,
            "FN": 0
        }
    }
]