[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide (AC)",
            "Dichlorovos (DCV)",
            "Benzovindiflupyr (BVI)",
            "Etofenprox (ETF)",
            "Hexythiazox (HTZ)",
            "Propargite (PRG)",
            "Spiromesifen (SPM)",
            "Spiroxamine (SRX)",
            "Clofentezine (CLF)",
            "Cyhexatin (CHT)",
            "Diflovidazin (DFV)",
            "Hexythiazox (HTZ)",
            "Tetradifon (TDF)",
            "Dicyclanil (DCN)",
            "Fluacyprim (FUP)",
            "Cyhexatin (CHT)",
            "Spiroxamine (SRX)",
            "Bifenazate (BFN)",
            "Flonicamid (FLN)",
            "Pyridaben (PYR)",
            "Tebufenpyrad (TBP)",
            "Etofenprox (ETF)",
            "Fluazuron (FZR)",
            "Spiroxamine (SRX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexythiazox (HTZ)",
                "Propargite (PRG)",
                "Clofentezine (CLF)",
                "Cyhexatin (CHT)",
                "Tetradifon (TDF)",
                "Pyridaben (PYR)",
                "Bifenazate (BFN)",
                "Fluazuron (FZR)"
            ],
            "mismatches": [
                "Acaricide (AC)",
                "Dichlorovos (DCV)",
                "Benzovindiflupyr (BVI)",
                "Etofenprox (ETF)",
                "Spiromesifen (SPM)",
                "Spiroxamine (SRX)",
                "Diflovidazin (DFV)",
                "Dicyclanil (DCN)",
                "Fluacyprim (FUP)",
                "Flonicamid (FLN)",
                "Tebufenpyrad (TBP)"
            ],
            "true_referents": [
                "(S,S)-hexythiazox",
                "acaricide drug",
                "antibiotic acaricide",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "bridged diphenyl acaricide",
                "butocarboxim",
                "chlorfenvinfos",
                "clofentezine",
                "cyenopyrafen",
                "cyhexatin",
                "dichlofluanid",
                "dichlorvos",
                "dicofol",
                "dicrotophos",
                "dinitrophenol acaricide",
                "disulfiram",
                "disulfoton",
                "esfenvalerate",
                "etoxazole",
                "fenpropathrin",
                "fenvalerate",
                "fipronil",
                "fluacrypyrim",
                "fluazuron",
                "halfenprox",
                "hexythiazox",
                "organochlorine acaricide",
                "phosmet",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "spirobudifen",
                "spirodiclofen",
                "tetradifon",
                "triazophos"
            ],
            "TP": 8,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Abamectin (ABM)",
            "Amitraz (AMT)",
            "Bifenthrin (BIF)",
            "Clofentezine (CLE)",
            "Cypermethrin (CYP)",
            "Deltamethrin (DEL)",
            "Diatomaceous Earth (DE)",
            "Etofenprox (ETP)",
            "Fenpyroximate (FEN)",
            "Flumethrin (FLU)",
            "Gamma-cyhalothrin (GCH)",
            "Hexythiazox (HTX)",
            "Ivermectin (IVM)",
            "Ketoconazole (KTC)",
            "Lambda-cyhalothrin (LCY)",
            "Malathion (MAL)",
            "Methoprene (MTH)",
            "Neem Oil (NEM)",
            "Permethrin (PER)",
            "Phosmet (PHM)",
            "Propargite (PPG)",
            "Sulprofos (SUL)",
            "Tebufenozide (TEB)",
            "Zetacypermethrin (ZCP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Abamectin",
                "Amitraz",
                "Bifenthrin",
                "Clofentezine",
                "Cypermethrin",
                "Flumethrin",
                "Gamma-cyhalothrin",
                "Hexythiazox",
                "Ivermectin",
                "Lambda-cyhalothrin",
                "Malathion",
                "Permethrin",
                "Phosmet",
                "Propargite"
            ],
            "mismatches": [
                "Deltamethrin",
                "Diatomaceous Earth",
                "Etofenprox",
                "Fenpyroximate",
                "Ketoconazole",
                "Methoprene",
                "Neem Oil",
                "Sulprofos",
                "Tebufenozide",
                "Zetacypermethrin"
            ],
            "true_referents": [
                "(-)-trans-permethrin",
                "(S,S)-hexythiazox",
                "abamectin",
                "alpha-cypermethrin",
                "amitraz",
                "azamethiphos",
                "azinphos-ethyl",
                "bifenazate",
                "bifenthrin",
                "carbanolate",
                "chloropropylate",
                "chlorpyrifos-methyl",
                "clofentezine",
                "cyhalothrin",
                "cypermethrin",
                "diafenthiuron",
                "dimethoate",
                "etoxazole",
                "fenpropathrin",
                "fentin hydroxide",
                "fenvalerate",
                "flumethrin",
                "gamma-cyhalothrin",
                "halfenprox",
                "hexythiazox",
                "ivermectin",
                "lambda-cyhalothrin",
                "malathion",
                "methiocarb",
                "methomyl",
                "milbemectin",
                "omethoate",
                "parathion",
                "parathion-methyl",
                "permethrin",
                "phosmet",
                "profenofos",
                "propargite",
                "propoxur",
                "quinomethionate",
                "sulfotep",
                "tetrazine acaricide"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide",
            "Amitraz",
            "Bifenazate",
            "Bifenesate",
            "Carbaryl",
            "Chlorfenapyr",
            "Clofentezine",
            "Cyflumetofen",
            "Cyhexatin",
            "Cypermethrin",
            "Dicofol",
            "Difenoconazole",
            "Dienochlor",
            "Dinotefuran",
            "Fenazaquin",
            "Fenbutatin Oxide",
            "Fenpyroximate",
            "Hexythiazox",
            "Indoxacarb",
            "Methidathion",
            "Methiocarb",
            "Propargite",
            "Pyridaben",
            "Spinosad"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amitraz",
                "Bifenazate",
                "Carbaryl",
                "Chlorfenapyr",
                "Clofentezine",
                "Cyflumetofen",
                "Cyhexatin",
                "Cypermethrin",
                "Dicofol",
                "Fenazaquin",
                "Fenbutatin Oxide",
                "Hexythiazox",
                "Methidathion",
                "Methiocarb",
                "Propargite",
                "Pyridaben"
            ],
            "mismatches": [
                "Acaricide",
                "Bifenesate",
                "Difenoconazole",
                "Dienochlor",
                "Dinotefuran",
                "Fenpyroximate",
                "Indoxacarb",
                "Spinosad"
            ],
            "true_referents": [
                "(S,S)-hexythiazox",
                "4,6-dinitro-o-cresol",
                "DDT",
                "acaricide drug",
                "aldicarb",
                "aminocarb",
                "amitraz",
                "antibiotic acaricide",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "carbanolate",
                "carbaryl",
                "carbofuran",
                "chlorfenapyr",
                "chlorpyrifos",
                "clofentezine",
                "cyflumetofen",
                "cyhexatin",
                "cypermethrin",
                "diafenthiuron",
                "dichlofluanid",
                "dichlorvos",
                "dicofol",
                "esfenvalerate",
                "fenamiphos",
                "fenazaquin",
                "fenbutatin oxide",
                "fenpropathrin",
                "fenthion",
                "fentin hydroxide",
                "fenvalerate",
                "hexythiazox",
                "malaoxon",
                "malathion",
                "methidathion",
                "methiocarb",
                "methomyl",
                "metolcarb",
                "organochlorine acaricide",
                "parathion",
                "permethrin",
                "phosmet",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "pyriminostrobin",
                "spirodiclofen",
                "tetradifon",
                "tetrazine acaricide"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricides (ACR)",
            "Amitraz (AMT)",
            "Abamectin (ABE)",
            "Formetanate (FMT)",
            "Propargite (PRP)",
            "Spirodiclofen (SPD)",
            "Spiromesifen (SPM)",
            "Fenpyroximate (FNP)",
            "Cyflumetofen (CFL)",
            "Diazinon (DIA)",
            "Chlorfenapyr (CFP)",
            "Etoxazole (ETX)",
            "Hexythiazox (HXT)",
            "Milbemectin (MLB)",
            "Fluensulfone (FLS)",
            "Bifenazate (BFN)",
            "Clofentezine (CFT)",
            "Dinobuton (DBN)",
            "Ovex (OVX)",
            "Sulfur (SUL)",
            "Lime Sulfur (LMS)",
            "Neem Oil (NMO)",
            "Rosemary Oil (RMO)",
            "Thyme Oil (TMO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amitraz",
                "Abamectin",
                "Formetanate",
                "Propargite",
                "Spirodiclofen",
                "Cyflumetofen",
                "Diazinon",
                "Chlorfenapyr",
                "Etoxazole",
                "Hexythiazox",
                "Milbemectin",
                "Bifenazate",
                "Clofentezine"
            ],
            "mismatches": [
                "Acaricides (ACR)",
                "Spiromesifen (SPM)",
                "Fenpyroximate (FNP)",
                "Fluensulfone (FLS)",
                "Dinobuton (DBN)",
                "Ovex (OVX)",
                "Sulfur (SUL)",
                "Lime Sulfur (LMS)",
                "Neem Oil (NMO)",
                "Rosemary Oil (RMO)",
                "Thyme Oil (TMO)"
            ],
            "true_referents": [
                "(+)-neoisodihydrocarveol",
                "(-)-neoisodihydrocarveol",
                "(-)-usnic acid",
                "(S,S)-hexythiazox",
                "abamectin",
                "acaricide drug",
                "amitraz",
                "antibiotic acaricide",
                "azinphos-ethyl",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "carbosulfan",
                "chlorfenapyr",
                "clofentezine",
                "cyenopyrafen",
                "cyflumetofen",
                "diazinon",
                "dichlofluanid",
                "dimethoate",
                "disulfoton",
                "endosulfan",
                "esfenvalerate",
                "ethyl oleate",
                "etoxazole",
                "fenamiphos",
                "fenpropathrin",
                "fenvalerate",
                "fipronil",
                "flucythrinate",
                "formetanate",
                "halfenprox",
                "hexythiazox",
                "ivermectin",
                "malaoxon",
                "methomyl",
                "milbemectin",
                "milbemycin acaricide",
                "organochlorine acaricide",
                "parathion",
                "permethrin",
                "phosmet",
                "propargite",
                "propoxur",
                "spirobudifen",
                "spirodiclofen",
                "tetrazine acaricide"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Abamectin",
            "Bifenazate",
            "Clofentezine",
            "Diafenthiuron",
            "Dicofol",
            "Etoxazole",
            "Fenbutatin oxide",
            "Fenpyroximate",
            "Fenazaquin",
            "Hexythiazox",
            "Milbemectin",
            "Spirodiclofen",
            "Spiromesifen",
            "Tebufenpyrad",
            "Propargite",
            "Pyridaben",
            "Tetradifon",
            "Amitraz",
            "Cyflumetofen",
            "Fluvalinate",
            "Flufenoxuron",
            "Bromopropylate",
            "Chlorfenapyr",
            "Acequinocyl"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Abamectin",
                "Bifenazate",
                "Clofentezine",
                "Diafenthiuron",
                "Dicofol",
                "Etoxazole",
                "Fenbutatin oxide",
                "Fenazaquin",
                "Hexythiazox",
                "Milbemectin",
                "Spirodiclofen",
                "Propargite",
                "Pyridaben",
                "Tetradifon",
                "Amitraz",
                "Cyflumetofen",
                "Fluvalinate",
                "Flufenoxuron",
                "Chlorfenapyr",
                "Acequinocyl"
            ],
            "mismatches": [
                "Fenpyroximate",
                "Spiromesifen",
                "Tebufenpyrad",
                "Bromopropylate"
            ],
            "true_referents": [
                "(S,S)-hexythiazox",
                "abamectin",
                "acephate",
                "acequinocyl",
                "acetoprole",
                "amitraz",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "chlorfenapyr",
                "chloropropylate",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "clofentezine",
                "cyflumetofen",
                "diafenthiuron",
                "diafenthiuron-S-oxide",
                "dichlofluanid",
                "dicofol",
                "esfenvalerate",
                "etoxazole",
                "fenamiphos",
                "fenazaquin",
                "fenbutatin oxide",
                "fenpropathrin",
                "fenthion",
                "fentin hydroxide",
                "fenvalerate",
                "fluazuron",
                "flucycloxuron",
                "flufenoxuron",
                "fluvalinate",
                "hexythiazox",
                "ivermectin",
                "milbemectin",
                "milbemycin acaricide",
                "phosmet",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "pyriminostrobin",
                "spirobudifen",
                "spirodiclofen",
                "tetradifon",
                "tetrazine acaricide",
                "triazophos"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide (AC1)",
            "Abamectin (AC2)",
            "Bifenthrin (AC3)",
            "Chlorfenapyr (AC4)",
            "Cyfluthrin (AC5)",
            "Deltamethrin (AC6)",
            "Endosulfan (AC7)",
            "Fenpyroximate (AC8)",
            "Flumethrin (AC9)",
            "Ivermectin (AC10)",
            "Lambdacyhalothrin (AC11)",
            "Malathion (AC12)",
            "Methomyl (AC13)",
            "Omethoate (AC14)",
            "Pyridaben (AC15)",
            "Spinosad (AC16)",
            "Teflubenzuron (AC17)",
            "Thiamethoxam (AC18)",
            "Triazophos (AC19)",
            "Trombidium (AC20)",
            "Valifenalate (AC21)",
            "Zeta-cypermethrin (AC22)",
            "Amitraz (AC23)",
            "Propargite (AC24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Abamectin",
                "Bifenthrin",
                "Chlorfenapyr",
                "Endosulfan",
                "Flumethrin",
                "Ivermectin",
                "Malathion",
                "Methomyl",
                "Omethoate",
                "Pyridaben",
                "Triazophos",
                "Amitraz",
                "Propargite"
            ],
            "mismatches": [
                "Acaricide",
                "Cyfluthrin",
                "Deltamethrin",
                "Fenpyroximate",
                "Lambdacyhalothrin",
                "Spinosad",
                "Teflubenzuron",
                "Thiamethoxam",
                "Trombidium",
                "Valifenalate",
                "Zeta-cypermethrin"
            ],
            "true_referents": [
                "(E)-flucycloxuron",
                "abamectin",
                "acaricide drug",
                "acetoprole",
                "acrinathrin",
                "alpha-cypermethrin",
                "amitraz",
                "antibiotic acaricide",
                "avermectin acaricide",
                "azamethiphos",
                "azinphos-ethyl",
                "benzyl benzoate",
                "bifenazate",
                "bifenthrin",
                "carbosulfan",
                "chlorfenapyr",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "cyflumetofen",
                "cyhalothrin",
                "cypermethrin",
                "dimethoate",
                "endosulfan",
                "esfenvalerate",
                "etoxazole",
                "fenamiphos",
                "fenpropathrin",
                "fenvalerate",
                "fluazuron",
                "flumethrin",
                "formetanate",
                "gamma-cyhalothrin",
                "ivermectin",
                "lambda-cyhalothrin",
                "malathion",
                "methiocarb",
                "methomyl",
                "metolcarb",
                "milbemectin",
                "omethoate",
                "organochlorine acaricide",
                "parathion",
                "parathion-methyl",
                "permethrin",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidinamine acaricide",
                "tetrazine acaricide",
                "thiometon",
                "tralopyril",
                "triazophos"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide",
            "Deltamethrin (DM)",
            "Fenpyroximate (FP)",
            "Propargite (PR)",
            "Pyridaben (PY)",
            "Hexythiazox (HX)",
            "Bifenazate (BF)",
            "Acequinocyl (AQ)",
            "Spinosad (SP)",
            "Indoxacarb (IX)",
            "Abamectin (AB)",
            "Fenbutatin oxide (FO)",
            "Chlorfenapyr (CF)",
            "Fluazuron (FZ)",
            "Milbemectin (MB)",
            "Pyriproxyfen (PP)",
            "Cyflumetofen (CFM)",
            "Clofentezine (CZ)",
            "Flufenoxuron (FFX)",
            "Etoxazole (EX)",
            "Fenazaquin (FQ)",
            "Diflubenzuron (DFB)",
            "Hexaflumuron (HF)",
            "Tebufenozide (TBZ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Propargite",
                "Pyridaben",
                "Hexythiazox",
                "Bifenazate",
                "Acequinocyl",
                "Abamectin",
                "Fenbutatin oxide",
                "Chlorfenapyr",
                "Fluazuron",
                "Milbemectin",
                "Cyflumetofen",
                "Clofentezine",
                "Flufenoxuron",
                "Etoxazole",
                "Fenazaquin"
            ],
            "mismatches": [
                "Acaricide",
                "Deltamethrin (DM)",
                "Fenpyroximate (FP)",
                "Spinosad (SP)",
                "Indoxacarb (IX)",
                "Pyriproxyfen (PP)",
                "Diflubenzuron (DFB)",
                "Hexaflumuron (HF)",
                "Tebufenozide (TBZ)"
            ],
            "true_referents": [
                "(E)-flucycloxuron",
                "(S,S)-hexythiazox",
                "DDT",
                "abamectin",
                "acaricide drug",
                "acephate",
                "acequinocyl",
                "acetoprole",
                "aldicarb",
                "aminocarb",
                "antibiotic acaricide",
                "bifenazate",
                "bifenthrin",
                "chlorfenapyr",
                "chlorpyrifos",
                "clofentezine",
                "cyenopyrafen",
                "cyflumetofen",
                "dichlofluanid",
                "dimethoate",
                "esfenvalerate",
                "etoxazole",
                "fenamiphos",
                "fenazaquin",
                "fenbutatin oxide",
                "fenpropathrin",
                "fentin hydroxide",
                "fenvalerate",
                "fipronil",
                "fluazuron",
                "flucycloxuron",
                "flufenoxuron",
                "flumethrin",
                "hexythiazox",
                "ivermectin",
                "metolcarb",
                "milbemectin",
                "milbemycin acaricide",
                "organochlorine acaricide",
                "phosmet",
                "propargite",
                "propoxur",
                "pyflubumide",
                "pyridaben",
                "thioquinox"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Insecticide (I001)",
            "Miticide (M001)",
            "Acaricide (A001)",
            "Tick repellent (T001)",
            "Mite control spray (MCS001)",
            "Spider mite killer (SMK001)",
            "Pesticide (P001)",
            "Nematicide (N001)",
            "Insecticidal soap (IS001)",
            "Organophosphate (O001)",
            "Pyrethroid (P002)",
            "Carbamate (C001)",
            "Neonicotinoid (N002)",
            "Chlorinated hydrocarbon (CH001)",
            "Botanical insecticide (BI001)",
            "Fungicide (F001)",
            "Rodenticide (R001)",
            "Herbicide (H001)",
            "Biological control agent (BCA001)",
            "Insect growth regulator (IGR001)",
            "Chemical control agent (CCA001)",
            "Insect trap (IT001)",
            "Fumigant (F002)",
            "Insect repellent (IR001)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Insecticide (I001)",
                "Miticide (M001)",
                "Acaricide (A001)",
                "Tick repellent (T001)",
                "Mite control spray (MCS001)",
                "Spider mite killer (SMK001)",
                "Pesticide (P001)",
                "Nematicide (N001)",
                "Insecticidal soap (IS001)",
                "Organophosphate (O001)",
                "Pyrethroid (P002)",
                "Carbamate (C001)",
                "Neonicotinoid (N002)",
                "Chlorinated hydrocarbon (CH001)",
                "Botanical insecticide (BI001)",
                "Fungicide (F001)",
                "Rodenticide (R001)",
                "Herbicide (H001)",
                "Biological control agent (BCA001)",
                "Insect growth regulator (IGR001)",
                "Chemical control agent (CCA001)",
                "Insect trap (IT001)",
                "Fumigant (F002)",
                "Insect repellent (IR001)"
            ],
            "true_referents": [
                "abamectin",
                "acaricide drug",
                "aminocarb",
                "antibiotic acaricide",
                "carbanolate",
                "carbaryl",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "cypermethrin",
                "dinitrophenol acaricide",
                "hexachlorophene",
                "malathion",
                "mite growth regulator",
                "organochlorine acaricide",
                "organofluorine acaricide",
                "organonitrogen acaricide",
                "organotin acaricide",
                "parathion-methyl",
                "permethrin",
                "scabicide"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Amitraz",
            "Permethrin",
            "Fipronil",
            "Ivermectin",
            "Pyrethrin",
            "Cypermethrin",
            "Benzyl benzoate",
            "Deltamethrin",
            "Sulfur",
            "Malathion",
            "Abamectin",
            "Fenvalerate",
            "Propargite",
            "Spirodiclofen",
            "Chlorpyrifos",
            "Dicofol",
            "Bifenazate",
            "Horticultural oil",
            "Neem oil",
            "Eucalyptus oil",
            "Pyriproxyfen",
            "Thymol",
            "Sulfoxaflor",
            "Metarhizium anisopliae"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amitraz",
                "Permethrin",
                "Fipronil",
                "Ivermectin",
                "Cypermethrin",
                "Benzyl benzoate",
                "Malathion",
                "Abamectin",
                "Fenvalerate",
                "Propargite",
                "Spirodiclofen",
                "Chlorpyrifos",
                "Dicofol",
                "Bifenazate"
            ],
            "mismatches": [
                "Pyrethrin",
                "Deltamethrin",
                "Sulfur",
                "Horticultural oil",
                "Neem oil",
                "Eucalyptus oil",
                "Pyriproxyfen",
                "Thymol",
                "Sulfoxaflor",
                "Metarhizium anisopliae"
            ],
            "true_referents": [
                "(-)-neoisodihydrocarveol",
                "(-)-usnic acid",
                "(S,S)-hexythiazox",
                "abamectin",
                "amitraz",
                "azinphos-ethyl",
                "benzyl benzoate",
                "bifenazate",
                "bifenthrin",
                "carbofuran",
                "chlorfenapyr",
                "chloropropylate",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "cypermethrin",
                "dichlofluanid",
                "dicofol",
                "esfenvalerate",
                "ethyl oleate",
                "fenazaquin",
                "fenbutatin oxide",
                "fenitrothion",
                "fenvalerate",
                "fipronil",
                "flumethrin",
                "ivermectin",
                "malathion",
                "methomyl",
                "milbemectin",
                "parathion",
                "parathion-methyl",
                "permethrin",
                "phosmet",
                "propargite",
                "propoxur",
                "pyrimidifen",
                "spirobudifen",
                "spirodiclofen",
                "sulfluramid",
                "sulfotep",
                "tetradifon",
                "tetrazine acaricide"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Abamectin (ABM)",
            "Acequinocyl",
            "Amitraz",
            "Bifenazate",
            "Bromopropylate",
            "Chlorfenapyr",
            "Clofentezine",
            "Cyflumetofen",
            "Dicofol",
            "Etoxazole",
            "Fenazaquin",
            "Fenpyroximate",
            "Hexythiazox",
            "Ivermectin",
            "Milbemectin",
            "Propargite",
            "Pyridaben",
            "Spirodiclofen",
            "Spiromesifen",
            "Sulfur",
            "Tebufenpyrad",
            "Tetradifon",
            "Lime sulfur",
            "Diatomaceous earth"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Abamectin (ABM)",
                "Acequinocyl",
                "Amitraz",
                "Bifenazate",
                "Chlorfenapyr",
                "Clofentezine",
                "Cyflumetofen",
                "Dicofol",
                "Etoxazole",
                "Fenazaquin",
                "Hexythiazox",
                "Ivermectin",
                "Milbemectin",
                "Propargite",
                "Pyridaben",
                "Spirodiclofen",
                "Tetradifon"
            ],
            "mismatches": [
                "Bromopropylate",
                "Fenpyroximate",
                "Spiromesifen",
                "Sulfur",
                "Tebufenpyrad",
                "Lime sulfur",
                "Diatomaceous earth"
            ],
            "true_referents": [
                "(-)-usnic acid",
                "(S,S)-hexythiazox",
                "abamectin",
                "acephate",
                "acequinocyl",
                "acetoprole",
                "amitraz",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "chlorfenapyr",
                "chloropropylate",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "clofentezine",
                "cyflumetofen",
                "dichlofluanid",
                "dicofol",
                "esfenvalerate",
                "etoxazole",
                "fenamiphos",
                "fenazaquin",
                "fenbutatin oxide",
                "fenpropathrin",
                "fenthion",
                "fentin hydroxide",
                "fenvalerate",
                "fluazuron",
                "hexythiazox",
                "ivermectin",
                "milbemectin",
                "milbemycin acaricide",
                "permethrin",
                "phosmet",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "pyriminostrobin",
                "spirobudifen",
                "spirodiclofen",
                "tetradifon",
                "tetrazine acaricide",
                "triazophos"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Abamectin (ABM)",
            "Amitraz",
            "Benzyl benzoate",
            "Bifenazate",
            "Bifenthrin",
            "Bromopropylate",
            "Chlorfenapyr",
            "Clofentezine",
            "Dicofol",
            "Etoxazole",
            "Fenazaquin",
            "Fenpyroximate",
            "Hexythiazox",
            "Ivermectin",
            "Lindane",
            "Malathion",
            "Milbemectin",
            "Permethrin",
            "Propargite",
            "Pyridaben",
            "Spirodiclofen",
            "Spiromesifen",
            "Tebufenpyrad",
            "Tetradifon"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Abamectin",
                "Amitraz",
                "Benzyl benzoate",
                "Bifenazate",
                "Bifenthrin",
                "Chlorfenapyr",
                "Clofentezine",
                "Dicofol",
                "Etoxazole",
                "Fenazaquin",
                "Hexythiazox",
                "Ivermectin",
                "Malathion",
                "Milbemectin",
                "Permethrin",
                "Propargite",
                "Pyridaben",
                "Spirodiclofen",
                "Tetradifon"
            ],
            "mismatches": [
                "Bromopropylate",
                "Fenpyroximate",
                "Lindane",
                "Spiromesifen",
                "Tebufenpyrad"
            ],
            "true_referents": [
                "(S,S)-hexythiazox",
                "abamectin",
                "acrinathrin",
                "amitraz",
                "benzyl benzoate",
                "bifenazate",
                "bifenthrin",
                "chlorfenapyr",
                "chloropropylate",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "clofentezine",
                "cypermethrin",
                "dichlofluanid",
                "dicofol",
                "esfenvalerate",
                "ethyl oleate",
                "etoxazole",
                "fenamiphos",
                "fenazaquin",
                "fenbutatin oxide",
                "fenpropathrin",
                "fenthion",
                "fentin hydroxide",
                "fenvalerate",
                "fluazuron",
                "hexythiazox",
                "ivermectin",
                "malathion",
                "milbemectin",
                "milbemycin acaricide",
                "parathion",
                "parathion-methyl",
                "permethrin",
                "phosmet",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "pyriminostrobin",
                "spirobudifen",
                "spirodiclofen",
                "tetradifon",
                "tetrazine acaricide",
                "triazophos"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Bifenazate (BIF)",
            "Spirodiclofen (SPI)",
            "Etoxazole (ETO)",
            "Clofentezine (CLF)",
            "Hexythiazox (HEX)",
            "Fenpyroximate (FEN)",
            "Pyridaben (PYR)",
            "Tebufenpyrad (TEB)",
            "Fenazaquin (FEN)",
            "Cyflumetofen (CYF)",
            "Acequinocyl (ACE)",
            "Fluacrypyrim (FLU)",
            "Cyenopyrafen (CYE)",
            "Pyridalyl (PYR)",
            "Chlorfenapyr (CFP)",
            "Fenbutatin oxide (FBO)",
            "Propargite (PRO)",
            "Spiromesifen (SPI)",
            "Spirotetramat (SPI)",
            "Milbemectin (MIL)",
            "Abamectin (ABA)",
            "Emamectin benzoate (EMB)",
            "Ivermectin (IVE)",
            "Doramectin (DOR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bifenazate (BIF)",
                "Spirodiclofen (SPI)",
                "Etoxazole (ETO)",
                "Clofentezine (CLF)",
                "Hexythiazox (HEX)",
                "Pyridaben (PYR)",
                "Fenazaquin (FEN)",
                "Cyflumetofen (CYF)",
                "Acequinocyl (ACE)",
                "Fluacrypyrim (FLU)",
                "Cyenopyrafen (CYE)",
                "Chlorfenapyr (CFP)",
                "Fenbutatin oxide (FBO)",
                "Propargite (PRO)",
                "Milbemectin (MIL)",
                "Abamectin (ABA)",
                "Ivermectin (IVE)"
            ],
            "mismatches": [
                "Fenpyroximate (FEN)",
                "Tebufenpyrad (TEB)",
                "Pyridalyl (PYR)",
                "Spiromesifen (SPI)",
                "Spirotetramat (SPI)",
                "Emamectin benzoate (EMB)",
                "Doramectin (DOR)"
            ],
            "true_referents": [
                "(-)-neodihydrocarveol",
                "(S,S)-hexythiazox",
                "abamectin",
                "acephate",
                "acequinocyl",
                "acetoprole",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "carbaryl",
                "chlorfenapyr",
                "clofentezine",
                "cyenopyrafen",
                "cyflumetofen",
                "eprinomectin",
                "etoxazole",
                "fenazaquin",
                "fenbutatin oxide",
                "fenitrothion",
                "fenpropathrin",
                "fenthion",
                "fentin hydroxide",
                "fenvalerate",
                "fluacrypyrim",
                "flucythrinate",
                "hexythiazox",
                "ivermectin",
                "milbemectin",
                "milbemycin acaricide",
                "proacaricide",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "spirobudifen",
                "spirodiclofen",
                "tetradifon",
                "thiometon"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide (AC)",
            "Acarcide (ACR)",
            "Acariticide (ACT)",
            "Acaricide compound (ACC)",
            "Acaricidal agent (ACA)",
            "Acaricidal substance (ACS)",
            "Acarine pesticide (ACP)",
            "Acarus killer (ACK)",
            "Mite control agent (MCA)",
            "Mite exterminator (MEX)",
            "Mite killer (MKR)",
            "Mite poison (MPO)",
            "Miticide (MIT)",
            "Miticide compound (MTC)",
            "Miticide substance (MTS)",
            "Mite control chemical (MCC)",
            "Mite eradication agent (MEA)",
            "Mite exterminating substance (MES)",
            "Mite killing agent (MKA)",
            "Mite pesticide (MPE)",
            "Mite repellent (MRE)",
            "Mite toxicant (MTO)",
            "Tick control agent (TCA)",
            "Tick killer (TKR)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "Acaricide (AC)",
                "Acarcide (ACR)",
                "Acariticide (ACT)",
                "Acaricide compound (ACC)",
                "Acaricidal agent (ACA)",
                "Acaricidal substance (ACS)",
                "Acarine pesticide (ACP)",
                "Acarus killer (ACK)",
                "Mite control agent (MCA)",
                "Mite exterminator (MEX)",
                "Mite killer (MKR)",
                "Mite poison (MPO)",
                "Miticide (MIT)",
                "Miticide compound (MTC)",
                "Miticide substance (MTS)",
                "Mite control chemical (MCC)",
                "Mite eradication agent (MEA)",
                "Mite exterminating substance (MES)",
                "Mite killing agent (MKA)",
                "Mite pesticide (MPE)",
                "Mite repellent (MRE)",
                "Mite toxicant (MTO)",
                "Tick control agent (TCA)",
                "Tick killer (TKR)"
            ],
            "true_referents": [
                "DDT",
                "abamectin",
                "acaricide drug",
                "antibiotic acaricide",
                "avermectin acaricide",
                "chlorpyrifos-methyl",
                "malathion",
                "milbemycin acaricide",
                "mite growth regulator",
                "organochlorine acaricide",
                "organonitrogen acaricide",
                "organosulfur acaricide",
                "organotin acaricide",
                "parathion",
                "parathion-methyl",
                "permethrin",
                "pyrethroid ether acaricide",
                "scabicide"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide (Acaricide)",
            "Acarosan",
            "Amitraz",
            "Benzyl benzoate",
            "Coumaphos",
            "Deltamethrin",
            "Dicofol",
            "Fipronil",
            "Hydrogen peroxide",
            "Ivermectin",
            "Lindane",
            "Malathion",
            "Methoprene",
            "Methoxychlor",
            "Nitenpyram",
            "Permethrin",
            "Phoxim",
            "Pyrethrin",
            "Pyriproxyfen",
            "Resmethrin",
            "Roubaixine",
            "Sulfluramid",
            "Tetramethrin",
            "Tralomethrin",
            "Vamidothion"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Amitraz",
                "Benzyl benzoate",
                "Coumaphos",
                "Dicofol",
                "Fipronil",
                "Ivermectin",
                "Malathion",
                "Permethrin",
                "Sulfluramid"
            ],
            "mismatches": [
                "Acaricide (Acaricide)",
                "Acarosan",
                "Deltamethrin",
                "Hydrogen peroxide",
                "Lindane",
                "Methoprene",
                "Methoxychlor",
                "Nitenpyram",
                "Phoxim",
                "Pyrethrin",
                "Pyriproxyfen",
                "Resmethrin",
                "Roubaixine",
                "Tetramethrin",
                "Tralomethrin",
                "Vamidothion"
            ],
            "true_referents": [
                "(E)-flucycloxuron",
                "abamectin",
                "acaricide drug",
                "amitraz",
                "antibiotic acaricide",
                "benzyl benzoate",
                "bisulflufen",
                "butocarboxim",
                "chlorfenapyr",
                "chloropropylate",
                "chlorpyrifos",
                "chlorpyrifos-methyl",
                "coumaphos",
                "cyenopyrafen",
                "cypermethrin",
                "dichlofluanid",
                "dicofol",
                "disulfiram",
                "ethyl oleate",
                "fenazaquin",
                "fenitrothion",
                "fipronil",
                "fluacrypyrim",
                "flumethrin",
                "hexachlorophene",
                "ivermectin",
                "malaoxon",
                "malathion",
                "methamidophos",
                "methomyl",
                "milbemectin",
                "organochlorine acaricide",
                "organosulfur acaricide",
                "organotin acaricide",
                "parathion",
                "parathion-methyl",
                "permethrin",
                "propoxur",
                "pyrimidifen",
                "sulfluramid",
                "temephos",
                "tetradifon",
                "tetrazine acaricide",
                "toxaphene",
                "triarathene"
            ],
            "TP": 9,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "acaricide",
        "domain": "medicine",
        "response": [
            "Acaricide (ACR)",
            "Hexythiazox (HTZ)",
            "Bifenazate (BZF)",
            "Cyflumetofen (CYF)",
            "Pyridaben (PYR)",
            "Tebufenpyrad (TBP)",
            "Fenazaquin (FNZ)",
            "Pyriproxyfen (PYP)",
            "Chlorfenapyr (CFP)",
            "Flufenoxuron (FFU)",
            "Fluacrypyrim (FLP)",
            "Ethion (ETH)",
            "Propargite (PRP)",
            "Chlorobenzilate (CBL)",
            "Amitraz (AMT)",
            "Bromopropylate (BRL)",
            "Cypermethrin (CYP)",
            "Deltamethrin (DLM)",
            "Permethrin (PMN)",
            "Phenothrin (PHT)",
            "Allethrin (ALH)",
            "Piperonyl butoxide (PBO)",
            "Rotenone (RTN)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hexythiazox",
                "Bifenazate",
                "Cyflumetofen",
                "Pyridaben",
                "Fenazaquin",
                "Chlorfenapyr",
                "Flufenoxuron",
                "Fluacrypyrim",
                "Ethion",
                "Propargite",
                "Amitraz",
                "Cypermethrin",
                "Permethrin"
            ],
            "mismatches": [
                "Acaricide",
                "Tebufenpyrad",
                "Pyriproxyfen",
                "Chlorobenzilate",
                "Bromopropylate",
                "Deltamethrin",
                "Phenothrin",
                "Allethrin",
                "Piperonyl butoxide",
                "Rotenone"
            ],
            "true_referents": [
                "(-)-trans-permethrin",
                "(E)-flucycloxuron",
                "(S,S)-hexythiazox",
                "(Z)-flucycloxuron",
                "acaricide drug",
                "acrinathrin",
                "alpha-cypermethrin",
                "amitraz",
                "antibiotic acaricide",
                "benzyl benzoate",
                "bifenazate",
                "bifenthrin",
                "bisulflufen",
                "butocarboxim",
                "chlorfenapyr",
                "chloropropylate",
                "chlorpyrifos-methyl",
                "cyenopyrafen",
                "cyflumetofen",
                "cyhalothrin",
                "cypermethrin",
                "diafenthiuron",
                "diafenthiuron-S-oxide",
                "esfenvalerate",
                "ethion",
                "etoxazole",
                "fenazaquin",
                "fenpropathrin",
                "fenthion",
                "fenvalerate",
                "fluacrypyrim",
                "flucycloxuron",
                "flucythrinate",
                "flufenoxuron",
                "flumethrin",
                "hexythiazox",
                "lambda-cyhalothrin",
                "organochlorine acaricide",
                "parathion",
                "permethrin",
                "phosmet",
                "propargite",
                "propoxur",
                "pyridaben",
                "pyrimidifen",
                "tetrazine acaricide"
            ],
            "TP": 13,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "acaricide",
        "domain": "medicine",
        "response": "[\n        {\n            \"referent\": \"pyrethrin\" (PYRE),\n            \"canonical name\": \"pyrethrin\"\n        },\n        {\n            \"referent\": \"deltamethrin\" (DELT),\n            \"canonical name\": \"deltamethrin\"\n        },\n        {\n            \"referent\": \"cyfluthrin\" (CYFL),\n            \"canonical name\": \"cyfluthrin\"\n        },\n        {\n            \"referent\": \"permethrin\" (PERM),\n            \"canonical name\": \"permethrin\"\n        }\n    ]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]