[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "sulfanilamide (SAN)",
            "sulfacetamide (SAC)",
            "sodium sulfacetamide",
            "procainamide hydrochloride",
            "benzathine penicillin G",
            "sulfamethoxazole (SMX)",
            "trimethoprim-sulfamethoxazole",
            "acetazolamide",
            "methazolamide",
            "sulfadiazine",
            "sulfisoxazole",
            "sulfamethoxypyridazine",
            "sulfadoxine",
            "sulfamerazine",
            "sulfamethizole",
            "sulfasalazine",
            "dapsone",
            "sulfisomidine",
            "sulfamonomethoxine",
            "sulfametrole",
            "sulfadimidine",
            "sulfamethazine",
            "sulfamethoxazole-trimethoprim",
            "sulfamethoxazole"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "sulfanilamide (SAN)",
                "sulfacetamide (SAC)",
                "sulfamethoxazole (SMX)",
                "acetazolamide",
                "methazolamide",
                "sulfadiazine",
                "sulfisoxazole",
                "sulfamethoxypyridazine",
                "sulfadoxine",
                "sulfamerazine",
                "sulfamethizole",
                "sulfasalazine",
                "sulfisomidine",
                "sulfamonomethoxine",
                "sulfametrole",
                "sulfamethazine",
                "sulfamethoxazole"
            ],
            "mismatches": [
                "sodium sulfacetamide",
                "procainamide hydrochloride",
                "benzathine penicillin G",
                "trimethoprim-sulfamethoxazole",
                "dapsone",
                "sulfadimidine",
                "sulfamethoxazole-trimethoprim"
            ],
            "true_referents": [
                "(R)-bendroflumethiazide",
                "(S)-bendroflumethiazide",
                "4-sulfanilamidobenzoic acid",
                "Methazolamide",
                "Sulfamonomethoxine",
                "Sulfamoyldapsone",
                "acetazolamide",
                "benzthiazide",
                "brinzolamide",
                "diclofenamide",
                "furosemide",
                "hydrochlorothiazide",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfametrole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfasalazine",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfonamide (Sulfamethoxazole)",
            "Sulfonamide (Sulfadiazine)",
            "Sulfonamide (Sulfapyridine)",
            "Sulfonamide (Sulfamethoxypyridazine)",
            "Sulfonamide (Sulfisoxazole)",
            "Sulfonamide (Sulfacetamide)",
            "Sulfonamide (Sulfamethoxazole-trimethoprim)",
            "Sulfonamide (Mafenide)",
            "Sulfonamide (Silver Sulfadiazine)",
            "Sulfonamide (Sulfadoxine)",
            "Sulfonamide (Trimethoprim)",
            "Sulfonamide (Dapsone)",
            "Sulfonamide (Sulfamethazine)",
            "Sulfonamide (Sulfamerazine)",
            "Sulfonamide (Sulfathiazole)",
            "Sulfonamide (Sulfadimethoxine)",
            "Sulfonamide (Sulfachloropyridazine)",
            "Sulfonamide (Sulfamonomethoxine)",
            "Sulfonamide (Sulfisoxazole)",
            "Sulfonamide (Sulfacetamide sodium)",
            "Sulfonamide (Sulfamethoxypyridazine)",
            "Sulfonamide (Sulfamethoxazole)",
            "Sulfonamide (Sulfadimidine)",
            "Sulfonamide (Sulfamethizole)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfapyridine",
                "Sulfisoxazole",
                "Sulfacetamide",
                "Sulfadoxine",
                "Sulfamethazine",
                "Sulfamerazine",
                "Sulfathiazole",
                "Sulfadimethoxine",
                "Sulfachloropyridazine",
                "Sulfamethizole"
            ],
            "mismatches": [
                "Sulfamethoxypyridazine",
                "Sulfamethoxazole-trimethoprim",
                "Mafenide",
                "Silver Sulfadiazine",
                "Trimethoprim",
                "Dapsone",
                "Sulfamonomethoxine",
                "Sulfacetamide sodium",
                "Sulfadimidine"
            ],
            "true_referents": [
                "Sulfamoyldapsone",
                "dapoxyl (2-aminoethyl)sulfonamide",
                "sulfabenzamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamoxole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisoxazole",
                "sulfonamide antibiotic"
            ],
            "TP": 12,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Methanesulfonamide",
            "Ethanesulfonamide",
            "Benzenesulfonamide",
            "Toluenesulfonamide",
            "p-Toluenesulfonamide",
            "Phenylmethanesulfonamide",
            "p-Nitrobenzenesulfonamide",
            "o-Nitrobenzenesulfonamide",
            "m-Nitrobenzenesulfonamide",
            "2-Naphthalenesulfonamide",
            "1-Naphthalenesulfonamide",
            "4-Chlorobenzenesulfonamide",
            "4-Bromobenzenesulfonamide",
            "4-Fluorobenzenesulfonamide",
            "4-Iodobenzenulfonamide",
            "4-Methoxybenzenesulfonamide",
            "4-Hydroxybenzenesulfonamide",
            "4-Methylbenzenesulfonamide",
            "4-Ethylbenzenesulfonamide",
            "4-Propylbenzenesulfonamide",
            "4-Butylbenzenesulfonamide",
            "4-Pentylbenzenesulfonamide",
            "4-Hexylbenzenesulfonamide",
            "4-Heptylbenzenesulfonamide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzenesulfonamide",
                "4-Chlorobenzenesulfonamide"
            ],
            "mismatches": [
                "Methanesulfonamide",
                "Ethanesulfonamide",
                "Toluenesulfonamide",
                "p-Toluenesulfonamide",
                "Phenylmethanesulfonamide",
                "p-Nitrobenzenesulfonamide",
                "o-Nitrobenzenesulfonamide",
                "m-Nitrobenzenesulfonamide",
                "2-Naphthalenesulfonamide",
                "1-Naphthalenesulfonamide",
                "4-Bromobenzenesulfonamide",
                "4-Fluorobenzenesulfonamide",
                "4-Iodobenzenulfonamide",
                "4-Methoxybenzenesulfonamide",
                "4-Hydroxybenzenesulfonamide",
                "4-Methylbenzenesulfonamide",
                "4-Ethylbenzenesulfonamide",
                "4-Propylbenzenesulfonamide",
                "4-Butylbenzenesulfonamide",
                "4-Pentylbenzenesulfonamide",
                "4-Hexylbenzenesulfonamide",
                "4-Heptylbenzenesulfonamide"
            ],
            "true_referents": [
                "2,4-Difluorobenzenesulfonamide",
                "2,6-difluorobenzenesulfonamide",
                "2-aminobenzenesulfonamide",
                "2-bromo-N-(phenylmethyl)benzenesulfonamide",
                "3,4-Dichlorobenzenesulfonamide",
                "3,5-difluorobenzenesulfonamide",
                "4-(2-AMINOETHYL)BENZENESULFONAMIDE",
                "4-Methoxybenzenesulfonohydrazide",
                "4-bromo-N-(cinnamylideneamino)benzenesulfonamide",
                "4-chlorobenzenesulfonamide",
                "4-hydroxy-N,N-dimethylbenzenesulfonamide",
                "4-methyl-N-(5,6,7,8-tetrahydronaphthalen-1-yl)benzenesulfonamide",
                "4-methyl-N-(phenylmethyl)benzenesulfonamide",
                "4-nitrosobenzenesulfonamide",
                "5-(dimethylamino)-N-(4-aminobenzyl)naphthalene-1-sulfonamide",
                "Benzenesulfonamide",
                "N,4-dimethyl-N-nitrosobenzenesulfonamide",
                "N-(4-chlorophenyl)methanesulfonamide",
                "N-(4-phenylmethoxyphenyl)methanesulfonamide",
                "N-Carbamoyl-4-chlorobenzenesulfonamide",
                "N-[3-(4-methyl-1-piperidinyl)-1,4-dioxo-2-naphthalenyl]benzenesulfonamide",
                "N-[4-(methanesulfonamido)phenyl]acetamide",
                "N-butylbenzenesulfonamide",
                "N1,N1,4-trimethylbenzene-1-sulfonamide",
                "piperidinesulfonamide",
                "pyridinesulfonamide",
                "toluene-4-sulfonamide"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SULF)",
            "Toluenesulfonamide (TSA)",
            "p-Chlorobenzenesulfonamide (CBSA)",
            "N,N-Dimethylsulfamide (DMS)",
            "N-Ethylbenzenesulfonamide (EBSA)",
            "N-Cyclohexylbenzenesulfonamide (CBS)",
            "Methanesulfonamide (MSA)",
            "Ethanesulfonamide (ESA)",
            "2,4-Dichlorobenzenesulfonamide (DCBSA)",
            "3-Sulfopropanamide (SPA)",
            "N-Methyl-p-toluenesulfonamide (MTS)",
            "N-Phenylbenzenesulfonamide (PBS)",
            "N,N-Diethylsulfamide (DES)",
            "N-Isopropylbenzenesulfonamide (IBSA)",
            "N-tert-Butylbenzenesulfonamide (TBSA)",
            "N-Hydroxyethanesulfonamide (HESA)",
            "N-Methylmethanesulfonamide (MMSA)",
            "N-Ethylmethanesulfonamide (EMSA)",
            "N,N-Dimethyl-p-toluenesulfonamide (DMTS)",
            "N-Acetylsulfanilamide (NASA)",
            "N-Formylsulfanilamide (NFSA)",
            "N-Propylbenzenesulfonamide (PBSA)",
            "N-Butylbenzenesulfonamide (BBSA)",
            "N-Hexylbenzenesulfonamide (HBSA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SULF)",
                "N-Butylbenzenesulfonamide (BBSA)"
            ],
            "mismatches": [
                "Toluenesulfonamide (TSA)",
                "p-Chlorobenzenesulfonamide (CBSA)",
                "N,N-Dimethylsulfamide (DMS)",
                "N-Ethylbenzenesulfonamide (EBSA)",
                "N-Cyclohexylbenzenesulfonamide (CBS)",
                "Methanesulfonamide (MSA)",
                "Ethanesulfonamide (ESA)",
                "2,4-Dichlorobenzenesulfonamide (DCBSA)",
                "3-Sulfopropanamide (SPA)",
                "N-Methyl-p-toluenesulfonamide (MTS)",
                "N-Phenylbenzenesulfonamide (PBS)",
                "N,N-Diethylsulfamide (DES)",
                "N-Isopropylbenzenesulfonamide (IBSA)",
                "N-tert-Butylbenzenesulfonamide (TBSA)",
                "N-Hydroxyethanesulfonamide (HESA)",
                "N-Methylmethanesulfonamide (MMSA)",
                "N-Ethylmethanesulfonamide (EMSA)",
                "N,N-Dimethyl-p-toluenesulfonamide (DMTS)",
                "N-Acetylsulfanilamide (NASA)",
                "N-Formylsulfanilamide (NFSA)",
                "N-Propylbenzenesulfonamide (PBSA)",
                "N-Hexylbenzenesulfonamide (HBSA)"
            ],
            "true_referents": [
                "2-aminobenzenesulfonamide",
                "2-oxoethane-1-sulfonamide",
                "3,4-Dichlorobenzenesulfonamide",
                "4-(2-AMINOETHYL)BENZENESULFONAMIDE",
                "4-[[(4-acetamidophenyl)sulfonylamino]methyl]-N-(3-methoxypropyl)benzamide",
                "4-[[(4-methoxyphenyl)sulfonylamino]methyl]-N-[2-[methyl-(phenylmethyl)amino]ethyl]benzamide",
                "4-chlorobenzenesulfonamide",
                "4-hydroxy-N,N-dimethylbenzenesulfonamide",
                "4-methyl-N-(phenylmethyl)benzenesulfonamide",
                "4-nitrosobenzenesulfonamide",
                "4-sulfanilamidobenzoic acid",
                "Benzenesulfonamide",
                "N,4-dimethyl-N-(4-methylphenyl)benzenesulfonamide",
                "N,4-dimethyl-N-nitrosobenzenesulfonamide",
                "N-(4-chlorophenyl)methanesulfonamide",
                "N-(4-phenylmethoxyphenyl)methanesulfonamide",
                "N-Carbamoyl-4-chlorobenzenesulfonamide",
                "N-[4-(methanesulfonamido)phenyl]acetamide",
                "N-butylbenzenesulfonamide",
                "N-cyclooctyl-4-methylbenzenesulfonamide",
                "N-cyclopropyl-4-methylbenzenesulfonamide",
                "N1,N1-diethyl-4-methylbenzene-1-sulfonamide",
                "N1,N4-Diacetylsulfanilamide",
                "N4-Acetylsulfadoxine",
                "N4-Acetylsulfapyridine",
                "benzene-1-3-disulfonamide",
                "disulfamide",
                "formylsulfamethin",
                "sulfanilamide",
                "sulfonamide antibiotic",
                "toluene-4-sulfonamide"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Methanesulfonamide (MSA)",
            "Tosylamide (TsNH2)",
            "Benzenesulfonamide",
            "N-Methylbenzenesulfonamide",
            "N-Ethylbenzenesulfonamide",
            "N-Phenylbenzenesulfonamide",
            "N,N-Dimethylbenzenesulfonamide",
            "N,N-Diethylbenzenesulfonamide",
            "N-Methylmethanesulfonamide",
            "N-Ethylmethanesulfonamide",
            "N-Phenylmethanesulfonamide",
            "N,N-Dimethylmethanesulfonamide",
            "N,N-Diethylmethanesulfonamide",
            "N-Methylp-toluenesulfonamide",
            "N-Ethylp-toluenesulfonamide",
            "N-Phenylp-toluenesulfonamide",
            "N,N-Dimethylp-toluenesulfonamide",
            "N,N-Diethylp-toluenesulfonamide",
            "Mesylamide",
            "N-Methylmesylamide",
            "N-Ethylmesylamide",
            "N-Phenylmesylamide",
            "N,N-Dimethylmesylamide",
            "N,N-Diethylmesylamide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzenesulfonamide"
            ],
            "mismatches": [
                "Methanesulfonamide (MSA)",
                "Tosylamide (TsNH2)",
                "N-Methylbenzenesulfonamide",
                "N-Ethylbenzenesulfonamide",
                "N-Phenylbenzenesulfonamide",
                "N,N-Dimethylbenzenesulfonamide",
                "N,N-Diethylbenzenesulfonamide",
                "N-Methylmethanesulfonamide",
                "N-Ethylmethanesulfonamide",
                "N-Phenylmethanesulfonamide",
                "N,N-Dimethylmethanesulfonamide",
                "N,N-Diethylmethanesulfonamide",
                "N-Methylp-toluenesulfonamide",
                "N-Ethylp-toluenesulfonamide",
                "N-Phenylp-toluenesulfonamide",
                "N,N-Dimethylp-toluenesulfonamide",
                "N,N-Diethylp-toluenesulfonamide",
                "Mesylamide",
                "N-Methylmesylamide",
                "N-Ethylmesylamide",
                "N-Phenylmesylamide",
                "N,N-Dimethylmesylamide",
                "N,N-Diethylmesylamide"
            ],
            "true_referents": [
                "2-aminobenzenesulfonamide",
                "4-(2-AMINOETHYL)BENZENESULFONAMIDE",
                "4-amino-N-(4-ethoxyphenyl)benzenesulfonamide",
                "4-hydroxy-N,N-dimethylbenzenesulfonamide",
                "4-methyl-N-(phenylmethyl)benzenesulfonamide",
                "4-nitrosobenzenesulfonamide",
                "Benzenesulfonamide",
                "Methazolamide",
                "N,4-dimethyl-N-(4-methylphenyl)benzenesulfonamide",
                "N,4-dimethyl-N-nitrosobenzenesulfonamide",
                "N-(4-chlorophenyl)methanesulfonamide",
                "N-(4-phenylmethoxyphenyl)methanesulfonamide",
                "N-[4-(methanesulfonamido)phenyl]acetamide",
                "N-butylbenzenesulfonamide",
                "N1,N1-diethyl-4-methylbenzene-1-sulfonamide",
                "N1,N4-Diacetylsulfanilamide",
                "acetazolamide",
                "azosemide",
                "brinzolamide",
                "tolpyrramide"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "N-ethylsulfonamide (NESA)",
            "N-methylsulfonamide (NMSA)",
            "N-phenylsulfonamide (NPSA)",
            "N-benzenesulfonamide (NBSA)",
            "N-cyclohexylsulfonamide (NCHSA)",
            "N-isopropylsulfonamide (NIPSA)",
            "N-p-tolylsulfonamide (NPTSA)",
            "N-butylsulfonamide (NBS)",
            "N-hexylsulfonamide (NHS)",
            "N-dodecylsulfonamide (NDSA)",
            "N-ethyl-4-methylbenzenesulfonamide (NEMBSA)",
            "N-benzylsulfonamide (NBSA)",
            "N-(2-hydroxyethyl)sulfonamide (NHESA)",
            "N-(4-chlorophenyl)sulfonamide (N4CPSA)",
            "N-(2,6-dimethylphenyl)sulfonamide (N2,6DPSA)",
            "N-phenyl-2-pyridinesulfonamide (NPPYSA)",
            "N-(4-fluorophenyl)sulfonamide (N4FPSA)",
            "N-(3-methoxyphenyl)sulfonamide (N3MPSA)",
            "N-(4-nitrophenyl)sulfonamide (N4NPSA)",
            "N-(pyridin-3-yl)sulfonamide (NPSA3)",
            "N-(4-methylphenyl)sulfonamide (N4MPSA)",
            "N-(3-aminophenyl)sulfonamide (N3APSA)",
            "N-(1-naphthyl)sulfonamide (N1NSA)",
            "N-(2-thienyl)sulfonamide (N2TSA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "N-ethylsulfonamide (NESA)",
                "N-methylsulfonamide (NMSA)",
                "N-phenylsulfonamide (NPSA)",
                "N-benzenesulfonamide (NBSA)",
                "N-cyclohexylsulfonamide (NCHSA)",
                "N-isopropylsulfonamide (NIPSA)",
                "N-p-tolylsulfonamide (NPTSA)",
                "N-butylsulfonamide (NBS)",
                "N-hexylsulfonamide (NHS)",
                "N-dodecylsulfonamide (NDSA)",
                "N-ethyl-4-methylbenzenesulfonamide (NEMBSA)",
                "N-benzylsulfonamide (NBSA)",
                "N-(2-hydroxyethyl)sulfonamide (NHESA)",
                "N-(4-chlorophenyl)sulfonamide (N4CPSA)",
                "N-(2,6-dimethylphenyl)sulfonamide (N2,6DPSA)",
                "N-phenyl-2-pyridinesulfonamide (NPPYSA)",
                "N-(4-fluorophenyl)sulfonamide (N4FPSA)",
                "N-(3-methoxyphenyl)sulfonamide (N3MPSA)",
                "N-(4-nitrophenyl)sulfonamide (N4NPSA)",
                "N-(pyridin-3-yl)sulfonamide (NPSA3)",
                "N-(4-methylphenyl)sulfonamide (N4MPSA)",
                "N-(3-aminophenyl)sulfonamide (N3APSA)",
                "N-(1-naphthyl)sulfonamide (N1NSA)",
                "N-(2-thienyl)sulfonamide (N2TSA)"
            ],
            "true_referents": [
                "2,3,4-trimethyl-N-(3-pyridinyl)benzenesulfonamide",
                "2,4-Difluorobenzenesulfonamide",
                "2-[(4-fluorophenyl)sulfonyl-(2-pyridinyl)amino]-N-phenylacetamide",
                "2-aminobenzenesulfonamide",
                "2-oxoethane-1-sulfonamide",
                "4-(2-AMINOETHYL)BENZENESULFONAMIDE",
                "4-hydroxy-N,N-dimethylbenzenesulfonamide",
                "4-methyl-N-(phenylmethyl)benzenesulfonamide",
                "4-methyl-N-(pyridin-4-ylmethyl)benzenesulfonamide",
                "4-nitrosobenzenesulfonamide",
                "5-(dimethylamino)-N-(4-aminobenzyl)naphthalene-1-sulfonamide",
                "5-(dimethylamino)-N-(4-nitrosobenzyl)naphthalene-1-sulfonamide",
                "5-amino-1,3,4-thiadiazole-2-sulfonamide",
                "Benzenesulfonamide",
                "N,4-dimethyl-N-nitrosobenzenesulfonamide",
                "N-(2,5-dimethoxyphenyl)sulfonyl-N-(4-methoxyphenyl)cyclohexanecarboxamide",
                "N-(4-chlorophenyl)methanesulfonamide",
                "N-(4-methoxyphenyl)-2-(3-methylphenoxy)-N-(4-methylphenyl)sulfonylacetamide",
                "N-(4-phenylmethoxyphenyl)methanesulfonamide",
                "N-[3-(4-fluorophenoxy)phenyl]-4-[(2-hydroxybenzyl)amino]piperidine-1-sulfonamide",
                "N-[4-(methanesulfonamido)phenyl]acetamide",
                "N-benzyl-4-sulfamoylbenzamide",
                "N-butylbenzenesulfonamide",
                "N-chlorotoluene-p-sulfonamide",
                "N-cyclohexyl-N-ethyl-1,3-dimethyl-2,4-dioxo-5-pyrimidinesulfonamide",
                "N-ethylperfluorooctane sulfonamidoacetic acid",
                "N-sulfonyldiazepane",
                "N1,N1,4-trimethylbenzene-1-sulfonamide",
                "N1,N1-diethyl-4-methylbenzene-1-sulfonamide",
                "N1,N4-Diacetylsulfanilamide",
                "N1-(2-thienylmethyl)benzene-1-sulfonamide",
                "N1-(3-pyridyl)-2,3,4,5,6-pentamethylbenzene-1-sulfonamide",
                "N1-[4-(aminosulfonyl)phenyl]-2,2-dimethylpropanamide",
                "N1-piperidinocarbonyl-4-methylbenzene-1-sulfonamide",
                "N4-cyclohexyl-N1-ethyl-N4-(2-pyridinylmethyl)benzene-1,4-disulfonamide",
                "dapoxyl (2-aminoethyl)sulfonamide",
                "necrosulfonamide",
                "pyridinesulfonamide"
            ],
            "TP": 0,
            "FP": 24,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Tosylamide (TsNH2)",
            "Methanesulfonamide (MSA)",
            "Benzenesulfonamide",
            "Ethanesulfonamide",
            "Trifluoromethanesulfonamide (TfNH2)",
            "p-Toluenesulfonamide",
            "N-Methylbenzenesulfonamide",
            "N-Ethylbenzenesulfonamide",
            "N-Phenylmethanesulfonamide",
            "N-Butylbenzenesulfonamide",
            "N,N-Dimethylbenzenesulfonamide",
            "N,N-Diethylbenzenesulfonamide",
            "N-Methylmethanesulfonamide",
            "N-Ethylmethanesulfonamide",
            "N-Phenylethanesulfonamide",
            "N-Butylmethanesulfonamide",
            "N,N-Dimethylmethanesulfonamide",
            "N,N-Diethylmethanesulfonamide",
            "N-Methyltrifluoromethanesulfonamide",
            "N-Ethyltrifluoromethanesulfonamide",
            "N-Phenyltrifluoromethanesulfonamide",
            "N-Butyltrifluoromethanesulfonamide",
            "N,N-Dimethyltrifluoromethanesulfonamide",
            "N,N-Diethyltrifluoromethanesulfonamide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzenesulfonamide",
                "N-Butylbenzenesulfonamide"
            ],
            "mismatches": [
                "Tosylamide (TsNH2)",
                "Methanesulfonamide (MSA)",
                "Ethanesulfonamide",
                "Trifluoromethanesulfonamide (TfNH2)",
                "p-Toluenesulfonamide",
                "N-Methylbenzenesulfonamide",
                "N-Ethylbenzenesulfonamide",
                "N-Phenylmethanesulfonamide",
                "N,N-Dimethylbenzenesulfonamide",
                "N,N-Diethylbenzenesulfonamide",
                "N-Methylmethanesulfonamide",
                "N-Ethylmethanesulfonamide",
                "N-Phenylethanesulfonamide",
                "N-Butylmethanesulfonamide",
                "N,N-Dimethylmethanesulfonamide",
                "N,N-Diethylmethanesulfonamide",
                "N-Methyltrifluoromethanesulfonamide",
                "N-Ethyltrifluoromethanesulfonamide",
                "N-Phenyltrifluoromethanesulfonamide",
                "N-Butyltrifluoromethanesulfonamide",
                "N,N-Dimethyltrifluoromethanesulfonamide",
                "N,N-Diethyltrifluoromethanesulfonamide"
            ],
            "true_referents": [
                "2,4,6-trimethyl-N-[2-(trifluoromethyl)phenyl]benzenesulfonamide",
                "2,4,6-trimethyl-N-[3-(trifluoromethyl)phenyl]benzenesulfonamide",
                "2,4-Difluorobenzenesulfonamide",
                "2,6-difluorobenzenesulfonamide",
                "2-aminobenzenesulfonamide",
                "3,5-difluorobenzenesulfonamide",
                "4-(2-AMINOETHYL)BENZENESULFONAMIDE",
                "4-hydroxy-N,N-dimethylbenzenesulfonamide",
                "4-methyl-N-(phenylmethyl)benzenesulfonamide",
                "4-nitrosobenzenesulfonamide",
                "Benzenesulfonamide",
                "Methazolamide",
                "N,4-dimethyl-N-(4-methylphenyl)benzenesulfonamide",
                "N,4-dimethyl-N-nitrosobenzenesulfonamide",
                "N-(4-chlorophenyl)methanesulfonamide",
                "N-(4-phenylmethoxyphenyl)methanesulfonamide",
                "N-[4-(methanesulfonamido)phenyl]acetamide",
                "N-butylbenzenesulfonamide",
                "N-ethylperfluorooctane sulfonamidoacetic acid",
                "N-methylperfluorooctane sulfonamidoacetic acid",
                "N1,N1-diethyl-4-methylbenzene-1-sulfonamide",
                "N1,N4-Diacetylsulfanilamide",
                "piperidinesulfonamide",
                "pyridinesulfonamide",
                "tolpyrramide",
                "toluene-4-sulfonamide",
                "triflusulfuron-methyl"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "sulfonamide (R1SO2NR2R3)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "sulfonamide (R1SO2NR2R3)"
            ],
            "true_referents": [
                "2-oxoethane-1-sulfonamide",
                "N1,N1,4-trimethylbenzene-1-sulfonamide",
                "sulfonamide antibiotic"
            ],
            "TP": 0,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SA)",
            "Sulfadiazine (SDZ)",
            "Sulfamethoxazole (SMX)",
            "Sulfapyridine (SPY)",
            "Sulfisoxazole (SIZ)",
            "Sulfamethizole (SMZ)",
            "Sulfacetamide (SAC)",
            "Sulfadoxine (SDX)",
            "Sulfamethoxypyridazine (SMP)",
            "Sulfameturon",
            "Sulfameter",
            "Sulfametanilide",
            "Sulfamonomethoxine",
            "Sulfamethazine",
            "Sulfamethoxazole-trimethoprim (Co-trimoxazole)",
            "Sulfamethazine-dapsone",
            "Sulfamerazine",
            "Sulfatricamide",
            "Sulfamethoxypyridazine",
            "Sulfamonomethoxine",
            "Sulfaguanidine",
            "Sulfathiazole",
            "Sulfometuron methyl",
            "Sulfamethizole dapsone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SA)",
                "Sulfadiazine (SDZ)",
                "Sulfamethoxazole (SMX)",
                "Sulfapyridine (SPY)",
                "Sulfisoxazole (SIZ)",
                "Sulfamethizole (SMZ)",
                "Sulfacetamide (SAC)",
                "Sulfadoxine (SDX)",
                "Sulfamethoxypyridazine (SMP)",
                "Sulfamonomethoxine",
                "Sulfamethazine",
                "Sulfamerazine",
                "Sulfaguanidine",
                "Sulfathiazole",
                "Sulfometuron methyl"
            ],
            "mismatches": [
                "Sulfameturon",
                "Sulfameter",
                "Sulfametanilide",
                "Sulfamethoxazole-trimethoprim (Co-trimoxazole)",
                "Sulfamethazine-dapsone",
                "Sulfatricamide",
                "Sulfamethizole dapsone"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "Sulfamoyldapsone",
                "Sulfatolamide",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadicramide",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamethylthiazole",
                "sulfanilamide",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisoxazole",
                "sulfometuron",
                "sulfometuron methyl",
                "sulfonamide antibiotic"
            ],
            "TP": 15,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SA)",
            "Sulfadiazine (SDZ)",
            "Sulfamethoxazole (SMX)",
            "Sulfadimethoxine (SDM)",
            "Sulfadoxine (SDX)",
            "Sulfisoxazole (SIX)",
            "Sulfacetamide (SAM)",
            "Sulfathiazole (STZ)",
            "Sulfapyridine (SPY)",
            "Sulfasalazine (SSZ)",
            "Sulfamerazine (SMR)",
            "Sulfamethazine (SMZ)",
            "Sulfamethizole (SMT)",
            "Sulfaguanidine (SGN)",
            "Sulfamonomethoxine (SMM)",
            "Sulfachloropyridazine (SCP)",
            "Sulfaquinoxaline (SQX)",
            "Sulfadimidine (SDD)",
            "Sulfanitran (SNT)",
            "Sulfaphenazole (SPZ)",
            "Sulfabenzamide (SBZ)",
            "Sulfacarbamide (SCM)",
            "Sulfametopyrazine (SMP)",
            "Sulfamoxole (SMO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SA)",
                "Sulfadiazine (SDZ)",
                "Sulfamethoxazole (SMX)",
                "Sulfadimethoxine (SDM)",
                "Sulfadoxine (SDX)",
                "Sulfisoxazole (SIX)",
                "Sulfacetamide (SAM)",
                "Sulfathiazole (STZ)",
                "Sulfapyridine (SPY)",
                "Sulfasalazine (SSZ)",
                "Sulfamerazine (SMR)",
                "Sulfamethazine (SMZ)",
                "Sulfamethizole (SMT)",
                "Sulfaguanidine (SGN)",
                "Sulfamonomethoxine (SMM)",
                "Sulfachloropyridazine (SCP)",
                "Sulfaphenazole (SPZ)",
                "Sulfabenzamide (SBZ)",
                "Sulfacarbamide (SCM)",
                "Sulfamoxole (SMO)"
            ],
            "mismatches": [
                "Sulfaquinoxaline (SQX)",
                "Sulfadimidine (SDD)",
                "Sulfanitran (SNT)",
                "Sulfametopyrazine (SMP)"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "sulfabenzamide",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfadiasulfone",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethopyrazine",
                "sulfamethoxazole",
                "sulfamethylthiazole",
                "sulfamoxole",
                "sulfamoylbenzoate",
                "sulfanilamide",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisoxazole",
                "sulfonamide antibiotic"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide",
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine",
            "Sulfisoxazole",
            "Sulfamethizole",
            "Sulfadimethoxine",
            "Sulfapyridine",
            "Sulfamerazine",
            "Sulfamethazine",
            "Sulfathiazole",
            "Sulfaguanidine",
            "Sulfacetamide",
            "Sulfabenzamide",
            "Sulfachlorpyridazine",
            "Sulfadoxine",
            "Sulfamonomethoxine",
            "Sulfamethoxypyridazine",
            "Sulfaquinoxaline",
            "Sulfatroxazole",
            "Sulfametopyrazine",
            "Sulfaphenazole",
            "Sulfaethidole",
            "Sulfamoxole",
            "Sulfadimidine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide",
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfisoxazole",
                "Sulfamethizole",
                "Sulfadimethoxine",
                "Sulfapyridine",
                "Sulfamerazine",
                "Sulfamethazine",
                "Sulfathiazole",
                "Sulfaguanidine",
                "Sulfacetamide",
                "Sulfabenzamide",
                "Sulfadoxine",
                "Sulfamonomethoxine",
                "Sulfamethoxypyridazine",
                "Sulfamoxole",
                "Sulfaphenazole"
            ],
            "mismatches": [
                "Sulfachlorpyridazine",
                "Sulfaquinoxaline",
                "Sulfatroxazole",
                "Sulfametopyrazine",
                "Sulfaethidole",
                "Sulfadimidine"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "sulfabenzamide",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethopyrazine",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamoxole",
                "sulfanilamide",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Methanesulfonamide (CH3SO2NH2)",
            "Ethanesulfonamide (CH3CH2SO2NH2)",
            "Benzenesulfonamide (C6H5SO2NH2)",
            "Toluenesulfonamide (CH3C6H4SO2NH2)",
            "Naphthalenesulfonamide (C10H7SO2NH2)",
            "Trifluoromethanesulfonamide (CF3SO2NH2)",
            "N,N-Dimethylmethanesulfonamide ((CH3)2NSO2CH3)",
            "N,N-Diethylmethanesulfonamide ((C2H5)2NSO2CH3)",
            "N-Methylbenzenesulfonamide (CH3NHC6H4SO2CH3)",
            "N-Ethylbenzenesulfonamide (C2H5NHC6H4SO2CH3)",
            "N,N-Dimethylbenzenesulfonamide ((CH3)2NC6H4SO2CH3)",
            "N,N-Diethylbenzenesulfonamide ((C2H5)2NC6H4SO2CH3)",
            "4-Methylbenzenesulfonamide (CH3C6H4SO2NH2)",
            "2-Naphthalenesulfonamide (C10H7SO2NH2)",
            "1,5-Naphthalenedisulfonamide (C10H6(SO2NH2)2)",
            "4-Chlorobenzenesulfonamide (ClC6H4SO2NH2)",
            "4-Nitrobenzenesulfonamide (O2NC6H4SO2NH2)",
            "4-Aminobenzenesulfonamide (H2NC6H4SO2NH2)",
            "4-Methoxybenzenesulfonamide (CH3OC6H4SO2NH2)",
            "2,4,6-Trimethylbenzenesulfonamide ((CH3)3C6H2SO2NH2)",
            "2,4,6-Triisopropylbenzenesulfonamide ((CH3)2CHC6H2SO2NH2)3",
            "Camphorsulfonamide (C10H16SO2NH2)",
            "Saccharinsulfonamide (C7H5NO3S)SO2NH2"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Benzenesulfonamide",
                "4-Chlorobenzenesulfonamide"
            ],
            "mismatches": [
                "Methanesulfonamide (CH3SO2NH2)",
                "Ethanesulfonamide (CH3CH2SO2NH2)",
                "Toluenesulfonamide (CH3C6H4SO2NH2)",
                "Naphthalenesulfonamide (C10H7SO2NH2)",
                "Trifluoromethanesulfonamide (CF3SO2NH2)",
                "N,N-Dimethylmethanesulfonamide ((CH3)2NSO2CH3)",
                "N,N-Diethylmethanesulfonamide ((C2H5)2NSO2CH3)",
                "N-Methylbenzenesulfonamide (CH3NHC6H4SO2CH3)",
                "N-Ethylbenzenesulfonamide (C2H5NHC6H4SO2CH3)",
                "N,N-Dimethylbenzenesulfonamide ((CH3)2NC6H4SO2CH3)",
                "N,N-Diethylbenzenesulfonamide ((C2H5)2NC6H4SO2CH3)",
                "4-Methylbenzenesulfonamide (CH3C6H4SO2NH2)",
                "2-Naphthalenesulfonamide (C10H7SO2NH2)",
                "1,5-Naphthalenedisulfonamide (C10H6(SO2NH2)2)",
                "4-Nitrobenzenesulfonamide (O2NC6H4SO2NH2)",
                "4-Aminobenzenesulfonamide (H2NC6H4SO2NH2)",
                "4-Methoxybenzenesulfonamide (CH3OC6H4SO2NH2)",
                "2,4,6-Trimethylbenzenesulfonamide ((CH3)3C6H2SO2NH2)",
                "2,4,6-Triisopropylbenzenesulfonamide ((CH3)2CHC6H2SO2NH2)3",
                "Camphorsulfonamide (C10H16SO2NH2)",
                "Saccharinsulfonamide (C7H5NO3S)SO2NH2"
            ],
            "true_referents": [
                "(R)-1-amino-1-[5-(dimethylamino)-1,3,4-thiadiazol-2-yl]methanesulfonamide",
                "2,4,6-trimethyl-N-[2-(trifluoromethyl)phenyl]benzenesulfonamide",
                "2,4,6-trimethyl-N-[3-(trifluoromethyl)phenyl]benzenesulfonamide",
                "2-(methanesulfonamido)-N-[2-(phenylmethylthio)ethyl]benzamide",
                "2-aminobenzenesulfonamide",
                "3,4-Dichlorobenzenesulfonamide",
                "3,5-difluorobenzenesulfonamide",
                "3-nitro-N-(pyridin-4-ylmethyl)benzenesulfonamide",
                "4-(2-AMINOETHYL)BENZENESULFONAMIDE",
                "4-[2-[(5-chloro-2-phenylmethoxyphenyl)methylamino]ethyl]benzenesulfonamide",
                "4-[butyl(methyl)sulfamoyl]-N-[5-[(methylthio)methyl]-1,3,4-oxadiazol-2-yl]benzamide",
                "4-amino-N-(4-ethoxyphenyl)benzenesulfonamide",
                "4-chlorobenzenesulfonamide",
                "4-hydroxy-N,N-dimethylbenzenesulfonamide",
                "4-methyl-N-(5,6,7,8-tetrahydronaphthalen-1-yl)benzenesulfonamide",
                "4-methyl-N-(phenylmethyl)benzenesulfonamide",
                "4-nitrosobenzenesulfonamide",
                "5-(benzenesulfonyl)-N-[2-(3,4-dimethoxyphenyl)ethyl]-2-ethylbenzenesulfonamide",
                "5-(dimethylamino)-N-(4-aminobenzyl)naphthalene-1-sulfonamide",
                "5-(dimethylamino)-N-[4-(hydroxyamino)benzyl]naphthalene-1-sulfonamide",
                "Benzenesulfonamide",
                "N,4-dimethyl-N-(4-methylphenyl)benzenesulfonamide",
                "N,4-dimethyl-N-nitrosobenzenesulfonamide",
                "N-(2-ethylphenyl)-2-methoxy-5-methylbenzenesulfonamide",
                "N-(4-phenylmethoxyphenyl)methanesulfonamide",
                "N-[3-(4-methyl-1-piperidinyl)-1,4-dioxo-2-naphthalenyl]benzenesulfonamide",
                "N-[4-(methanesulfonamido)phenyl]acetamide",
                "N-cyclooctyl-4-methylbenzenesulfonamide",
                "N1,N1,4-trimethylbenzene-1-sulfonamide",
                "N1-[4-(aminosulfonyl)phenyl]-2,2-dimethylpropanamide"
            ],
            "TP": 2,
            "FP": 21,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Saccharin (SAC)",
            "Sulfonamide (SUL)",
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine (SDZ)",
            "Sulfapyridine (SPY)",
            "Sulfadimethoxine (SDM)",
            "Sulfamethazine (SMZ)",
            "Sulfachloropyridazine (SCP)",
            "Sulfamonomethoxine (SMM)",
            "Sulfaquinoxaline (SQX)",
            "Sulfadoxine (SDX)",
            "Sulfamerazine (SMR)",
            "Sulfamethizole (SMT)",
            "Sulfisoxazole (SIX)",
            "Sulfaphenazole (SPZ)",
            "Sulfametoxydiazine (SMD)",
            "Sulfamethoxydiazine (SMX)",
            "Sulfamethoxypyridazine (SMP)",
            "Sulfacetamide (SCT)",
            "Sulfamethoxazole-Trimethoprim (SMX-TMP)",
            "Sulfadoxine-Pyrimethamine (SDX-PYR)",
            "Sulfamethoxazole-Trimethoprim-Folic Acid (SMX-TMP-FOL)",
            "Sulfamethoxazole-Trimethoprim-Leucovorin (SMX-TMP-LEU)",
            "Sulfamethoxazole-Trimethoprim-Folinic Acid (SMX-TMP-FOA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfapyridine",
                "Sulfadimethoxine",
                "Sulfamethazine",
                "Sulfachloropyridazine",
                "Sulfamonomethoxine",
                "Sulfadoxine",
                "Sulfamerazine",
                "Sulfamethizole",
                "Sulfisoxazole",
                "Sulfaphenazole",
                "Sulfamethoxydiazine",
                "Sulfamethoxypyridazine",
                "Sulfacetamide"
            ],
            "mismatches": [
                "Saccharin (SAC)",
                "Sulfonamide (SUL)",
                "Sulfaquinoxaline (SQX)",
                "Sulfametoxydiazine (SMD)",
                "Sulfamethoxazole-Trimethoprim (SMX-TMP)",
                "Sulfadoxine-Pyrimethamine (SDX-PYR)",
                "Sulfamethoxazole-Trimethoprim-Folic Acid (SMX-TMP-FOL)",
                "Sulfamethoxazole-Trimethoprim-Leucovorin (SMX-TMP-LEU)",
                "Sulfamethoxazole-Trimethoprim-Folinic Acid (SMX-TMP-FOA)"
            ],
            "true_referents": [
                "1-(4-ethyl-2-pyridinyl)-3-(4-methylphenyl)sulfonylurea",
                "N-sulfonylurea",
                "Sulfamonomethoxine",
                "glymidine",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxydiazine",
                "sulfamethoxypyridazine",
                "sulfamethylthiazole",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfisoxazole",
                "sulfonamide antibiotic",
                "toluene-4-sulfonamide"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": "[\n  \"Sulfonamide (sulfanilamide)\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole\", \n  \"Sulfadoxine\", \n  \"Sulfamerazine\", \n  \"Sulfamethazine\", \n  \"Sulfadiazine\", \n  \"Sulfamethizole\", \n  \"Sulfacetamide\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfonamidochrysoidine\", \n  \"Sulfanilamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfonamide\", \n  \"Sulfapyridine\", \n  \"Sulfamethoxazole-trimethoprim\", \n  \"Sulfadoxine-pyrimethamine\", \n  \"Sulfamethoxazole-trimethopprim",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SLF)",
            "Sulfadiazine (SDZ)",
            "Sulfathiazole (STZ)",
            "Sulfapyridine (SPY)",
            "Sulfamethoxazole (SMZ)",
            "Sulfisoxazole (SXZ)",
            "Sulfachloropyridazine (SCP)",
            "Sulfadimethoxine (SDM)",
            "Sulfalene (SFL)",
            "Sulfamerazine (SMR)",
            "Sulfamethazine (SMT)",
            "Sulfamoxole (SMX)",
            "Sulfabenzamide (SBN)",
            "Sulfacetamide (SCT)",
            "Sulfachloridine (SCD)",
            "Sulfadimidine (SDI)",
            "Sulfaphenazole (SPZ)",
            "Sulfamonomethoxine (SMM)",
            "Sulfamethomidine (SMTD)",
            "Sulfaperin (SPR)",
            "Sulfaphridine (SPHD)",
            "Sulfatolamide (STL)",
            "Sulfanitran (SNT)",
            "Sulfathalidine (STD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SLF)",
                "Sulfadiazine (SDZ)",
                "Sulfathiazole (STZ)",
                "Sulfapyridine (SPY)",
                "Sulfamethoxazole (SMZ)",
                "Sulfisoxazole (SXZ)",
                "Sulfachloropyridazine (SCP)",
                "Sulfadimethoxine (SDM)",
                "Sulfamerazine (SMR)",
                "Sulfamethazine (SMT)",
                "Sulfamoxole (SMX)",
                "Sulfabenzamide (SBN)",
                "Sulfacetamide (SCT)",
                "Sulfaphenazole (SPZ)",
                "Sulfamonomethoxine (SMM)",
                "Sulfaperin (SPR)",
                "Sulfatolamide (STL)"
            ],
            "mismatches": [
                "Sulfalene (SFL)",
                "Sulfachloridine (SCD)",
                "Sulfadimidine (SDI)",
                "Sulfamethomidine (SMTD)",
                "Sulfaphridine (SPHD)",
                "Sulfanitran (SNT)",
                "Sulfathalidine (STD)"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "N-benzyl-4-sulfamoylbenzamide",
                "Sulfamonomethoxine",
                "Sulfatolamide",
                "sulfabenzamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethylthiazole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfaperin",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            },
            {
                "Referent": "acetamide",
                "Canonical name": "acetamide"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [],
            "mismatches": [
                "acetamide"
            ],
            "true_referents": [
                "(S)-(-)-sulpiride",
                "(S)-metazosulfuron",
                "carbutamide"
            ],
            "TP": 0,
            "FP": 1,
            "FN": 0
        }
    }
]