[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfadiazine (SDZ)",
            "Sulfamethoxazole (SMX)",
            "Sulfisoxazole",
            "Sulfadoxine",
            "Sulfacetamide",
            "Sulfamonomethoxine",
            "Sulfanilamide",
            "Sulfapyridine",
            "Sulfasalazine",
            "Sulfadimethoxine",
            "Sulfamethazine",
            "Sulfamerazine",
            "Sulfisomidine",
            "Sulfamethizole",
            "Sulfamethoxypyridazine",
            "Sulfamethoxydiazine",
            "Sulfamethoxazole-trimethoprim",
            "Sulfadimidine",
            "Sulfaguanidine",
            "Sulfamerazine-trimethoprim",
            "Sulfadoxine-pyrimethamine",
            "Sulfanilic acid",
            "Sulfachloropyridazine",
            "Sulfamerazine-dihydrostreptomycin"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfadiazine (SDZ)",
                "Sulfamethoxazole (SMX)",
                "Sulfisoxazole",
                "Sulfadoxine",
                "Sulfacetamide",
                "Sulfamonomethoxine",
                "Sulfanilamide",
                "Sulfapyridine",
                "Sulfasalazine",
                "Sulfadimethoxine",
                "Sulfamethazine",
                "Sulfamerazine",
                "Sulfisomidine",
                "Sulfamethizole",
                "Sulfamethoxypyridazine",
                "Sulfamethoxydiazine",
                "Sulfaguanidine",
                "Sulfachloropyridazine"
            ],
            "mismatches": [
                "Sulfamethoxazole-trimethoprim",
                "Sulfadimidine",
                "Sulfamerazine-trimethoprim",
                "Sulfadoxine-pyrimethamine",
                "Sulfanilic acid",
                "Sulfamerazine-dihydrostreptomycin"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxydiazine",
                "sulfamethoxypyridazine",
                "sulfamoxole",
                "sulfanilamide",
                "sulfapyridine",
                "sulfasalazine",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine (SDZ)",
            "Sulfisoxazole (SUL)",
            "Sulfapyridine (SPY)",
            "Sulfamethizole (STM)",
            "Sulfadimidine (SDM)",
            "Sulfamerazine (SMZ)",
            "Sulfadoxine (SDD)",
            "Sulfachloropyridazine (SCP)",
            "Sulfadimethoxine (SDM)",
            "Sulfacetamide (SCM)",
            "Sulfadimethoxine (SDM)",
            "Sulfamethazine (SMZ)",
            "Sulfamethoxypyridazine (SMP)",
            "Sulfamethoxypyridazine (SMP)",
            "Sulfathiazole (STZ)",
            "Sulfisoxazole (SUL)",
            "Sulfamonomethoxine (SMM)",
            "Sulfadiazine Silver (SDZ)",
            "Sulfamethoxypyrazine (SMP)",
            "Sulfamethoxypyridazine (SMP)",
            "Sulfadoxine-Pyrimethamine (SP)",
            "Sulfisoxazole Acetyl (SUL-Ac)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole (SMX)",
                "Sulfadiazine (SDZ)",
                "Sulfisoxazole (SUL)",
                "Sulfapyridine (SPY)",
                "Sulfamethizole (STM)",
                "Sulfamerazine (SMZ)",
                "Sulfadoxine (SDD)",
                "Sulfachloropyridazine (SCP)",
                "Sulfadimethoxine (SDM)",
                "Sulfacetamide (SCM)",
                "Sulfamethazine (SMZ)",
                "Sulfamethoxypyridazine (SMP)",
                "Sulfathiazole (STZ)",
                "Sulfisoxazole Acetyl (SUL-Ac)",
                "Sulfamonomethoxine (SMM)"
            ],
            "mismatches": [
                "Sulfadimidine (SDM)",
                "Sulfadiazine Silver (SDZ)",
                "Sulfamethoxypyrazine (SMP)",
                "Sulfadoxine-Pyrimethamine (SP)"
            ],
            "true_referents": [
                "N-sulfonylpiperazine",
                "Sulfamonomethoxine",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamethylthiazole",
                "sulfametrole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole",
                "sulfisoxazole acetyl"
            ],
            "TP": 15,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (Sulfonamide)",
            "Sulfamethoxazole (SMZ)",
            "Sulfadiazine (SD)",
            "Sulfapyridine (SP)",
            "Sulfadimethoxine (SDM)",
            "Sulfadimidine (SDM)",
            "Sulfamethazine (SMZ)",
            "Sulfamonomethoxine (SMM)",
            "Sulfathiazole (ST)",
            "Sulfacetamide (SA)",
            "Sulfadoxine (SDX)",
            "Sulfasalazine (SSZ)",
            "Sulfisoxazole (SIX)",
            "Sulfamethizole (SMT)",
            "Sulfametopyrazine (SMP)",
            "Sulfaphenazole (SPZ)",
            "Sulfamerazine (SMR)",
            "Sulfaguanidine (SG)",
            "Sulfanilamide (SFA)",
            "Sulfabenzamide (SBZ)",
            "Sulfapyrimidine (SPY)",
            "Sulfametoxazole (SMX)",
            "Sulfathalidine (STH)",
            "Sulfadimethoxine (SDM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (Sulfonamide)",
                "Sulfamethoxazole (SMZ)",
                "Sulfadiazine (SD)",
                "Sulfapyridine (SP)",
                "Sulfadimethoxine (SDM)",
                "Sulfamonomethoxine (SMM)",
                "Sulfathiazole (ST)",
                "Sulfacetamide (SA)",
                "Sulfadoxine (SDX)",
                "Sulfasalazine (SSZ)",
                "Sulfisoxazole (SIX)",
                "Sulfamethizole (SMT)",
                "Sulfaphenazole (SPZ)",
                "Sulfamerazine (SMR)",
                "Sulfaguanidine (SG)",
                "Sulfabenzamide (SBZ)"
            ],
            "mismatches": [
                "Sulfadimidine (SDM)",
                "Sulfametopyrazine (SMP)",
                "Sulfanilamide (SFA)",
                "Sulfapyrimidine (SPY)",
                "Sulfametoxazole (SMX)",
                "Sulfathalidine (STH)"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "sulfabenzamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethopyrazine",
                "sulfamethoxazole",
                "sulfamethylthiazole",
                "sulfametrole",
                "sulfamoylbenzoate",
                "sulfanilamide",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole",
                "sulfonamide antibiotic"
            ],
            "TP": 16,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SUL)",
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine (SDZ)",
            "Sulfisoxazole (SXI)",
            "Sulfasalazine (SAS)",
            "Sulfapyridine (SPY)",
            "Sulfathiazole (STZ)",
            "Sulfacetamide (SAC)",
            "Sulfadoxine (SDO)",
            "Sulfamerazine (SMR)",
            "Sulfadimidine (SDD)",
            "Celecoxib (CXB)",
            "Meloxicam (MLX)",
            "Valdecoxib (VDC)",
            "Parecoxib (PXC)",
            "Furosemide (FRS)",
            "Hydrochlorothiazide (HCT)",
            "Bumetanide (BUM)",
            "Torsemide (TOR)",
            "Acetazolamide (ACT)",
            "Dorzolamide (DOR)",
            "Brinzolamide (BRZ)",
            "Methazolamide (MZA)",
            "Sultam (STM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SUL)",
                "Sulfamethoxazole (SMX)",
                "Sulfadiazine (SDZ)",
                "Sulfisoxazole (SXI)",
                "Sulfasalazine (SAS)",
                "Sulfapyridine (SPY)",
                "Sulfathiazole (STZ)",
                "Sulfacetamide (SAC)",
                "Sulfadoxine (SDO)",
                "Sulfamerazine (SMR)",
                "Celecoxib (CXB)",
                "Valdecoxib (VDC)",
                "Parecoxib (PXC)",
                "Furosemide (FRS)",
                "Hydrochlorothiazide (HCT)",
                "Bumetanide (BUM)",
                "Acetazolamide (ACT)",
                "Dorzolamide (DOR)",
                "Brinzolamide (BRZ)",
                "Methazolamide (MZA)",
                "Sultam (STM)"
            ],
            "mismatches": [
                "Sulfadimidine (SDD)",
                "Meloxicam (MLX)",
                "Torsemide (TOR)"
            ],
            "true_referents": [
                "(S)-bendroflumethiazide",
                "4-sulfanilamidobenzoic acid",
                "Benzylhydrochlorothiazide",
                "Methazolamide",
                "N-(4-Aminobenzenesulfonyl) Sulfamethoxazole",
                "acetazolamide",
                "azosemide",
                "brinzolamide",
                "bumetanide",
                "butazolamide",
                "celecoxib",
                "cimicoxib",
                "deracoxib",
                "diclofenamide",
                "dorzolamide",
                "ethoxzolamide",
                "flusulfamide",
                "furosemide",
                "glisolamide",
                "hydrochlorothiazide",
                "mavacoxib",
                "parecoxib",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiasulfone",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfamerazine",
                "sulfamethoxazole",
                "sulfamethylthiazole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisoxazole",
                "sultam",
                "torasemide",
                "torasemide carboxylic acid",
                "trichlormethiazide",
                "valdecoxib"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine",
            "Sulfisoxazole",
            "Sulfacetamide",
            "Sulfapyridine",
            "Sulfathiazole",
            "Sulfadoxine",
            "Sulfamethazine",
            "Sulfamerazine",
            "Sulfamethizole",
            "Sulfabenzamide",
            "Sulfaguanidine",
            "Sulfameter",
            "Sulfamoxole",
            "Sulfaphenazole",
            "Sulfaproxyline",
            "Sulfachlorpyridazine",
            "Sulfaquinoxaline",
            "Sulfadimethoxine",
            "Sulfasalazine",
            "Sulfamonomethoxine",
            "Sulfadimidine",
            "Sulfamethoxypyridazine",
            "Sulfametomidine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfisoxazole",
                "Sulfacetamide",
                "Sulfapyridine",
                "Sulfathiazole",
                "Sulfadoxine",
                "Sulfamethazine",
                "Sulfamerazine",
                "Sulfamethizole",
                "Sulfabenzamide",
                "Sulfaguanidine",
                "Sulfamoxole",
                "Sulfaphenazole",
                "Sulfadimethoxine",
                "Sulfasalazine",
                "Sulfamonomethoxine",
                "Sulfamethoxypyridazine"
            ],
            "mismatches": [
                "Sulfameter",
                "Sulfaproxyline",
                "Sulfachlorpyridazine",
                "Sulfaquinoxaline",
                "Sulfadimidine",
                "Sulfametomidine"
            ],
            "true_referents": [
                "Sulfamonomethoxine",
                "sulfabenzamide",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamoxole",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine (SD)",
            "Sulfisoxazole (SSZ)",
            "Sulfamethizole (Sulfamethizole)",
            "Sulfapyridine (SP)",
            "Sulfacetamide (Sulfacetamide sodium)",
            "Sulfamethoxazole/Trimethoprim (TMP/SMX)",
            "Sulfadimethoxine (SDM)",
            "Sulfamethazine (Sulfamethazine)",
            "Sulfaguanidine (SG)",
            "Sulfamethoxazole/Trimethoprim DS (TMP/SMX DS)",
            "Sulfadiazine silver (Silvadene)",
            "Sulfamethoxazole/Trimethoprim oral suspension (TMP/SMX oral suspension)",
            "Sulfathiazole (STZ)",
            "Sulfameter (Sulfameter)",
            "Sulfamethoxazole topical (Sulfamethoxazole topical)",
            "Sulfamethazine sodium (Sulfamethazine sodium)",
            "Sulfadimidine (Sulfadimidine)",
            "Sulfamethoxazole/Trimethoprim pediatric formulation (TMP/SMX pediatric)",
            "Sulfamethoxazole/Trimethoprim IV (TMP/SMX IV)",
            "Sulfamethoxazole/Trimethoprim prophylactic use (TMP/SMX prophylactic)",
            "Sulfamethoxazole/Trimethoprim for urinary tract infection (TMP/SMX UTI)",
            "Sulfamethoxazole/Trimethoprim for respiratory infections (TMP/SMX respiratory)",
            "Sulfamethoxazole/Trimethoprim for skin infections (TMP/SMX skin)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfisoxazole",
                "Sulfamethizole",
                "Sulfapyridine",
                "Sulfacetamide",
                "Sulfadimethoxine",
                "Sulfamethazine",
                "Sulfaguanidine",
                "Sulfathiazole"
            ],
            "mismatches": [
                "Sulfamethoxazole/Trimethoprim (TMP/SMX)",
                "Sulfadiazine silver (Silvadene)",
                "Sulfameter (Sulfameter)",
                "Sulfamethoxazole topical (Sulfamethoxazole topical)",
                "Sulfamethazine sodium (Sulfamethazine sodium)",
                "Sulfadimidine (Sulfadimidine)",
                "Sulfamethoxazole/Trimethoprim pediatric formulation (TMP/SMX pediatric)",
                "Sulfamethoxazole/Trimethoprim IV (TMP/SMX IV)",
                "Sulfamethoxazole/Trimethoprim prophylactic use (TMP/SMX prophylactic)",
                "Sulfamethoxazole/Trimethoprim for urinary tract infection (TMP/SMX UTI)",
                "Sulfamethoxazole/Trimethoprim for respiratory infections (TMP/SMX respiratory)",
                "Sulfamethoxazole/Trimethoprim for skin infections (TMP/SMX skin)"
            ],
            "true_referents": [
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfametrole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisoxazole"
            ],
            "TP": 10,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine",
            "Sulfapyridine",
            "Sulfisoxazole",
            "Sulfacetamide",
            "Sulfathiazole",
            "Sulfadoxine",
            "Sulfamethizole",
            "Sulfamethazine",
            "Sulfasalazine",
            "Sulfaguanidine",
            "Sulfaphenazole",
            "Sulfapyrazine",
            "Sulfadimethoxine",
            "Sulfamonomethoxine",
            "Sulfamoxole",
            "Sulfabenzamide",
            "Sulfabromomethazine",
            "Sulfacarbamide",
            "Sulfadimidine",
            "Sulfanilamide",
            "Mafenide",
            "Trimethoprim-sulfamethoxazole (TMP-SMX)",
            "Sulfisomidine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfapyridine",
                "Sulfisoxazole",
                "Sulfacetamide",
                "Sulfathiazole",
                "Sulfadoxine",
                "Sulfamethizole",
                "Sulfamethazine",
                "Sulfasalazine",
                "Sulfaguanidine",
                "Sulfaphenazole",
                "Sulfadimethoxine",
                "Sulfamonomethoxine",
                "Sulfamoxole",
                "Sulfabenzamide",
                "Sulfabromomethazine",
                "Sulfacarbamide",
                "Sulfanilamide",
                "Sulfisomidine"
            ],
            "mismatches": [
                "Sulfapyrazine",
                "Sulfadimidine",
                "Mafenide",
                "Trimethoprim-sulfamethoxazole (TMP-SMX)"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Mefluidide",
                "Sulfamonomethoxine",
                "ambuside",
                "dofetilide",
                "sulfabenzamide",
                "sulfabromomethazine",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfachlorpyrazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": "",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine (SDZ)",
            "Sulfapyridine",
            "Sulfasalazine (SASP)",
            "Sulfadoxine",
            "Sulfamethizole",
            "Sulfacetamide",
            "Sulfameter",
            "Sulfathiazole",
            "Sulfamerazine",
            "Sulfanilamide",
            "Sulfamonomethoxine",
            "Sulfamethazine",
            "Sulfametrole",
            "Sulfamethoxypyridazine",
            "Sulfadoxine-pyrimethamine",
            "Sulfamethoxazole-trimethoprim (Co-Trimoxazole)",
            "Sulfamethizole Sodium",
            "Sulfamethoxazole N-Acetylcysteine",
            "Sulfamethizol",
            "Sulfapyridine Sodium",
            "Sulfametingen",
            "Sulfameridine",
            "Sulfamethonazole"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfamethoxazole (SMX)",
                "Sulfadiazine (SDZ)",
                "Sulfapyridine",
                "Sulfasalazine (SASP)",
                "Sulfadoxine",
                "Sulfamethizole",
                "Sulfacetamide",
                "Sulfathiazole",
                "Sulfamerazine",
                "Sulfanilamide",
                "Sulfamonomethoxine",
                "Sulfamethazine",
                "Sulfametrole",
                "Sulfamethoxypyridazine"
            ],
            "mismatches": [
                "Sulfameter",
                "Sulfadoxine-pyrimethamine",
                "Sulfamethoxazole-trimethoprim (Co-Trimoxazole)",
                "Sulfamethizole Sodium",
                "Sulfamethoxazole N-Acetylcysteine",
                "Sulfamethizol",
                "Sulfapyridine Sodium",
                "Sulfametingen",
                "Sulfameridine",
                "Sulfamethonazole"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "N-acetylsulfamethoxazole",
                "Sulfamonomethoxine",
                "Sulfapyridine sodium",
                "Sulfathiazole sodium",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamethylthiazole",
                "sulfametrole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfometuron",
                "sulfometuron methyl"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SA)",
            "Sulfamethoxazole (SMX)",
            "Sulfadiazine (SDZ)",
            "Sulfadimethoxine (SDM)",
            "Sulfadoxine (SDX)",
            "Sulfamerazine (SMR)",
            "Sulfamethazine (SMZ)",
            "Sulfapyridine (SPY)",
            "Sulfacetamide (SAM)",
            "Sulfasalazine (SSZ)",
            "Sulfisoxazole (SIX)",
            "Sulfathiazole (STZ)",
            "Sulfamethizole (SMT)",
            "Sulfaphenazole (SPZ)",
            "Sulfaguanidine (SGN)",
            "Sulfachloropyridazine (SCP)",
            "Sulfadimidine (SDD)",
            "Sulfaquinoxaline (SQX)",
            "Sulfachrysoidine (SCH)",
            "Sulfamonomethoxine (SMM)",
            "Sulfanitran (SNT)",
            "Sulfaperin (SPE)",
            "Sulfametopyrazine (SMP)",
            "Sulfaclozine (SCZ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide",
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfadimethoxine",
                "Sulfadoxine",
                "Sulfamerazine",
                "Sulfamethazine",
                "Sulfapyridine",
                "Sulfacetamide",
                "Sulfasalazine",
                "Sulfisoxazole",
                "Sulfathiazole",
                "Sulfamethizole",
                "Sulfaphenazole",
                "Sulfaguanidine",
                "Sulfachloropyridazine",
                "Sulfamonomethoxine",
                "Sulfaperin"
            ],
            "mismatches": [
                "Sulfadimidine",
                "Sulfaquinoxaline",
                "Sulfachrysoidine",
                "Sulfanitran",
                "Sulfametopyrazine",
                "Sulfaclozine"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "N(4)-acetylsulfadimethoxine",
                "Sulfamonomethoxine",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfadiasulfone",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethopyrazine",
                "sulfamethoxazole",
                "sulfamethylthiazole",
                "sulfanilamide",
                "sulfaperin",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisoxazole"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide",
            "Sulfadiazine",
            "Sulfisoxazole",
            "Sulfamethoxazole (SMX)",
            "Sulfacetamide",
            "Mafenide",
            "Sulfasalazine",
            "Furosemide",
            "Bumetanide",
            "Celecoxib",
            "Acetazolamide",
            "Sumatriptan",
            "Probenecid",
            "Dapsone",
            "Zonisamide",
            "Dorzolamide",
            "Chlorothiazide",
            "Hydrochlorothiazide (HCTZ)",
            "Indapamide",
            "Metolazone",
            "Chlorthalidone",
            "Torsemide",
            "Ethoxzolamide",
            "Methazolamide"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide",
                "Sulfadiazine",
                "Sulfisoxazole",
                "Sulfacetamide",
                "Sulfasalazine",
                "Furosemide",
                "Bumetanide",
                "Celecoxib",
                "Acetazolamide",
                "Sumatriptan",
                "Probenecid",
                "Zonisamide",
                "Dorzolamide",
                "Hydrochlorothiazide",
                "Indapamide",
                "Metolazone",
                "Chlorthalidone",
                "Ethoxzolamide",
                "Methazolamide"
            ],
            "mismatches": [
                "Sulfamethoxazole (SMX)",
                "Mafenide",
                "Dapsone",
                "Chlorothiazide",
                "Torsemide"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "5-hydroxyindapamide",
                "Benzylhydrochlorothiazide",
                "Mefluidide",
                "Methazolamide",
                "Sulfamoyldapsone",
                "acetazolamide",
                "almotriptan",
                "ambuside",
                "brinzolamide",
                "bumetanide",
                "butazolamide",
                "celecoxib",
                "chlorpropamide",
                "chlorthalidone",
                "dehydroindapamide",
                "diclofenamide",
                "dofetilide",
                "dorzolamide",
                "etebenecid",
                "ethoxzolamide",
                "furosemide",
                "glisolamide",
                "hydrochlorothiazide",
                "hydroxy torasemide",
                "indapamide",
                "metipamide",
                "metolazone",
                "parecoxib",
                "phenbutamide",
                "probenecid",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfamazone",
                "sulfamethoxazole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfasalazine",
                "sulfentrazone",
                "sulfisoxazole",
                "sumatriptan",
                "tamsulosin",
                "torasemide",
                "trichlormethiazide",
                "valdecoxib",
                "zonisamide"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SMN)",
            "Sulfacetamide (SCM)",
            "Sulfadiazine (SDZ)",
            "Sulfamethoxazole (SMX)",
            "Sulfadoxine (SDX)",
            "Sulfasalazine (SSZ)",
            "Sulfamethizole (SMZ)",
            "Sulfamethoxypyridazine (SMP)",
            "Sulfadimethoxine (SDM)",
            "Sulfaquinoxaline (SQX)",
            "Sulfachlorpyridazine (SCP)",
            "Sulfamerazine (SMR)",
            "Sulfaphenazole (SPZ)",
            "Sulfanitran (SNT)",
            "Sulfabenzamide (SBZ)",
            "Sulfacytine (SCY)",
            "Sulfaguanidine (SGN)",
            "Sulfapyridine (SPY)",
            "Sulfathiazole (STZ)",
            "Sulfisoxazole (SIX)",
            "Sulfamoxole (SMX)",
            "Sulfacetamide sodium (SCN)",
            "Sulfadimidine (SDM)",
            "Sulfamonomethoxine (SMM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SMN)",
                "Sulfacetamide (SCM)",
                "Sulfadiazine (SDZ)",
                "Sulfamethoxazole (SMX)",
                "Sulfadoxine (SDX)",
                "Sulfasalazine (SSZ)",
                "Sulfamethizole (SMZ)",
                "Sulfamethoxypyridazine (SMP)",
                "Sulfadimethoxine (SDM)",
                "Sulfachlorpyridazine (SCP)",
                "Sulfamerazine (SMR)",
                "Sulfaphenazole (SPZ)",
                "Sulfabenzamide (SBZ)",
                "Sulfacytine (SCY)",
                "Sulfaguanidine (SGN)",
                "Sulfapyridine (SPY)",
                "Sulfathiazole (STZ)",
                "Sulfisoxazole (SIX)",
                "Sulfamoxole (SMX)",
                "Sulfamonomethoxine (SMM)"
            ],
            "mismatches": [
                "Sulfaquinoxaline (SQX)",
                "Sulfanitran (SNT)",
                "Sulfacetamide sodium (SCN)",
                "Sulfadimidine (SDM)"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "sulfabenzamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfacytine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamethylthiazole",
                "sulfametrole",
                "sulfamoxole",
                "sulfamoylbenzoate",
                "sulfanilamide",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfasalazine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SULF)",
            "Sulfamethoxazole (SMTX)",
            "Sulfadiazine (SDFZ)",
            "Sulfapyridine (SPYR)",
            "Sulfadoxine (SDOX)",
            "Sulfamethizole (SMTZ)",
            "Sulfamethoxypyridazine (SMXPZ)",
            "Sulfamethoxine (SMXN)",
            "Sulfamerazine (SMRZ)",
            "Sulfamethazine (SMTZ)",
            "Sulfadimethoxine (SDMX)",
            "Sulfacetamide (SACT)",
            "Sulfamonomethoxine (SMMX)",
            "Sulfaguanidine (SGDN)",
            "Sulfadimidine (SDMD)",
            "Sulfamoxole (SMXL)",
            "Sulfanitran (SNTN)",
            "Sulfaphenazole (SPNZ)",
            "Sulfabenzamide (SBZD)",
            "Sulfathiazole (STHZ)",
            "Sulfaperin (SPRN)",
            "Sulfamethoxine (SMXN)",
            "Sulfadoxine (SDOX)",
            "Sulfadimethoxine (SDMX)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (SULF)",
                "Sulfamethoxazole (SMTX)",
                "Sulfadiazine (SDFZ)",
                "Sulfapyridine (SPYR)",
                "Sulfadoxine (SDOX)",
                "Sulfamethizole (SMTZ)",
                "Sulfamethoxypyridazine (SMXPZ)",
                "Sulfamerazine (SMRZ)",
                "Sulfamethazine (SMTZ)",
                "Sulfadimethoxine (SDMX)",
                "Sulfacetamide (SACT)",
                "Sulfamonomethoxine (SMMX)",
                "Sulfaguanidine (SGDN)",
                "Sulfamoxole (SMXL)",
                "Sulfaphenazole (SPNZ)",
                "Sulfabenzamide (SBZD)",
                "Sulfathiazole (STHZ)",
                "Sulfaperin (SPRN)"
            ],
            "mismatches": [
                "Sulfamethoxine (SMXN)",
                "Sulfadimidine (SDMD)",
                "Sulfanitran (SNTN)"
            ],
            "true_referents": [
                "4-sulfanilamidobenzoic acid",
                "N-benzyl-4-sulfamoylbenzamide",
                "Sulfamonomethoxine",
                "sulfabenzamide",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxypyridazine",
                "sulfamethylthiazole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfaperin",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfentrazone",
                "sulfisoxazole"
            ],
            "TP": 18,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (1)",
            "Sulfapyridine (2)",
            "Sulfadiazine (3)",
            "Sulfamethoxazole (4)",
            "Sulfadoxine (5)",
            "Sulfamerazine (6)",
            "Sulfamethizole (7)",
            "Sulfacetamide (8)",
            "Sulfasalazine (9)",
            "Sulfamethoxazole-trimethoprim (10)",
            "Sulfadimethoxine (11)",
            "Sulfadoxine-pyrimethamine (12)",
            "Sulfameter (13)",
            "Sulfamonomethoxine (14)",
            "Sulfapyridine (15)",
            "Sulfamethoxazole (16)",
            "Sulfadimethoxine (17)",
            "Sulfadoxine (18)",
            "Sulfameter (19)",
            "Sulfamonomethoxine (20)",
            "Sulfapyridine (21)",
            "Sulfamethoxazole-trimethoprim (22)",
            "Sulfadimethoxine (23)",
            "Sulfadoxine-pyrimethamine (24)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide (1)",
                "Sulfapyridine (2)",
                "Sulfadiazine (3)",
                "Sulfamethoxazole (4)",
                "Sulfadoxine (5)",
                "Sulfamerazine (6)",
                "Sulfamethizole (7)",
                "Sulfacetamide (8)",
                "Sulfasalazine (9)",
                "Sulfadimethoxine (11)",
                "Sulfamonomethoxine (14)"
            ],
            "mismatches": [
                "Sulfamethoxazole-trimethoprim (10)",
                "Sulfadoxine-pyrimethamine (12)",
                "Sulfameter (13)",
                "Sulfameter (19)",
                "Sulfamethoxazole-trimethoprim (22)",
                "Sulfadoxine-pyrimethamine (24)"
            ],
            "true_referents": [
                "(S)-sulfamazone",
                "4-sulfanilamidobenzoic acid",
                "Sulfamonomethoxine",
                "sulfacetamide",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfadoxine",
                "sulfamerazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfametrole",
                "sulfamoxole",
                "sulfanilamide",
                "sulfapyridine",
                "sulfasalazine",
                "sulfasomizole"
            ],
            "TP": 11,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": [
            "Sulfanilamide (SUL)",
            "Sulfamethoxazole (SMZ)",
            "Sulfadiazine (SDZ)",
            "Sulfisoxazole (SXZ)",
            "Sulfathalidine (STZ)",
            "Sulfacetamide (SU)",
            "Sulfamethazine (SMT)",
            "Sulfapyridine (SPY)",
            "Sulfafurazole (SFZ)",
            "Sulfadimethoxine (SDM)",
            "Sulfachloropyridazine (SCP)",
            "Sulfamonomethoxine (SMM)",
            "Sulfaphenazole (SPH)",
            "Sulfadimidine (SDI)",
            "Sulfametoxydiazine (SMD)",
            "Celecoxib (SCB)",
            "Furosemide (FSM)",
            "Azosulfamide (AZS)",
            "Sulfanitran (SNT)",
            "Sulfaphenide (SPN)",
            "Sulfaguanidine (SGD)",
            "Sulfanilic acid (SLA)",
            "Sulfacetamide sodium (SAS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Sulfanilamide",
                "Sulfamethoxazole",
                "Sulfadiazine",
                "Sulfisoxazole",
                "Sulfacetamide",
                "Sulfamethazine",
                "Sulfapyridine",
                "Sulfadimethoxine",
                "Sulfachloropyridazine",
                "Sulfamonomethoxine",
                "Sulfaphenazole",
                "Celecoxib",
                "Furosemide",
                "Sulfaguanidine"
            ],
            "mismatches": [
                "Sulfathalidine",
                "Sulfafurazole",
                "Sulfadimidine",
                "Sulfametoxydiazine",
                "Azosulfamide",
                "Sulfanitran",
                "Sulfaphenide",
                "Sulfanilic acid",
                "Sulfacetamide sodium"
            ],
            "true_referents": [
                "(S)-metazosulfuron",
                "2-aminobenzenesulfonamide",
                "4-sulfanilamidobenzoic acid",
                "Sulfamerazine sodium",
                "Sulfamonomethoxine",
                "celecoxib",
                "flusulfamide",
                "furosemide",
                "parecoxib",
                "sulfacarbamide",
                "sulfacetamide",
                "sulfachloropyridazine",
                "sulfachlorpyrazine",
                "sulfadiazine",
                "sulfadimethoxine",
                "sulfaethoxypyridazine",
                "sulfaguanidine",
                "sulfaguanole",
                "sulfamerazine",
                "sulfamethazine",
                "sulfamethizole",
                "sulfamethoxazole",
                "sulfamethoxydiazine",
                "sulfanilamide",
                "sulfaphenazole",
                "sulfapyridine",
                "sulfathiazole",
                "sulfisomidine",
                "sulfisoxazole",
                "thiazosulfone",
                "valdecoxib"
            ],
            "TP": 14,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "sulfonamide",
        "domain": "chemistry",
        "response": "error when calling model 'amazon.titan-text-express-v1': empty response",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]