[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (SCZ)",
            "Bipolar Disorder (BD)",
            "Major Depressive Disorder (MDD)",
            "Anxiety Disorder (AD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Eating Disorder (ED)",
            "Dissociative Identity Disorder (DID)",
            "Attention Deficit Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Schizoaffective Disorder (SZA)",
            "Borderline Personality Disorder (BPD)",
            "Generalized Anxiety Disorder (GAD)",
            "Social Anxiety Disorder (SAD)",
            "Specific Phobia (SP)",
            "Panic Disorder (PD)",
            "Conduct Disorder (CD)",
            "Oppositional Defiant Disorder (ODD)",
            "Substance Use Disorder (SUD)",
            "Insomnia Disorder (ID)",
            "Narcissistic Personality Disorder (NPD)",
            "Avoidant Personality Disorder (AVPD)",
            "Histrionic Personality Disorder (HPD)",
            "Dependent Personality Disorder (DPD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Dissociative Identity Disorder",
                "Autism Spectrum Disorder",
                "Borderline Personality Disorder",
                "Panic Disorder",
                "Conduct Disorder",
                "Oppositional Defiant Disorder",
                "Narcissistic Personality Disorder",
                "Histrionic Personality Disorder",
                "Dependent Personality Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder",
                "Anxiety Disorder",
                "Post-Traumatic Stress Disorder",
                "Eating Disorder",
                "Attention Deficit Hyperactivity Disorder",
                "Schizoaffective Disorder",
                "Generalized Anxiety Disorder",
                "Social Anxiety Disorder",
                "Specific Phobia",
                "Substance Use Disorder",
                "Insomnia Disorder",
                "Avoidant Personality Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cocaine-Related Disorders",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Disruptive, Impulse Control, and Conduct Disorders",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Dyssomnias",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Idiopathic Hypersomnia",
                "Narcissistic Personality Disorder",
                "Neurotic Disorders",
                "Obsessive-Compulsive Disorder",
                "Oppositional Defiant Disorder",
                "Panic Disorder",
                "Passive-Aggressive Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Sleep Initiation and Maintenance Disorders",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance Withdrawal Syndrome",
                "Substance-Related Disorders",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Major Depressive Disorder (MDD)",
            "Bipolar Disorder",
            "Schizophrenia",
            "Obsessive-Compulsive Disorder (OCD)",
            "Generalized Anxiety Disorder (GAD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Social Anxiety Disorder",
            "Panic Disorder",
            "Borderline Personality Disorder (BPD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Anorexia Nervosa",
            "Bulimia Nervosa",
            "Antisocial Personality Disorder",
            "Histrionic Personality Disorder",
            "Narcissistic Personality Disorder",
            "Avoidant Personality Disorder",
            "Schizotypal Personality Disorder",
            "Paranoid Personality Disorder",
            "Substance-Induced Psychotic Disorder",
            "Delusional Disorder",
            "Body Dysmorphic Disorder",
            "Hoarding Disorder",
            "Trichotillomania (Hair-Pulling Disorder)",
            "Rumination Disorder",
            "Trichotillomania"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bipolar Disorder",
                "Schizophrenia",
                "Obsessive-Compulsive Disorder (OCD)",
                "Panic Disorder",
                "Borderline Personality Disorder (BPD)",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Antisocial Personality Disorder",
                "Histrionic Personality Disorder",
                "Narcissistic Personality Disorder",
                "Schizotypal Personality Disorder",
                "Paranoid Personality Disorder",
                "Body Dysmorphic Disorder",
                "Hoarding Disorder",
                "Trichotillomania",
                "Rumination Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Social Anxiety Disorder",
                "Attention-Deficit/Hyperactivity Disorder (ADHD)",
                "Avoidant Personality Disorder",
                "Substance-Induced Psychotic Disorder",
                "Delusional Disorder",
                "Trichotillomania (Hair-Pulling Disorder)"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Body Dysmorphic Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cognition Disorders",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Cyclothymic Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dysthymic Disorder",
                "Factitious Disorders",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Paranoid Disorders",
                "Paranoid Personality Disorder",
                "Passive-Aggressive Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Psychoses, Substance-Induced",
                "Psychotic Disorders",
                "Rumination Syndrome",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Shared Paranoid Disorder",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Trauma and Stressor Related Disorders",
                "Trichotillomania"
            ],
            "TP": 16,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia",
            "Bipolar Disorder",
            "Major Depressive Disorder",
            "Anxiety Disorder",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Attention Deficit Hyperactivity Disorder (ADHD)",
            "Eating Disorders (e.g., Anorexia Nervosa, Bulimia Nervosa)",
            "Autism Spectrum Disorder",
            "Borderline Personality Disorder",
            "Dementia",
            "Alzheimer's Disease",
            "Parkinson's Disease",
            "Huntington's Disease",
            "Multiple Sclerosis",
            "Epilepsy",
            "Tourette Syndrome",
            "Narcolepsy",
            "Chronic Fatigue Syndrome",
            "Fibromyalgia",
            "Chronic Pain Syndrome",
            "Somatic Symptom Disorder",
            "Dissociative Identity Disorder",
            "Panic Disorder",
            "Seasonal Affective Disorder (SAD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Anxiety Disorders",
                "Obsessive-Compulsive Disorder",
                "Autism Spectrum Disorder",
                "Borderline Personality Disorder",
                "Dementia",
                "Huntington Disease",
                "Tourette Syndrome",
                "Narcolepsy",
                "Dissociative Identity Disorder",
                "Panic Disorder",
                "Seasonal Affective Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Attention Deficit Hyperactivity Disorder (ADHD)",
                "Eating Disorders (e.g., Anorexia Nervosa, Bulimia Nervosa)",
                "Alzheimer's Disease",
                "Parkinson's Disease",
                "Multiple Sclerosis",
                "Epilepsy",
                "Chronic Fatigue Syndrome",
                "Fibromyalgia",
                "Chronic Pain Syndrome",
                "Somatic Symptom Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Alzheimer Disease",
                "Anorexia Nervosa",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cognitive Dysfunction",
                "Compulsive Personality Disorder",
                "Cyclothymic Disorder",
                "Dementia",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Dyssomnias",
                "Hoarding Disorder",
                "Huntington Disease",
                "Hypochondriasis",
                "Lewy Body Disease",
                "Motor Disorders",
                "Narcissistic Personality Disorder",
                "Narcolepsy",
                "Neurasthenia",
                "Neurocognitive Disorders",
                "Obsessive-Compulsive Disorder",
                "Panic Disorder",
                "Personality Disorders",
                "Phobic Disorders",
                "Psychotic Disorders",
                "Restless Legs Syndrome",
                "Schizophrenia",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Seasonal Affective Disorder",
                "Sleep Wake Disorders",
                "Somatoform Disorders",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Tic Disorders",
                "Tourette Syndrome",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 13,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Major Depressive Disorder (MDD)",
            "Schizophrenia (SCH)",
            "Bipolar Disorder (BD)",
            "Generalized Anxiety Disorder (GAD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Panic Disorder (PD)",
            "Social Anxiety Disorder (SAD)",
            "Borderline Personality Disorder (BPD)",
            "Narcissistic Personality Disorder (NPD)",
            "Antisocial Personality Disorder (ASPD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Anorexia Nervosa (AN)",
            "Bulimia Nervosa (BN)",
            "Body Dysmorphic Disorder (BDD)",
            "Delusional Disorder (DD)",
            "Dissociative Identity Disorder (DID)",
            "Histrionic Personality Disorder (HPD)",
            "Avoidant Personality Disorder (AvPD)",
            "Paranoid Personality Disorder (PPD)",
            "Cyclothymic Disorder (CTD)",
            "Dysthymic Disorder (DD)",
            "Seasonal Affective Disorder (SAD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Panic Disorder",
                "Borderline Personality Disorder",
                "Narcissistic Personality Disorder",
                "Antisocial Personality Disorder",
                "Autism Spectrum Disorder",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Dissociative Identity Disorder",
                "Histrionic Personality Disorder",
                "Paranoid Personality Disorder",
                "Cyclothymic Disorder",
                "Dysthymic Disorder",
                "Seasonal Affective Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Schizophrenia (SCH)",
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Social Anxiety Disorder (SAD)",
                "Attention-Deficit/Hyperactivity Disorder (ADHD)",
                "Body Dysmorphic Disorder (BDD)",
                "Delusional Disorder (DD)",
                "Avoidant Personality Disorder (AvPD)"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Body Dysmorphic Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Compulsive Personality Disorder",
                "Cyclothymic Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Dysthymic Disorder",
                "Factitious Disorders",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Mood Disorders",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Paranoid Disorders",
                "Paranoid Personality Disorder",
                "Passive-Aggressive Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia, Catatonic",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Seasonal Affective Disorder",
                "Shared Paranoid Disorder",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Major Depressive Disorder (MDD)",
            "Bipolar Disorder (BD)",
            "Schizophrenia",
            "Generalized Anxiety Disorder (GAD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Panic Disorder",
            "Social Anxiety Disorder",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Borderline Personality Disorder (BPD)",
            "Antisocial Personality Disorder",
            "Avoidant Personality Disorder",
            "Dependent Personality Disorder",
            "Histrionic Personality Disorder",
            "Narcissistic Personality Disorder",
            "Paranoid Personality Disorder",
            "Schizoid Personality Disorder",
            "Schizotypal Personality Disorder",
            "Anorexia Nervosa",
            "Bulimia Nervosa",
            "Binge-Eating Disorder",
            "Dissociative Identity Disorder (DID)",
            "Somatic Symptom Disorder"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bipolar Disorder (BD)",
                "Schizophrenia",
                "Obsessive-Compulsive Disorder (OCD)",
                "Panic Disorder",
                "Autism Spectrum Disorder (ASD)",
                "Borderline Personality Disorder (BPD)",
                "Antisocial Personality Disorder",
                "Dependent Personality Disorder",
                "Histrionic Personality Disorder",
                "Narcissistic Personality Disorder",
                "Paranoid Personality Disorder",
                "Schizoid Personality Disorder",
                "Schizotypal Personality Disorder",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Binge-Eating Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Social Anxiety Disorder",
                "Attention-Deficit/Hyperactivity Disorder (ADHD)",
                "Avoidant Personality Disorder",
                "Dissociative Identity Disorder (DID)",
                "Somatic Symptom Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Dysthymic Disorder",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Hypochondriasis",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Paranoid Disorders",
                "Paranoid Personality Disorder",
                "Passive-Aggressive Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Psychotic Disorders",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Shared Paranoid Disorder",
                "Social Communication Disorder",
                "Somatoform Disorders",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Major Depressive Disorder (MDD)",
            "Generalized Anxiety Disorder (GAD)",
            "Bipolar Disorder (BD)",
            "Schizophrenia (SCZ)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Social Anxiety Disorder (SAD)",
            "Panic Disorder (PD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Borderline Personality Disorder (BPD)",
            "Autism Spectrum Disorder (ASD)",
            "Eating Disorder Not Otherwise Specified (EDNOS)",
            "Dysthymic Disorder (Persistent Depressive Disorder)",
            "Specific Phobia (SP)",
            "Agoraphobia (AG)",
            "Seasonal Affective Disorder (SAD)",
            "Substance Use Disorder (SUD)",
            "Schizoaffective Disorder (SAD)",
            "Psychotic Disorder Due to Another Medical Condition",
            "Delusional Disorder (DD)",
            "Intermittent Explosive Disorder (IED)",
            "Narcissistic Personality Disorder (NPD)",
            "Histrionic Personality Disorder (HPD)",
            "Adjustment Disorder (AD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Major Depressive Disorder (MDD)",
                "Bipolar Disorder (BD)",
                "Schizophrenia (SCZ)",
                "Obsessive-Compulsive Disorder (OCD)",
                "Panic Disorder (PD)",
                "Borderline Personality Disorder (BPD)",
                "Autism Spectrum Disorder (ASD)",
                "Dysthymic Disorder (Persistent Depressive Disorder)",
                "Agoraphobia (AG)",
                "Seasonal Affective Disorder (SAD)",
                "Narcissistic Personality Disorder (NPD)",
                "Histrionic Personality Disorder (HPD)",
                "Adjustment Disorder (AD)"
            ],
            "mismatches": [
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Social Anxiety Disorder (SAD)",
                "Attention-Deficit/Hyperactivity Disorder (ADHD)",
                "Eating Disorder Not Otherwise Specified (EDNOS)",
                "Specific Phobia (SP)",
                "Substance Use Disorder (SUD)",
                "Schizoaffective Disorder (SAD)",
                "Psychotic Disorder Due to Another Medical Condition",
                "Delusional Disorder (DD)",
                "Intermittent Explosive Disorder (IED)"
            ],
            "true_referents": [
                "Adjustment Disorders",
                "Agoraphobia",
                "Anorexia Nervosa",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cocaine-Related Disorders",
                "Combat Disorders",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Disruptive, Impulse Control, and Conduct Disorders",
                "Dissociative Identity Disorder",
                "Dysthymic Disorder",
                "Factitious Disorders",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Mood Disorders",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Psychotic Disorders",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Seasonal Affective Disorder",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance Withdrawal Syndrome",
                "Substance-Related Disorders",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (SCZ)",
            "Major Depressive Disorder (MDD)",
            "Bipolar Disorder (BD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Generalized Anxiety Disorder (GAD)",
            "Panic Disorder (PD)",
            "Social Anxiety Disorder (SAD)",
            "Borderline Personality Disorder (BPD)",
            "Antisocial Personality Disorder (ASPD)",
            "Attention Deficit Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Dissociative Identity Disorder (DID)",
            "Body Dysmorphic Disorder (BDD)",
            "Specific Phobia (SP)",
            "Agoraphobia (AG)",
            "Paranoid Personality Disorder (PPD)",
            "Histrionic Personality Disorder (HPD)",
            "Narcissistic Personality Disorder (NPD)",
            "Dependent Personality Disorder (DPD)",
            "Anorexia Nervosa (AN)",
            "Bulimia Nervosa (BN)",
            "Substance Use Disorder (SUD)",
            "Gaming Disorder (GD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Major Depressive Disorder",
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Post-Traumatic Stress Disorder",
                "Panic Disorder",
                "Borderline Personality Disorder",
                "Antisocial Personality Disorder",
                "Autism Spectrum Disorder",
                "Dissociative Identity Disorder",
                "Body Dysmorphic Disorders",
                "Agoraphobia",
                "Paranoid Personality Disorder",
                "Histrionic Personality Disorder",
                "Narcissistic Personality Disorder",
                "Dependent Personality Disorder",
                "Anorexia Nervosa",
                "Bulimia Nervosa"
            ],
            "mismatches": [
                "Generalized Anxiety Disorder",
                "Social Anxiety Disorder",
                "Attention Deficit Hyperactivity Disorder",
                "Specific Phobia",
                "Substance Use Disorder",
                "Gaming Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Body Dysmorphic Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cocaine-Related Disorders",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Paranoid Disorders",
                "Paranoid Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Shared Paranoid Disorder",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance Withdrawal Syndrome",
                "Substance-Related Disorders",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia",
            "Major depressive disorder",
            "Bipolar disorder",
            "Generalized anxiety disorder",
            "Obsessive-compulsive disorder",
            "Post-traumatic stress disorder",
            "Attention deficit hyperactivity disorder",
            "Autism spectrum disorder",
            "Alzheimer's disease",
            "Parkinson's disease",
            "Huntington's disease",
            "Multiple sclerosis",
            "Amyotrophic lateral sclerosis",
            "Epilepsy",
            "Cancer",
            "Diabetes",
            "HIV/AIDS",
            "Malaria",
            "Tuberculosis",
            "Influenza",
            "COVID-19",
            "Sickle cell anemia",
            "Cystic fibrosis",
            "Rheumatoid arthritis"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Depressive Disorder, Major",
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Stress Disorders, Post-Traumatic",
                "Autism Spectrum Disorder",
                "Huntington Disease"
            ],
            "mismatches": [
                "Generalized anxiety disorder",
                "Attention deficit hyperactivity disorder",
                "Alzheimer's disease",
                "Parkinson's disease",
                "Multiple sclerosis",
                "Amyotrophic lateral sclerosis",
                "Epilepsy",
                "Cancer",
                "Diabetes",
                "HIV/AIDS",
                "Malaria",
                "Tuberculosis",
                "Influenza",
                "COVID-19",
                "Sickle cell anemia",
                "Cystic fibrosis",
                "Rheumatoid arthritis"
            ],
            "true_referents": [
                "AIDS Dementia Complex",
                "Agoraphobia",
                "Alzheimer Disease",
                "Anorexia Nervosa",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Chemotherapy-Related Cognitive Impairment",
                "Communication Disorders",
                "Compulsive Personality Disorder",
                "Creutzfeldt-Jakob Syndrome",
                "Cyclothymic Disorder",
                "Dementia",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Diabulimia",
                "Hoarding Disorder",
                "Huntington Disease",
                "Hypochondriasis",
                "Kluver-Bucy Syndrome",
                "Lewy Body Disease",
                "Morgellons Disease",
                "Motor Disorders",
                "Neurasthenia",
                "Neurocognitive Disorders",
                "Obsessive-Compulsive Disorder",
                "Panic Disorder",
                "Psychotic Disorders",
                "Schizophrenia",
                "Schizophrenia, Paranoid",
                "Seasonal Affective Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (SCH)",
            "Bipolar Disorder (BD)",
            "Major Depressive Disorder (MDD)",
            "Generalized Anxiety Disorder (GAD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Borderline Personality Disorder (BPD)",
            "Antisocial Personality Disorder (ASPD)",
            "Narcissistic Personality Disorder (NPD)",
            "Histrionic Personality Disorder (HPD)",
            "Avoidant Personality Disorder (AVPD)",
            "Dependent Personality Disorder (DPD)",
            "Paranoid Personality Disorder (PPD)",
            "Schizotypal Personality Disorder (STPD)",
            "Bulimia Nervosa (BN)",
            "Anorexia Nervosa (AN)",
            "Panic Disorder (PD)",
            "Social Anxiety Disorder (SAD)",
            "Specific Phobias",
            "Cyclothymic Disorder",
            "Dissociative Identity Disorder (DID)",
            "Somatic Symptom Disorder"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Attention Deficit Disorder with Hyperactivity",
                "Autism Spectrum Disorder",
                "Obsessive-Compulsive Disorder",
                "Borderline Personality Disorder",
                "Antisocial Personality Disorder",
                "Narcissistic Personality Disorder",
                "Histrionic Personality Disorder",
                "Dependent Personality Disorder",
                "Paranoid Personality Disorder",
                "Schizotypal Personality Disorder",
                "Bulimia Nervosa",
                "Anorexia Nervosa",
                "Panic Disorder",
                "Cyclothymic Disorder",
                "Dissociative Identity Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Avoidant Personality Disorder (AVPD)",
                "Social Anxiety Disorder (SAD)",
                "Specific Phobias",
                "Somatic Symptom Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Compulsive Personality Disorder",
                "Cyclothymic Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Dysthymic Disorder",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Hypochondriasis",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Paranoid Disorders",
                "Paranoid Personality Disorder",
                "Passive-Aggressive Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia, Catatonic",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Shared Paranoid Disorder",
                "Social Communication Disorder",
                "Somatoform Disorders",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Major Depressive Disorder (MDD)",
            "Generalized Anxiety Disorder (GAD)",
            "Bipolar Disorder",
            "Schizophrenia",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Borderline Personality Disorder (BPD)",
            "Anorexia Nervosa",
            "Bulimia Nervosa",
            "Attention Deficit Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Social Anxiety Disorder",
            "Panic Disorder",
            "Agoraphobia",
            "Specific Phobias",
            "Dissociative Identity Disorder (DID)",
            "Schizoaffective Disorder",
            "Body Dysmorphic Disorder (BDD)",
            "Trichotillomania",
            "Kleptomania",
            "Pyromania",
            "Gambling Disorder",
            "Substance Use Disorders",
            "Antisocial Personality Disorder"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Bipolar Disorder",
                "Schizophrenia",
                "Obsessive-Compulsive Disorder (OCD)",
                "Borderline Personality Disorder (BPD)",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Autism Spectrum Disorder (ASD)",
                "Panic Disorder",
                "Agoraphobia",
                "Dissociative Identity Disorder (DID)",
                "Body Dysmorphic Disorder (BDD)",
                "Trichotillomania",
                "Gambling Disorder",
                "Antisocial Personality Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Attention Deficit Hyperactivity Disorder (ADHD)",
                "Social Anxiety Disorder",
                "Specific Phobias",
                "Schizoaffective Disorder",
                "Kleptomania",
                "Pyromania",
                "Substance Use Disorders"
            ],
            "true_referents": [
                "Agoraphobia",
                "Alcohol-Related Disorders",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Body Dysmorphic Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Cyclothymic Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Gambling",
                "Hoarding Disorder",
                "Masochism",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Pedophilia",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Psychotic Disorders",
                "Sadism",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance-Related Disorders",
                "Tobacco Use Disorder",
                "Trauma and Stressor Related Disorders",
                "Trichotillomania"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (SZ)",
            "Bipolar Disorder (BD)",
            "Major Depressive Disorder (MDD)",
            "Generalized Anxiety Disorder (GAD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Borderline Personality Disorder (BPD)",
            "Narcissistic Personality Disorder (NPD)",
            "Panic Disorder (PD)",
            "Agoraphobia",
            "Social Anxiety Disorder (SAD)",
            "Specific Phobia",
            "Anorexia Nervosa (AN)",
            "Bulimia Nervosa (BN)",
            "Binge Eating Disorder (BED)",
            "Substance Use Disorder (SUD)",
            "Delusional Disorder",
            "Brief Psychotic Disorder",
            "Schizoaffective Disorder",
            "Cyclothymic Disorder",
            "Persistent Depressive Disorder (Dysthymia)",
            "Premenstrual Dysphoric Disorder (PMDD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Attention Deficit Disorder with Hyperactivity",
                "Autism Spectrum Disorder",
                "Borderline Personality Disorder",
                "Narcissistic Personality Disorder",
                "Panic Disorder",
                "Agoraphobia",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Cyclothymic Disorder",
                "Premenstrual Dysphoric Disorder",
                "Dysthymic Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Generalized Anxiety Disorder (GAD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Social Anxiety Disorder (SAD)",
                "Specific Phobia",
                "Binge Eating Disorder (BED)",
                "Substance Use Disorder (SUD)",
                "Delusional Disorder",
                "Brief Psychotic Disorder",
                "Schizoaffective Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cocaine-Related Disorders",
                "Compulsive Personality Disorder",
                "Cyclothymic Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dysthymic Disorder",
                "Factitious Disorders",
                "Hoarding Disorder",
                "Mood Disorders",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Premenstrual Dysphoric Disorder",
                "Psychotic Disorders",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance Withdrawal Syndrome",
                "Substance-Related Disorders",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 14,
            "FP": 10,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (SCZ)",
            "Major Depressive Disorder (MDD)",
            "Bipolar Disorder (BD)",
            "Generalized Anxiety Disorder (GAD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Panic Disorder (PD)",
            "Social Anxiety Disorder (SAD)",
            "Specific Phobia",
            "Agoraphobia",
            "Anorexia Nervosa (AN)",
            "Bulimia Nervosa (BN)",
            "Binge Eating Disorder (BED)",
            "Substance Use Disorder (SUD)",
            "Alcohol Use Disorder (AUD)",
            "Gambling Disorder",
            "Autism Spectrum Disorder (ASD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Borderline Personality Disorder (BPD)",
            "Antisocial Personality Disorder (ASPD)",
            "Dissociative Identity Disorder (DID)",
            "Somatic Symptom Disorder",
            "Conversion Disorder",
            "Factitious Disorder"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Major Depressive Disorder",
                "Bipolar Disorder",
                "Post-Traumatic Stress Disorder",
                "Obsessive-Compulsive Disorder",
                "Panic Disorder",
                "Agoraphobia",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Binge Eating Disorder",
                "Gambling",
                "Autism Spectrum Disorder",
                "Borderline Personality Disorder",
                "Antisocial Personality Disorder",
                "Dissociative Identity Disorder",
                "Conversion Disorder",
                "Factitious Disorders"
            ],
            "mismatches": [
                "Generalized Anxiety Disorder",
                "Social Anxiety Disorder",
                "Specific Phobia",
                "Substance Use Disorder",
                "Alcohol Use Disorder",
                "Attention-Deficit/Hyperactivity Disorder",
                "Somatic Symptom Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Alcohol-Related Disorders",
                "Alcoholism",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge Drinking",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cocaine-Related Disorders",
                "Compulsive Personality Disorder",
                "Conversion Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Factitious Disorders",
                "Gambling",
                "Hoarding Disorder",
                "Hypochondriasis",
                "Munchausen Syndrome",
                "Munchausen Syndrome by Proxy",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Social Communication Disorder",
                "Somatoform Disorders",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance Withdrawal Syndrome",
                "Substance-Related Disorders",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (Sz)",
            "Bipolar Disorder (BD)",
            "Major Depressive Disorder (MDD)",
            "Generalized Anxiety Disorder (GAD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Borderline Personality Disorder (BPD)",
            "Autism Spectrum Disorder (ASD)",
            "Attention-Deficit/Hyperactivity Disorder (ADHD)",
            "Substance Use Disorder (SUD)",
            "Anorexia Nervosa (AN)",
            "Bulimia Nervosa (BN)",
            "Panic Disorder (PD)",
            "Social Anxiety Disorder (SAD)",
            "Body Dysmorphic Disorder (BDD)",
            "Hoarding Disorder (HD)",
            "Excoriation Disorder (ED)",
            "Trichotillomania (TTM)",
            "Tourette's Syndrome (TS)",
            "Oppositional Defiant Disorder (ODD)",
            "Conduct Disorder (CD)",
            "Antisocial Personality Disorder (ASPD)",
            "Narcissistic Personality Disorder (NPD)",
            "Avoidant Personality Disorder (AvPD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Borderline Personality Disorder",
                "Autism Spectrum Disorder",
                "Anorexia Nervosa",
                "Bulimia Nervosa",
                "Panic Disorder",
                "Hoarding Disorder",
                "Excoriation Disorder",
                "Trichotillomania",
                "Tourette Syndrome",
                "Oppositional Defiant Disorder",
                "Conduct Disorder",
                "Antisocial Personality Disorder",
                "Narcissistic Personality Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder",
                "Generalized Anxiety Disorder",
                "Post-Traumatic Stress Disorder",
                "Attention-Deficit/Hyperactivity Disorder",
                "Substance Use Disorder",
                "Social Anxiety Disorder",
                "Body Dysmorphic Disorder",
                "Avoidant Personality Disorder"
            ],
            "true_referents": [
                "Agoraphobia",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Body Dysmorphic Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cocaine-Related Disorders",
                "Combat Disorders",
                "Compulsive Personality Disorder",
                "Conduct Disorder",
                "Dependent Personality Disorder",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Disruptive, Impulse Control, and Conduct Disorders",
                "Excoriation Disorder",
                "Hoarding Disorder",
                "Narcissistic Personality Disorder",
                "Obsessive-Compulsive Disorder",
                "Oppositional Defiant Disorder",
                "Orthorexia Nervosa",
                "Panic Disorder",
                "Passive-Aggressive Personality Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Social Communication Disorder",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Substance Withdrawal Syndrome",
                "Substance-Related Disorders",
                "Tourette Syndrome",
                "Trauma and Stressor Related Disorders",
                "Trichotillomania"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (Schiz)",
            "Bipolar Disorder (Bipol)",
            "Major Depressive Disorder (MDD)",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Anxiety Disorder",
            "Attention Deficit Hyperactivity Disorder (ADHD)",
            "Autism Spectrum Disorder (ASD)",
            "Borderline Personality Disorder (BPD)",
            "Dissociative Identity Disorder (DID)",
            "Generalized Anxiety Disorder (GAD)",
            "Histrionic Personality Disorder",
            "Hypochondriasis",
            "Mood Disorder",
            "Narcissistic Personality Disorder",
            "Obsessive-Compulsive Personality Disorder",
            "Panic Disorder",
            "Personality Disorder",
            "Postpartum Depression",
            "Psychotic Disorder",
            "Social Anxiety Disorder",
            "Somatization Disorder",
            "Traumatic Brain Injury (TBI)",
            "Unipolar Depression"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Obsessive-Compulsive Disorder",
                "Anxiety Disorder",
                "Autism Spectrum Disorder",
                "Borderline Personality Disorder",
                "Dissociative Identity Disorder",
                "Histrionic Personality Disorder",
                "Hypochondriasis",
                "Mood Disorder",
                "Narcissistic Personality Disorder",
                "Panic Disorder",
                "Personality Disorder",
                "Psychotic Disorder",
                "Somatization Disorder"
            ],
            "mismatches": [
                "Major Depressive Disorder (MDD)",
                "Post-Traumatic Stress Disorder (PTSD)",
                "Attention Deficit Hyperactivity Disorder (ADHD)",
                "Generalized Anxiety Disorder (GAD)",
                "Obsessive-Compulsive Personality Disorder",
                "Postpartum Depression",
                "Social Anxiety Disorder",
                "Traumatic Brain Injury (TBI)",
                "Unipolar Depression"
            ],
            "true_referents": [
                "Agoraphobia",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Cognitive Dysfunction",
                "Compulsive Personality Disorder",
                "Depression, Postpartum",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Dysthymic Disorder",
                "Histrionic Personality Disorder",
                "Hoarding Disorder",
                "Hypochondriasis",
                "Mood Disorders",
                "Narcissistic Personality Disorder",
                "Neurocognitive Disorders",
                "Neurotic Disorders",
                "Obsessive-Compulsive Disorder",
                "Panic Disorder",
                "Personality Disorders",
                "Phobia, Social",
                "Phobic Disorders",
                "Psychotic Disorders",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Social Communication Disorder",
                "Somatoform Disorders",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            "Schizophrenia (SCZ)",
            "Bipolar Disorder (BD)",
            "Major Depressive Disorder (MDD)",
            "Anxiety Disorder",
            "Post-Traumatic Stress Disorder (PTSD)",
            "Obsessive-Compulsive Disorder (OCD)",
            "Autism Spectrum Disorder (ASD)",
            "Attention Deficit Hyperactivity Disorder (ADHD)",
            "Dissociative Identity Disorder (DID)",
            "Eating Disorder",
            "Somatoform Disorder",
            "Tourette Syndrome",
            "Chronic Fatigue Syndrome",
            "Fibromyalgia",
            "Irritable Bowel Syndrome (IBS)",
            "Multiple Chemical Sensitivity (MCS)",
            "Dementia",
            "Delirium",
            "Psychotic Disorder",
            "Mood Disorder",
            "Personality Disorder",
            "Adjustment Disorder",
            "Dissociative Disorder",
            "Trauma and Stressor-Related Disorder"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Bipolar Disorder",
                "Depressive Disorder, Major",
                "Anxiety Disorders",
                "Stress Disorders, Post-Traumatic",
                "Obsessive-Compulsive Disorder",
                "Autism Spectrum Disorder",
                "Attention Deficit Disorder with Hyperactivity",
                "Dissociative Identity Disorder",
                "Somatoform Disorders",
                "Tourette Syndrome",
                "Dementia",
                "Delirium",
                "Psychotic Disorders",
                "Mood Disorders",
                "Personality Disorders",
                "Adjustment Disorders",
                "Dissociative Disorders",
                "Trauma and Stressor Related Disorders"
            ],
            "mismatches": [
                "Eating Disorder",
                "Chronic Fatigue Syndrome",
                "Fibromyalgia",
                "Irritable Bowel Syndrome (IBS)",
                "Multiple Chemical Sensitivity (MCS)"
            ],
            "true_referents": [
                "Adjustment Disorders",
                "Alzheimer Disease",
                "Anorexia Nervosa",
                "Antisocial Personality Disorder",
                "Anxiety Disorders",
                "Asperger Syndrome",
                "Attention Deficit Disorder with Hyperactivity",
                "Attention Deficit and Disruptive Behavior Disorders",
                "Autism Spectrum Disorder",
                "Autistic Disorder",
                "Binge-Eating Disorder",
                "Bipolar Disorder",
                "Bipolar and Related Disorders",
                "Borderline Personality Disorder",
                "Bulimia Nervosa",
                "Cognitive Dysfunction",
                "Compulsive Personality Disorder",
                "Delirium",
                "Dementia",
                "Depressive Disorder",
                "Depressive Disorder, Major",
                "Depressive Disorder, Treatment-Resistant",
                "Dissociative Disorders",
                "Dissociative Identity Disorder",
                "Encopresis",
                "Enuresis",
                "Hoarding Disorder",
                "Hypochondriasis",
                "Mood Disorders",
                "Munchausen Syndrome",
                "Narcolepsy",
                "Neurasthenia",
                "Neurotic Disorders",
                "Obsessive-Compulsive Disorder",
                "Panic Disorder",
                "Personality Disorders",
                "Phobic Disorders",
                "Psychoses, Substance-Induced",
                "Psychotic Disorders",
                "Restless Legs Syndrome",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder",
                "Seasonal Affective Disorder",
                "Somatoform Disorders",
                "Stress Disorders, Post-Traumatic",
                "Stress Disorders, Traumatic",
                "Tic Disorders",
                "Tourette Syndrome",
                "Trauma and Stressor Related Disorders"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "mental disorder",
        "domain": "medicine",
        "response": [
            [
                "Referent",
                "Schizophrenia"
            ],
            [
                "Referent",
                "Schizoaffective disorder"
            ],
            [
                "Referent",
                "Delusional disorder"
            ],
            [
                "Referent",
                "Brief psychotic disorder"
            ],
            [
                "Referent",
                "Psychotic disorder not otherwise specified"
            ],
            [
                "Referent",
                "Schizotypal personality disorder"
            ],
            [
                "Referent",
                "Schizophreniform disorder"
            ],
            [
                "Referent",
                "Unspecified psychotic disorder"
            ]
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Schizophrenia",
                "Schizotypal personality disorder"
            ],
            "mismatches": [
                "Schizoaffective disorder",
                "Delusional disorder",
                "Brief psychotic disorder",
                "Psychotic disorder not otherwise specified",
                "Schizophreniform disorder",
                "Unspecified psychotic disorder"
            ],
            "true_referents": [
                "Dissociative Identity Disorder",
                "Factitious Disorders",
                "Psychotic Disorders",
                "Schizoid Personality Disorder",
                "Schizophrenia",
                "Schizophrenia Spectrum and Other Psychotic Disorders",
                "Schizophrenia, Catatonic",
                "Schizophrenia, Paranoid",
                "Schizotypal Personality Disorder"
            ],
            "TP": 2,
            "FP": 6,
            "FN": 0
        }
    }
]