[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "neuron (N)",
            "synapse",
            "neurotransmitter",
            "neural pathway",
            "glial cell",
            "cerebral cortex",
            "hippocampus",
            "amygdala",
            "thalamus",
            "hypothalamus",
            "basal ganglia",
            "cerebellum",
            "brainstem",
            "neurovascular unit",
            "neural tube",
            "neurogenesis",
            "neural crest",
            "neurotransmitter receptor",
            "neural stem cell",
            "neural circuit",
            "neurotransmitter transporter",
            "neuroepithelium",
            "neural lobe",
            "neural crest cell"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cerebral cortex",
                "hippocampus",
                "amygdala",
                "thalamus",
                "hypothalamus",
                "basal ganglia",
                "cerebellum"
            ],
            "mismatches": [
                "neuron (N)",
                "synapse",
                "neurotransmitter",
                "neural pathway",
                "glial cell",
                "brainstem",
                "neurovascular unit",
                "neural tube",
                "neurogenesis",
                "neural crest",
                "neurotransmitter receptor",
                "neural stem cell",
                "neural circuit",
                "neurotransmitter transporter",
                "neuroepithelium",
                "neural lobe",
                "neural crest cell"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellum",
                "Cerebral Aqueduct",
                "Cerebral Cortex",
                "Cerebrum",
                "Choroid Plexus",
                "Corpus Striatum",
                "Entorhinal Cortex",
                "Glymphatic System",
                "Gray Matter",
                "Hippocampus",
                "Hypothalamus",
                "Limbic Lobe",
                "Limbic System",
                "Locus Coeruleus",
                "Medulla Oblongata",
                "Middle Hypothalamus",
                "Neocortex",
                "Neostriatum",
                "Nucleus Accumbens",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Purkinje Cells",
                "Substantia Nigra",
                "Subthalamus",
                "Thalamic Nuclei",
                "Thalamus"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Cerebral cortex (CC)",
            "Hippocampus (HIPP)",
            "Amygdala (AMY)",
            "Thalamus (TH)",
            "Hypothalamus (HYPO)",
            "Pituitary gland (PIT)",
            "Cerebellum (CB)",
            "Medulla oblongata (MO)",
            "Pons (PONS)",
            "Spinal cord (SC)",
            "Basal ganglia (BG)",
            "Corpus callosum (CC)",
            "Lateral ventricle (LV)",
            "Third ventricle (3V)",
            "Fourth ventricle (4V)",
            "Optic nerve (ON)",
            "Olfactory bulb (OB)",
            "Broca's area (BA)",
            "Wernicke's area (WA)",
            "Primary motor cortex (PMC)",
            "Primary sensory cortex (PSC)",
            "Prefrontal cortex (PFC)",
            "Occipital lobe (OL)",
            "Temporal lobe (TL)",
            "Frontal lobe (FL)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Hippocampus",
                "Amygdala",
                "Thalamus",
                "Hypothalamus",
                "Pituitary gland",
                "Cerebellum",
                "Medulla oblongata",
                "Pons",
                "Basal ganglia",
                "Corpus callosum",
                "Lateral ventricle",
                "Third ventricle",
                "Fourth ventricle",
                "Olfactory bulb",
                "Wernicke's area",
                "Prefrontal cortex",
                "Occipital lobe",
                "Temporal lobe",
                "Frontal lobe"
            ],
            "mismatches": [
                "Spinal cord",
                "Optic nerve",
                "Broca's area",
                "Primary motor cortex",
                "Primary sensory cortex"
            ],
            "true_referents": [
                "Amygdala",
                "Anterior Pituitary Gland",
                "Basal Forebrain",
                "Basal Ganglia",
                "Brain Stem",
                "Broca Area",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Corpus Callosum",
                "Dentate Gyrus",
                "Diagonal Band of Broca",
                "Dorsolateral Prefrontal Cortex",
                "Fourth Ventricle",
                "Frontal Lobe",
                "Hippocampus",
                "Hypothalamus",
                "Lateral Ventricles",
                "Medulla Oblongata",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Myelencephalon",
                "Neocortex",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Olfactory Cortex",
                "Optic Chiasm",
                "Optic Tract",
                "Parietal Lobe",
                "Periamygdaloid Cortex",
                "Pituitary Gland",
                "Pons",
                "Pontine Tegmentum",
                "Prefrontal Cortex",
                "Primary Visual Cortex",
                "Somatosensory Cortex",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "Visual Cortex",
                "Wernicke Area"
            ],
            "TP": 20,
            "FP": 5,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (Neuron)",
            "Astrocyte (Astrocyte)",
            "Oligodendrocyte (Oligodendrocyte)",
            "Microglia (Microglia)",
            "Ependymal Cell (Ependymal Cell)",
            "Schwann Cell (Schwann Cell)",
            "Sensory neuron (Sensory neuron)",
            "Motor neuron (Motor neuron)",
            "Interneuron (Interneuron)",
            "Purkinje cell (Purkinje cell)",
            "Granule cell (Granule cell)",
            "Pyramidal cell (Pyramidal cell)",
            "Basal Ganglia (Basal Ganglia)",
            "Hippocampus (Hippocampus)",
            "Amygdala (Amygdala)",
            "Cerebellum (Cerebellum)",
            "Thalamus (Thalamus)",
            "Hypothalamus (Hypothalamus)",
            "Corpus Callosum (Corpus Callosum)",
            "Brainstem (Brainstem)",
            "Cerebral Cortex (Cerebral Cortex)",
            "Spinal Cord (Spinal Cord)",
            "Nucleus Accumbens (Nucleus Accumbens)",
            "Substantia Nigra (Substantia Nigra)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Basal Ganglia",
                "Hippocampus",
                "Amygdala",
                "Cerebellum",
                "Thalamus",
                "Hypothalamus",
                "Corpus Callosum",
                "Nucleus Accumbens",
                "Substantia Nigra"
            ],
            "mismatches": [
                "Neuron (Neuron)",
                "Astrocyte (Astrocyte)",
                "Oligodendrocyte (Oligodendrocyte)",
                "Microglia (Microglia)",
                "Ependymal Cell (Ependymal Cell)",
                "Schwann Cell (Schwann Cell)",
                "Sensory neuron (Sensory neuron)",
                "Motor neuron (Motor neuron)",
                "Interneuron (Interneuron)",
                "Purkinje cell (Purkinje cell)",
                "Granule cell (Granule cell)",
                "Pyramidal cell (Pyramidal cell)",
                "Brainstem (Brainstem)",
                "Cerebral Cortex (Cerebral Cortex)",
                "Spinal Cord (Spinal Cord)"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebrum",
                "Corpus Callosum",
                "Corpus Striatum",
                "Entorhinal Cortex",
                "Ependyma",
                "Gray Matter",
                "Hippocampus",
                "Hypothalamus",
                "Mesencephalon",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Neocortex",
                "Neostriatum",
                "Nucleus Accumbens",
                "Olfactory Bulb",
                "Prosencephalon",
                "Purkinje Cells",
                "Somatosensory Cortex",
                "Substantia Nigra",
                "Subthalamus",
                "Telencephalon",
                "Thalamic Nuclei",
                "Thalamus",
                "Trigeminal Motor Nucleus",
                "White Matter"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (N)",
            "Glial Cell (GC)",
            "Synapse (S)",
            "Axon (Ax)",
            "Dendrite (D)",
            "Myelin Sheath (MS)",
            "Node of Ranvier (NR)",
            "Brainstem (BS)",
            "Cerebellum (Cb)",
            "Cerebrum (Cx)",
            "Hippocampus (Hi)",
            "Amygdala (Am)",
            "Thalamus (Th)",
            "Hypothalamus (Hyp)",
            "Corpus Callosum (CC)",
            "Basal Ganglia (BG)",
            "Ventricle (V)",
            "Cerebrospinal Fluid (CSF)",
            "Blood-Brain Barrier (BBB)",
            "Gray Matter (GM)",
            "White Matter (WM)",
            "Prefrontal Cortex (PFC)",
            "Broca's Area (BA)",
            "Wernicke's Area (WA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Brainstem",
                "Cerebellum",
                "Cerebrum",
                "Hippocampus",
                "Amygdala",
                "Thalamus",
                "Hypothalamus",
                "Corpus Callosum",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Gray Matter",
                "White Matter",
                "Prefrontal Cortex",
                "Broca's Area",
                "Wernicke's Area"
            ],
            "mismatches": [
                "Neuron (N)",
                "Glial Cell (GC)",
                "Synapse (S)",
                "Axon (Ax)",
                "Dendrite (D)",
                "Myelin Sheath (MS)",
                "Node of Ranvier (NR)",
                "Ventricle (V)",
                "Cerebrospinal Fluid (CSF)"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Forebrain",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Brain Stem",
                "Broca Area",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Choroid Plexus",
                "Corpus Callosum",
                "Dentate Gyrus",
                "Diagonal Band of Broca",
                "Dorsolateral Prefrontal Cortex",
                "Fourth Ventricle",
                "Frontal Lobe",
                "Gray Matter",
                "Hippocampal CA1 Region",
                "Hippocampus",
                "Hypothalamus",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Myelencephalon",
                "Neocortex",
                "Nucleus Raphe Magnus",
                "Olfactory Bulb",
                "Parietal Lobe",
                "Periamygdaloid Cortex",
                "Prefrontal Cortex",
                "Prosencephalon",
                "Red Nucleus",
                "Reticular Formation",
                "Telencephalon",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "Wernicke Area",
                "White Matter"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron",
            "Astrocyte",
            "Oligodendrocyte",
            "Microglia",
            "Ependymal Cell",
            "Pyramidal Cell",
            "Purkinje Cell",
            "Granule Cell",
            "Basket Cell",
            "Stellate Cell",
            "Chandelier Cell",
            "Interneuron",
            "Thalamocortical Neuron",
            "Cerebellar Neuron",
            "Glial Cell",
            "Schwann Cell",
            "Radial Glia",
            "Bergmann Glia",
            "Mossy Fiber",
            "Climbing Fiber",
            "Synapse",
            "Dendrite",
            "Axon",
            "Blood-Brain Barrier"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Blood-Brain Barrier"
            ],
            "mismatches": [
                "Neuron",
                "Astrocyte",
                "Oligodendrocyte",
                "Microglia",
                "Ependymal Cell",
                "Pyramidal Cell",
                "Purkinje Cell",
                "Granule Cell",
                "Basket Cell",
                "Stellate Cell",
                "Chandelier Cell",
                "Interneuron",
                "Thalamocortical Neuron",
                "Cerebellar Neuron",
                "Glial Cell",
                "Schwann Cell",
                "Radial Glia",
                "Bergmann Glia",
                "Mossy Fiber",
                "Climbing Fiber",
                "Synapse",
                "Dendrite",
                "Axon"
            ],
            "true_referents": [
                "Barrington's Nucleus",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Cerebellar Cortex",
                "Cerebellar Golgi Cells",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Choroid Plexus",
                "Entorhinal Cortex",
                "Ependyma",
                "Epithalamus",
                "Globus Pallidus",
                "Glymphatic System",
                "Gray Matter",
                "Hippocampal Mossy Fibers",
                "Hippocampus",
                "Intralaminar Thalamic Nuclei",
                "Kolliker-Fuse Nucleus",
                "Motor Cortex",
                "Neocortex",
                "Prosencephalon",
                "Purkinje Cells",
                "Solitary Nucleus",
                "Tectospinal Fibers",
                "Telencephalon",
                "Thalamic Nuclei",
                "Thalamus",
                "Visual Cortex",
                "White Matter"
            ],
            "TP": 1,
            "FP": 23,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (N)",
            "Glial cell (GC)",
            "Synapse (S)",
            "Cortex (C)",
            "Hippocampus (H)",
            "Amygdala (A)",
            "Thalamus (T)",
            "Hypothalamus (HYP)",
            "Cerebellum (CB)",
            "Brainstem (BS)",
            "Basal ganglia (BG)",
            "Corpus callosum (CC)",
            "Limbic system (LS)",
            "White matter (WM)",
            "Gray matter (GM)",
            "Ventricles (V)",
            "Meninges (M)",
            "Prefrontal cortex (PFC)",
            "Occipital lobe (OL)",
            "Temporal lobe (TL)",
            "Parietal lobe (PL)",
            "Insular cortex (IC)",
            "Substantia nigra (SN)",
            "Medulla oblongata (MO)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Hippocampus",
                "Amygdala",
                "Thalamus",
                "Hypothalamus",
                "Cerebellum",
                "Basal Ganglia",
                "Corpus Callosum",
                "Limbic System",
                "White Matter",
                "Gray Matter",
                "Prefrontal Cortex",
                "Occipital Lobe",
                "Temporal Lobe",
                "Parietal Lobe",
                "Insular Cortex",
                "Substantia Nigra",
                "Medulla Oblongata"
            ],
            "mismatches": [
                "Neuron (N)",
                "Glial cell (GC)",
                "Synapse (S)",
                "Cortex (C)",
                "Brainstem (BS)",
                "Ventricles (V)",
                "Meninges (M)"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Forebrain",
                "Basal Ganglia",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Choroid Plexus",
                "Corpus Callosum",
                "Corpus Striatum",
                "Dorsolateral Prefrontal Cortex",
                "Frontal Lobe",
                "Gray Matter",
                "Hippocampal CA1 Region",
                "Hippocampus",
                "Hypothalamus",
                "Insular Cortex",
                "Lateral Ventricles",
                "Limbic Lobe",
                "Limbic System",
                "Medulla Oblongata",
                "Metencephalon",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Myelencephalon",
                "Neocortex",
                "Neostriatum",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Parietal Lobe",
                "Pontine Tegmentum",
                "Prefrontal Cortex",
                "Prosencephalon",
                "Substantia Nigra",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "Visual Cortex",
                "White Matter"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Frontal Lobe (FL)",
            "Temporal Lobe (TL)",
            "Parietal Lobe (PL)",
            "Occipital Lobe (OL)",
            "Cerebellum (CB)",
            "Thalamus (TH)",
            "Hypothalamus (HY)",
            "Amygdala (AM)",
            "Hippocampus (HC)",
            "Midbrain (MB)",
            "Pons (PO)",
            "Medulla Oblongata (MO)",
            "Basal Ganglia (BG)",
            "Corpus Callosum (CC)",
            "Brainstem (BS)",
            "Prefrontal Cortex (PFC)",
            "Primary Motor Cortex (PMC)",
            "Primary Sensory Cortex (PSC)",
            "Primary Visual Cortex (PVC)",
            "Primary Auditory Cortex (PAC)",
            "Broca's Area (BA)",
            "Wernicke's Area (WA)",
            "Cingulate Cortex (CCx)",
            "Insular Cortex (IC)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Frontal Lobe",
                "Temporal Lobe",
                "Parietal Lobe",
                "Occipital Lobe",
                "Cerebellum",
                "Thalamus",
                "Hypothalamus",
                "Amygdala",
                "Hippocampus",
                "Pons",
                "Medulla Oblongata",
                "Basal Ganglia",
                "Corpus Callosum",
                "Prefrontal Cortex",
                "Primary Visual Cortex",
                "Wernicke Area",
                "Insular Cortex"
            ],
            "mismatches": [
                "Midbrain",
                "Brainstem",
                "Primary Motor Cortex",
                "Primary Sensory Cortex",
                "Primary Auditory Cortex",
                "Broca's Area",
                "Cingulate Cortex"
            ],
            "true_referents": [
                "Amygdala",
                "Auditory Cortex",
                "Basal Forebrain",
                "Basal Ganglia",
                "Brain Stem",
                "Broca Area",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebrum",
                "Corpus Callosum",
                "Diagonal Band of Broca",
                "Dorsolateral Prefrontal Cortex",
                "Frontal Lobe",
                "Gyrus Cinguli",
                "Hippocampal CA1 Region",
                "Hippocampus",
                "Hypothalamus",
                "Insular Cortex",
                "Limbic Lobe",
                "Medulla Oblongata",
                "Midbrain Reticular Formation",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Olivary Nucleus",
                "Parietal Lobe",
                "Periamygdaloid Cortex",
                "Pons",
                "Pontine Tegmentum",
                "Prefrontal Cortex",
                "Primary Visual Cortex",
                "Prosencephalon",
                "Somatosensory Cortex",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Visual Cortex",
                "Wernicke Area"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron",
            "Glia cell",
            "Cerebral cortex",
            "Hippocampus",
            "Cerebellum",
            "Thalamus",
            "Amygdala",
            "Hypothalamus",
            "Brainstem",
            "Pituitary gland",
            "Olfactory bulb",
            "Basal ganglia",
            "Cerebral ventricles",
            "Spinal cord",
            "Pons",
            "Medulla oblongata",
            "Cranial nerves",
            "White matter",
            "Grey matter",
            "Cerebral hemisphere",
            "Frontal lobe",
            "Parietal lobe",
            "Temporal lobe",
            "Occipital lobe"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Hippocampus",
                "Cerebellum",
                "Thalamus",
                "Amygdala",
                "Hypothalamus",
                "Pituitary gland",
                "Olfactory bulb",
                "Basal ganglia",
                "Cerebral ventricles",
                "Pons",
                "Medulla oblongata",
                "White matter",
                "Frontal lobe",
                "Parietal lobe",
                "Temporal lobe",
                "Occipital lobe"
            ],
            "mismatches": [
                "Neuron",
                "Glia cell",
                "Brainstem",
                "Spinal cord",
                "Cranial nerves",
                "Grey matter",
                "Cerebral hemisphere"
            ],
            "true_referents": [
                "Amygdala",
                "Anterior Pituitary Gland",
                "Basal Ganglia",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Golgi Cells",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Epithalamus",
                "Frontal Lobe",
                "Gray Matter",
                "Hippocampus",
                "Hypothalamus",
                "Lateral Ventricles",
                "Locus Coeruleus",
                "Medulla Oblongata",
                "Middle Hypothalamus",
                "Neocortex",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Olfactory Cortex",
                "Parietal Lobe",
                "Pituitary Gland",
                "Pons",
                "Prefrontal Cortex",
                "Purkinje Cells",
                "Subthalamus",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "Visual Cortex",
                "White Matter"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (NRN)",
            "Astrocyte (AST)",
            "Oligodendrocyte (OLIG)",
            "Microglia (MG)",
            "Cortical Column",
            "Hippocampal Dentate Gyrus",
            "Basal Ganglia",
            "Thalamic Nucleus",
            "Cerebellar Cortex",
            "Corpus Callosum",
            "Amygdala",
            "Hypothalamus",
            "Broca's Area",
            "Wernicke's Area",
            "Purkinje Cell",
            "Pyramidal Neuron",
            "Reticular Formation",
            "Limbic System",
            "Striatum",
            "Red Nucleus",
            "Superior Colliculus",
            "Inferior Colliculus",
            "Pineal Gland",
            "Substantia Nigra"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Basal Ganglia",
                "Cerebellar Cortex",
                "Corpus Callosum",
                "Amygdala",
                "Hypothalamus",
                "Reticular Formation",
                "Limbic System",
                "Red Nucleus",
                "Pineal Gland",
                "Substantia Nigra"
            ],
            "mismatches": [
                "Neuron (NRN)",
                "Astrocyte (AST)",
                "Oligodendrocyte (OLIG)",
                "Microglia (MG)",
                "Cortical Column",
                "Hippocampal Dentate Gyrus",
                "Thalamic Nucleus",
                "Broca's Area",
                "Wernicke's Area",
                "Purkinje Cell",
                "Pyramidal Neuron",
                "Striatum",
                "Superior Colliculus",
                "Inferior Colliculus"
            ],
            "true_referents": [
                "Amygdala",
                "Auditory Cortex",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Broca Area",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebrum",
                "Corpus Callosum",
                "Corpus Striatum",
                "Dentate Gyrus",
                "Diagonal Band of Broca",
                "Entopeduncular Nucleus",
                "Hippocampus",
                "Hypothalamus",
                "Inferior Colliculi",
                "Limbic Lobe",
                "Limbic System",
                "Metencephalon",
                "Midbrain Reticular Formation",
                "Middle Hypothalamus",
                "Myelencephalon",
                "Neocortex",
                "Neostriatum",
                "Occipital Lobe",
                "Parietal Lobe",
                "Pineal Gland",
                "Piriform Cortex",
                "Pituitary Gland",
                "Posterior Thalamic Nuclei",
                "Purkinje Cells",
                "Red Nucleus",
                "Reticular Formation",
                "Solitary Nucleus",
                "Substantia Nigra",
                "Subthalamus",
                "Superior Colliculi",
                "Telencephalon",
                "Thalamic Nuclei",
                "Thalamus",
                "Ventral Striatum",
                "Ventral Tegmental Area",
                "Wernicke Area",
                "White Matter"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (nerve cell)",
            "Synapse",
            "Glial cell",
            "Cerebral cortex",
            "Hippocampus",
            "Amygdala",
            "Thalamus",
            "Hypothalamus",
            "Cerebellum",
            "Brainstem",
            "Corpus callosum",
            "Basal ganglia",
            "Prefrontal cortex",
            "Occipital lobe",
            "Temporal lobe",
            "Parietal lobe",
            "Frontal lobe",
            "Pituitary gland",
            "Pineal gland",
            "Ventricle",
            "Meninges",
            "Substantia nigra",
            "Nucleus accumbens",
            "Cingulate cortex"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Hippocampus",
                "Amygdala",
                "Thalamus",
                "Hypothalamus",
                "Cerebellum",
                "Corpus callosum",
                "Basal ganglia",
                "Prefrontal cortex",
                "Occipital lobe",
                "Temporal lobe",
                "Parietal lobe",
                "Frontal lobe",
                "Pituitary gland",
                "Pineal gland",
                "Substantia nigra",
                "Nucleus accumbens"
            ],
            "mismatches": [
                "Neuron (nerve cell)",
                "Synapse",
                "Glial cell",
                "Brainstem",
                "Ventricle",
                "Meninges",
                "Cingulate cortex"
            ],
            "true_referents": [
                "Amygdala",
                "Anterior Pituitary Gland",
                "Basal Ganglia",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Choroid Plexus",
                "Corpus Callosum",
                "Corpus Striatum",
                "Dorsolateral Prefrontal Cortex",
                "Fourth Ventricle",
                "Frontal Lobe",
                "Gray Matter",
                "Gyrus Cinguli",
                "Hippocampus",
                "Hypothalamus",
                "Medulla Oblongata",
                "Metencephalon",
                "Middle Hypothalamus",
                "Neocortex",
                "Neostriatum",
                "Nucleus Accumbens",
                "Occipital Lobe",
                "Parietal Lobe",
                "Pineal Gland",
                "Pituitary Gland",
                "Prefrontal Cortex",
                "Prosencephalon",
                "Purkinje Cells",
                "Substantia Nigra",
                "Subthalamus",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "Ventral Striatum"
            ],
            "TP": 17,
            "FP": 7,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron",
            "Glial cell",
            "Synapse",
            "Axon",
            "Dendrite",
            "Soma (Cell body)",
            "Myelin sheath",
            "Neurotransmitter",
            "Ion channel",
            "Receptor",
            "Cerebral cortex",
            "Hippocampus",
            "Amygdala",
            "Thalamus",
            "Hypothalamus",
            "Cerebellum",
            "Brainstem",
            "Spinal cord",
            "Basal ganglia",
            "Corpus callosum",
            "Olfactory bulb",
            "Limbic system",
            "Broca's area",
            "Wernicke's area"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Hippocampus",
                "Amygdala",
                "Thalamus",
                "Hypothalamus",
                "Cerebellum",
                "Basal ganglia",
                "Corpus callosum",
                "Olfactory bulb",
                "Limbic system"
            ],
            "mismatches": [
                "Neuron",
                "Glial cell",
                "Synapse",
                "Axon",
                "Dendrite",
                "Soma (Cell body)",
                "Myelin sheath",
                "Neurotransmitter",
                "Ion channel",
                "Receptor",
                "Brainstem",
                "Spinal cord",
                "Broca's area",
                "Wernicke's area"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Ganglia",
                "Brain Stem",
                "Broca Area",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebrum",
                "Corpus Callosum",
                "Corpus Striatum",
                "Diagonal Band of Broca",
                "Gray Matter",
                "Hippocampus",
                "Hypothalamus",
                "Internal Capsule",
                "Limbic Lobe",
                "Limbic System",
                "Medulla Oblongata",
                "Middle Hypothalamus",
                "Neocortex",
                "Olfactory Bulb",
                "Olfactory Cortex",
                "Parietal Lobe",
                "Perforant Pathway",
                "Purkinje Cells",
                "Somatosensory Cortex",
                "Subthalamus",
                "Thalamic Nuclei",
                "Thalamus",
                "Ventral Tegmental Area",
                "Visual Cortex",
                "Wernicke Area",
                "White Matter"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (N)",
            "Cerebral cortex (CC)",
            "Hippocampus (H)",
            "Amygdala (A)",
            "Thalamus (T)",
            "Hypothalamus (HT)",
            "Basal ganglia (BG)",
            "Cerebellum (CB)",
            "Brainstem (BS)",
            "Corpus callosum (CC)",
            "White matter (WM)",
            "Gray matter (GM)",
            "Frontal lobe (FL)",
            "Parietal lobe (PL)",
            "Temporal lobe (TL)",
            "Occipital lobe (OL)",
            "Glial cells (GC)",
            "Synapses (S)",
            "Neurotransmitters (NT)",
            "Myelin sheath (MS)",
            "Ventricles (V)",
            "Meninges (M)",
            "Blood-brain barrier (BBB)",
            "Cerebrospinal fluid (CSF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Hippocampus",
                "Amygdala",
                "Thalamus",
                "Hypothalamus",
                "Basal ganglia",
                "Cerebellum",
                "Corpus callosum",
                "White matter",
                "Gray matter",
                "Frontal lobe",
                "Parietal lobe",
                "Temporal lobe",
                "Occipital lobe",
                "Blood-brain barrier"
            ],
            "mismatches": [
                "Neuron",
                "Brainstem",
                "Glial cells",
                "Synapses",
                "Neurotransmitters",
                "Myelin sheath",
                "Ventricles",
                "Meninges",
                "Cerebrospinal fluid"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Forebrain",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Choroid Plexus",
                "Corpus Callosum",
                "Corpus Striatum",
                "Frontal Lobe",
                "Gray Matter",
                "Hippocampal CA1 Region",
                "Hippocampus",
                "Hypothalamus",
                "Lateral Ventricles",
                "Metencephalon",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Myelencephalon",
                "Neocortex",
                "Neostriatum",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Parietal Lobe",
                "Prosencephalon",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "White Matter"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Neuron (N)",
            "Astrocyte (A)",
            "Oligodendrocyte (O)",
            "Microglia (M)",
            "Cerebral cortex (CC)",
            "Hippocampus (H)",
            "Amygdala (Am)",
            "Basal ganglia (BG)",
            "Thalamus (T)",
            "Hypothalamus (Ht)",
            "Brainstem (BS)",
            "Cerebellum (Cb)",
            "Ventricle (V)",
            "Corpus callosum (CC)",
            "Frontal lobe (FL)",
            "Parietal lobe (PL)",
            "Temporal lobe (TL)",
            "Occipital lobe (OL)",
            "Prefrontal cortex (PFC)",
            "Motor cortex (MC)",
            "Sensory cortex (SC)",
            "Limbic system (LS)",
            "White matter (WM)",
            "Gray matter (GM)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Hippocampus",
                "Amygdala",
                "Basal ganglia",
                "Thalamus",
                "Hypothalamus",
                "Cerebellum",
                "Corpus callosum",
                "Frontal lobe",
                "Parietal lobe",
                "Temporal lobe",
                "Occipital lobe",
                "Prefrontal cortex",
                "Limbic system",
                "White matter",
                "Gray matter"
            ],
            "mismatches": [
                "Neuron (N)",
                "Astrocyte (A)",
                "Oligodendrocyte (O)",
                "Microglia (M)",
                "Brainstem (BS)",
                "Ventricle (V)",
                "Motor cortex (MC)",
                "Sensory cortex (SC)"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Forebrain",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebral Ventricles",
                "Cerebrum",
                "Corpus Callosum",
                "Dorsolateral Prefrontal Cortex",
                "Fourth Ventricle",
                "Frontal Lobe",
                "Gray Matter",
                "Hippocampal CA1 Region",
                "Hippocampus",
                "Hypothalamus",
                "Limbic Lobe",
                "Limbic System",
                "Mesencephalon",
                "Metencephalon",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Neocortex",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Parietal Lobe",
                "Prefrontal Cortex",
                "Prosencephalon",
                "Sensorimotor Cortex",
                "Somatosensory Cortex",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Third Ventricle",
                "White Matter"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Synapse (Syn)",
            "Neuron",
            "Dendrite",
            "Axon",
            "Terminal button",
            "Nerve ending",
            "Neuroglia",
            "Microglia",
            "Oligodendrocyte",
            "Astrocyte",
            "Ependymal cell",
            "Cerebral cortex",
            "Cerebellum",
            "Brainstem",
            "Thalamus",
            "Hypothalamus",
            "Pons",
            "Medulla oblongata",
            "Cerebral hemisphere",
            "Cerebral lobe",
            "Frontal lobe",
            "Parietal lobe",
            "Temporal lobe",
            "Occipital lobe",
            "Basal ganglia"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex",
                "Cerebellum",
                "Thalamus",
                "Hypothalamus",
                "Pons",
                "Medulla oblongata",
                "Frontal lobe",
                "Parietal lobe",
                "Temporal lobe",
                "Occipital lobe"
            ],
            "mismatches": [
                "Synapse (Syn)",
                "Neuron",
                "Dendrite",
                "Axon",
                "Terminal button",
                "Nerve ending",
                "Neuroglia",
                "Microglia",
                "Oligodendrocyte",
                "Astrocyte",
                "Ependymal cell",
                "Brainstem",
                "Cerebral hemisphere",
                "Cerebral lobe",
                "Basal ganglia"
            ],
            "true_referents": [
                "Blood-Brain Barrier",
                "Brain Stem",
                "Cerebellar Cortex",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebrum",
                "Ependyma",
                "Epithalamus",
                "External Capsule",
                "Frontal Lobe",
                "Hippocampus",
                "Hypothalamus",
                "Locus Coeruleus",
                "Medulla Oblongata",
                "Middle Hypothalamus",
                "Motor Cortex",
                "Neocortex",
                "Nucleus Accumbens",
                "Occipital Lobe",
                "Olfactory Bulb",
                "Parietal Lobe",
                "Pons",
                "Prefrontal Cortex",
                "Prosencephalon",
                "Purkinje Cells",
                "Somatosensory Cortex",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Ventral Striatum",
                "Visual Cortex",
                "White Matter"
            ],
            "TP": 10,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            "Cerebral cortex (CTX)",
            "Basal ganglia (BG)",
            "Hippocampus (HP)",
            "Amygdala (Amy)",
            "Cerebellum (CB)",
            "Brainstem (BS)",
            "Frontal lobe (FL)",
            "Parietal lobe (PL)",
            "Temporal lobe (TL)",
            "Occipital lobe (OL)",
            "Insula (I)",
            "Cingulate gyrus (CG)",
            "Thalamus (Thal)",
            "Hypothalamus (Hyp)",
            "Pons (P)",
            "Medulla oblongata (MO)",
            "Cerebral hemisphere (CH)",
            "Limbic system (LS)",
            "Default mode network (DMN)",
            "Salience network (SN)",
            "Central executive network (CEN)",
            "Basal forebrain (BFB)",
            "Neurogliovascular unit (NGVU)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cerebral cortex (CTX)",
                "Basal ganglia (BG)",
                "Hippocampus (HP)",
                "Amygdala (Amy)",
                "Cerebellum (CB)",
                "Frontal lobe (FL)",
                "Parietal lobe (PL)",
                "Temporal lobe (TL)",
                "Occipital lobe (OL)",
                "Thalamus (Thal)",
                "Hypothalamus (Hyp)",
                "Pons (P)",
                "Medulla oblongata (MO)",
                "Basal forebrain (BFB)"
            ],
            "mismatches": [
                "Brainstem (BS)",
                "Insula (I)",
                "Cingulate gyrus (CG)",
                "Cerebral hemisphere (CH)",
                "Limbic system (LS)",
                "Default mode network (DMN)",
                "Salience network (SN)",
                "Central executive network (CEN)",
                "Neurogliovascular unit (NGVU)"
            ],
            "true_referents": [
                "Amygdala",
                "Basal Forebrain",
                "Basal Ganglia",
                "Blood-Brain Barrier",
                "Brain Stem",
                "Central Amygdaloid Nucleus",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebral Cortex",
                "Cerebrum",
                "Choroid Plexus",
                "Dorsolateral Prefrontal Cortex",
                "Dorsomedial Hypothalamic Nucleus",
                "Frontal Lobe",
                "Gyrus Cinguli",
                "Hippocampus",
                "Hypothalamus",
                "Insular Cortex",
                "Lateral Ventricles",
                "Limbic Lobe",
                "Limbic System",
                "Locus Coeruleus",
                "Medulla Oblongata",
                "Middle Hypothalamus",
                "Neocortex",
                "Occipital Lobe",
                "Parahippocampal Gyrus",
                "Parietal Lobe",
                "Pons",
                "Pontine Tegmentum",
                "Posterior Thalamic Nuclei",
                "Prefrontal Cortex",
                "Primary Visual Cortex",
                "Prosencephalon",
                "Purkinje Cells",
                "Substantia Innominata",
                "Telencephalon",
                "Temporal Lobe",
                "Thalamic Nuclei",
                "Thalamus",
                "Visual Cortex"
            ],
            "TP": 14,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "brain structure",
        "domain": "medicine",
        "response": [
            {
                "referent": "amygdala",
                "canonical name": "amygdala"
            },
            {
                "referent": "basal ganglia",
                "canonical name": "basal ganglia"
            },
            {
                "referent": "cerebellum",
                "canonical name": "cerebellum"
            },
            {
                "referent": "hippocampus",
                "canonical name": "hippocampus"
            },
            {
                "referent": "hypothalamus",
                "canonical name": "hypothalamus"
            },
            {
                "referent": "limbic system",
                "canonical name": "limbic system"
            },
            {
                "referent": "medulla oblongata",
                "canonical name": "medulla oblongata"
            },
            {
                "referent": "midbrain",
                "canonical name": "midbrain"
            },
            {
                "referent": "pons",
                "canonical name": "pons"
            },
            {
                "referent": "pituitary gland",
                "canonical name": "pituitary gland"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            },
            {
                "referent": "thalamus",
                "canonical name": "thalamus"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "amygdala",
                "basal ganglia",
                "cerebellum",
                "hippocampus",
                "hypothalamus",
                "limbic system",
                "medulla oblongata",
                "pons",
                "pituitary gland",
                "thalamus"
            ],
            "mismatches": [
                "midbrain"
            ],
            "true_referents": [
                "Amygdala",
                "Anterior Pituitary Gland",
                "Basal Ganglia",
                "Cerebellar Cortex",
                "Cerebellar Nuclei",
                "Cerebellum",
                "Cerebrum",
                "Entorhinal Cortex",
                "Geniculate Bodies",
                "Hippocampus",
                "Hypothalamus",
                "Limbic Lobe",
                "Limbic System",
                "Medulla Oblongata",
                "Mesencephalon",
                "Myelencephalon",
                "Neocortex",
                "Pituitary Gland",
                "Pons",
                "Pontine Tegmentum",
                "Posterior Hypothalamus",
                "Telencephalon",
                "Thalamus",
                "Third Ventricle"
            ],
            "TP": 10,
            "FP": 1,
            "FN": 0
        }
    }
]