[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "mitochondrion (Mito)",
            "nucleus (Nucl)",
            "endoplasmic reticulum (ER)",
            "lysosome",
            "Golgi apparatus",
            "centriole",
            "chloroplast",
            "peroxisome",
            "vacuole",
            "cytoskeleton",
            "cilia",
            "flagella",
            "ribosome",
            "nucleolus",
            "plastid",
            "microvilli",
            "myofibril",
            "microtubule organizing center (MTOC)",
            "lipid droplet",
            "sarcoplasmic reticulum",
            "melanosome",
            "lamellipodium",
            "phagosome"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "mitochondrion (Mito)",
                "nucleus (Nucl)",
                "endoplasmic reticulum (ER)",
                "lysosome",
                "Golgi apparatus",
                "centriole",
                "chloroplast",
                "peroxisome",
                "vacuole",
                "cytoskeleton",
                "cilia",
                "flagella",
                "ribosome",
                "nucleolus",
                "plastid",
                "microvilli",
                "myofibril",
                "microtubule organizing center (MTOC)",
                "lipid droplet",
                "sarcoplasmic reticulum",
                "melanosome",
                "lamellipodium",
                "phagosome"
            ],
            "mismatches": [],
            "true_referents": [
                "Golgi apparatus",
                "centriole",
                "chloroplast",
                "cilia",
                "cytoskeleton",
                "endoplasmic reticulum (ER)",
                "flagella",
                "lamellipodium",
                "lipid droplet",
                "lysosome",
                "melanosome",
                "microtubule organizing center (MTOC)",
                "microvilli",
                "mitochondrion (Mito)",
                "myofibril",
                "nucleolus",
                "nucleus (Nucl)",
                "peroxisome",
                "phagosome",
                "plastid",
                "ribosome",
                "sarcoplasmic reticulum",
                "vacuole"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (N)",
            "Mitochondrion (M)",
            "Ribosome (R)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosome (L)",
            "Peroxisome (P)",
            "Plasma Membrane (PM)",
            "Cytoskeleton (CS)",
            "Centrosome (C)",
            "Chloroplast (Ch)",
            "Vacuole (V)",
            "Nucleolus (Nu)",
            "Peroxisomal Membrane (PM)",
            "Cilia (Ci)",
            "Flagella (F)",
            "Microvilli (Mi)",
            "Smooth Endoplasmic Reticulum (SER)",
            "Rough Endoplasmic Reticulum (RER)",
            "Autophagosome (A)",
            "Exosome (Ex)",
            "Spliceosome (Sp)",
            "Peroxisomal Enzyme Complex (PEC)",
            "Synaptic Vesicle (SV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (N)",
                "Mitochondrion (M)",
                "Ribosome (R)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosome (L)",
                "Peroxisome (P)",
                "Plasma Membrane (PM)",
                "Cytoskeleton (CS)",
                "Centrosome (C)",
                "Chloroplast (Ch)",
                "Vacuole (V)",
                "Nucleolus (Nu)",
                "Peroxisomal Membrane (PM)",
                "Cilia (Ci)",
                "Flagella (F)",
                "Microvilli (Mi)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Rough Endoplasmic Reticulum (RER)",
                "Autophagosome (A)",
                "Exosome (Ex)",
                "Spliceosome (Sp)",
                "Peroxisomal Enzyme Complex (PEC)",
                "Synaptic Vesicle (SV)"
            ],
            "mismatches": [],
            "true_referents": [
                "Autophagosome (A)",
                "Centrosome (C)",
                "Chloroplast (Ch)",
                "Cilia (Ci)",
                "Cytoskeleton (CS)",
                "Endoplasmic Reticulum (ER)",
                "Exosome (Ex)",
                "Flagella (F)",
                "Golgi Apparatus (GA)",
                "Lysosome (L)",
                "Microvilli (Mi)",
                "Mitochondrion (M)",
                "Nucleolus (Nu)",
                "Nucleus (N)",
                "Peroxisomal Enzyme Complex (PEC)",
                "Peroxisomal Membrane (PM)",
                "Peroxisome (P)",
                "Plasma Membrane (PM)",
                "Ribosome (R)",
                "Rough Endoplasmic Reticulum (RER)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Spliceosome (Sp)",
                "Synaptic Vesicle (SV)",
                "Vacuole (V)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (NU)",
            "Mitochondrion (MT)",
            "Ribosome (RI)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosome (LY)",
            "Peroxisome",
            "Centrosome",
            "Cytoskeleton",
            "Vacuole",
            "Chloroplast (CP)",
            "Nucleolus",
            "Cytosol",
            "Cell Membrane",
            "Endosome",
            "Lipid Droplet",
            "Microtubule",
            "Microfilament",
            "Intermediate Filament",
            "Cytoplasmic Granule",
            "Plasma Membrane",
            "Nuclear Envelope",
            "Glyoxisome",
            "Spherosome"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (NU)",
                "Mitochondrion (MT)",
                "Ribosome (RI)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosome (LY)",
                "Peroxisome",
                "Centrosome",
                "Cytoskeleton",
                "Vacuole",
                "Chloroplast (CP)",
                "Nucleolus",
                "Cytosol",
                "Cell Membrane",
                "Endosome",
                "Lipid Droplet",
                "Microtubule",
                "Microfilament",
                "Intermediate Filament",
                "Cytoplasmic Granule",
                "Plasma Membrane",
                "Nuclear Envelope",
                "Glyoxisome",
                "Spherosome"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell Membrane",
                "Centrosome",
                "Chloroplast (CP)",
                "Cytoplasmic Granule",
                "Cytoskeleton",
                "Cytosol",
                "Endoplasmic Reticulum (ER)",
                "Endosome",
                "Glyoxisome",
                "Golgi Apparatus (GA)",
                "Intermediate Filament",
                "Lipid Droplet",
                "Lysosome (LY)",
                "Microfilament",
                "Microtubule",
                "Mitochondrion (MT)",
                "Nuclear Envelope",
                "Nucleolus",
                "Nucleus (NU)",
                "Peroxisome",
                "Plasma Membrane",
                "Ribosome (RI)",
                "Spherosome",
                "Vacuole"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (NUC)",
            "Mitochondrion (MIT)",
            "Ribosome (RIB)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosome (LYS)",
            "Peroxisome (PER)",
            "Centriole (CEN)",
            "Cytoskeleton (CYT)",
            "Cell Membrane (CM)",
            "Flagellum (FLA)",
            "Cilium (CLI)",
            "Vacuole (VAC)",
            "Chloroplast (CHP)",
            "Cell Wall (CW)",
            "Melanosome (MEL)",
            "Microvilli (MVI)",
            "Glyoxysome (GLY)",
            "Autophagosome (AUT)",
            "Stress Granule (SG)",
            "P-body (PB)",
            "Nuclear Pore Complex (NPC)",
            "Kinetochore (KIN)",
            "Spindle Pole Body (SPB)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (NUC)",
                "Mitochondrion (MIT)",
                "Ribosome (RIB)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosome (LYS)",
                "Peroxisome (PER)",
                "Centriole (CEN)",
                "Cytoskeleton (CYT)",
                "Cell Membrane (CM)",
                "Flagellum (FLA)",
                "Cilium (CLI)",
                "Vacuole (VAC)",
                "Chloroplast (CHP)",
                "Cell Wall (CW)",
                "Melanosome (MEL)",
                "Microvilli (MVI)",
                "Glyoxysome (GLY)",
                "Autophagosome (AUT)",
                "Stress Granule (SG)",
                "P-body (PB)",
                "Nuclear Pore Complex (NPC)",
                "Kinetochore (KIN)",
                "Spindle Pole Body (SPB)"
            ],
            "mismatches": [],
            "true_referents": [
                "Autophagosome (AUT)",
                "Cell Membrane (CM)",
                "Cell Wall (CW)",
                "Centriole (CEN)",
                "Chloroplast (CHP)",
                "Cilium (CLI)",
                "Cytoskeleton (CYT)",
                "Endoplasmic Reticulum (ER)",
                "Flagellum (FLA)",
                "Glyoxysome (GLY)",
                "Golgi Apparatus (GA)",
                "Kinetochore (KIN)",
                "Lysosome (LYS)",
                "Melanosome (MEL)",
                "Microvilli (MVI)",
                "Mitochondrion (MIT)",
                "Nuclear Pore Complex (NPC)",
                "Nucleus (NUC)",
                "P-body (PB)",
                "Peroxisome (PER)",
                "Ribosome (RIB)",
                "Spindle Pole Body (SPB)",
                "Stress Granule (SG)",
                "Vacuole (VAC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus",
            "Mitochondrion",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus",
            "Lysosome",
            "Peroxisome",
            "Ribosome",
            "Chloroplast",
            "Vacuole",
            "Cytoskeleton",
            "Centrosome",
            "Cilia",
            "Flagella",
            "Nucleolus",
            "Plasma Membrane",
            "Cell Wall",
            "Tonoplast",
            "Microtubule",
            "Microfilament",
            "Intermediate Filament",
            "Chromosome",
            "Nuclear Envelope",
            "Nuclear Pore",
            "Transport Vesicle"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus",
                "Mitochondrion",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus",
                "Lysosome",
                "Peroxisome",
                "Ribosome",
                "Chloroplast",
                "Vacuole",
                "Cytoskeleton",
                "Centrosome",
                "Cilia",
                "Flagella",
                "Nucleolus",
                "Plasma Membrane",
                "Cell Wall",
                "Tonoplast",
                "Microtubule",
                "Microfilament",
                "Intermediate Filament",
                "Chromosome",
                "Nuclear Envelope",
                "Nuclear Pore",
                "Transport Vesicle"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell Wall",
                "Centrosome",
                "Chloroplast",
                "Chromosome",
                "Cilia",
                "Cytoskeleton",
                "Endoplasmic Reticulum (ER)",
                "Flagella",
                "Golgi Apparatus",
                "Intermediate Filament",
                "Lysosome",
                "Microfilament",
                "Microtubule",
                "Mitochondrion",
                "Nuclear Envelope",
                "Nuclear Pore",
                "Nucleolus",
                "Nucleus",
                "Peroxisome",
                "Plasma Membrane",
                "Ribosome",
                "Tonoplast",
                "Transport Vesicle",
                "Vacuole"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (NCL)",
            "Mitochondrion (MIT)",
            "Chloroplast (CHL)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosome (LYS)",
            "Peroxisome (PER)",
            "Ribosome (RIB)",
            "Cytoskeleton (CYT)",
            "Vesicle (VES)",
            "Centrosome (CEN)",
            "Plasma Membrane (PM)",
            "Vacuole (VAC)",
            "Nucleolus (NUL)",
            "Cilia (CIL)",
            "Flagella (FLA)",
            "Cell Wall (CW)",
            "Chromatin (CHR)",
            "Secretory Granule (SG)",
            "Endosome (END)",
            "Smooth Endoplasmic Reticulum (SER)",
            "Rough Endoplasmic Reticulum (RER)",
            "Microtubule (MT)",
            "Microfilament (MF)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (NCL)",
                "Mitochondrion (MIT)",
                "Chloroplast (CHL)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosome (LYS)",
                "Peroxisome (PER)",
                "Ribosome (RIB)",
                "Cytoskeleton (CYT)",
                "Vesicle (VES)",
                "Centrosome (CEN)",
                "Plasma Membrane (PM)",
                "Vacuole (VAC)",
                "Nucleolus (NUL)",
                "Cilia (CIL)",
                "Flagella (FLA)",
                "Cell Wall (CW)",
                "Chromatin (CHR)",
                "Secretory Granule (SG)",
                "Endosome (END)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Rough Endoplasmic Reticulum (RER)",
                "Microtubule (MT)",
                "Microfilament (MF)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell Wall (CW)",
                "Centrosome (CEN)",
                "Chloroplast (CHL)",
                "Chromatin (CHR)",
                "Cilia (CIL)",
                "Cytoskeleton (CYT)",
                "Endoplasmic Reticulum (ER)",
                "Endosome (END)",
                "Flagella (FLA)",
                "Golgi Apparatus (GA)",
                "Lysosome (LYS)",
                "Microfilament (MF)",
                "Microtubule (MT)",
                "Mitochondrion (MIT)",
                "Nucleolus (NUL)",
                "Nucleus (NCL)",
                "Peroxisome (PER)",
                "Plasma Membrane (PM)",
                "Ribosome (RIB)",
                "Rough Endoplasmic Reticulum (RER)",
                "Secretory Granule (SG)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Vacuole (VAC)",
                "Vesicle (VES)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (N)",
            "Mitochondria (M)",
            "Ribosomes (R)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosomes (L)",
            "Peroxisomes (P)",
            "Centrosomes (C)",
            "Cytoskeleton (CS)",
            "Nucleolus (NL)",
            "Chromosomes (CHR)",
            "Chloroplasts (CHL)",
            "Vacuoles (V)",
            "Cell Wall (CW)",
            "Cell Membrane (CM)",
            "Cilia (CI)",
            "Flagella (F)",
            "Plastids (PL)",
            "Microtubules (MT)",
            "Microfilaments (MF)",
            "Intermediate Filaments (IF)",
            "Nuclear Envelope (NE)",
            "Nuclear Pores (NP)",
            "Vesicles (VE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (N)",
                "Mitochondria (M)",
                "Ribosomes (R)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosomes (L)",
                "Peroxisomes (P)",
                "Centrosomes (C)",
                "Cytoskeleton (CS)",
                "Nucleolus (NL)",
                "Chromosomes (CHR)",
                "Chloroplasts (CHL)",
                "Vacuoles (V)",
                "Cell Wall (CW)",
                "Cell Membrane (CM)",
                "Cilia (CI)",
                "Flagella (F)",
                "Plastids (PL)",
                "Microtubules (MT)",
                "Microfilaments (MF)",
                "Intermediate Filaments (IF)",
                "Nuclear Envelope (NE)",
                "Nuclear Pores (NP)",
                "Vesicles (VE)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell Membrane (CM)",
                "Cell Wall (CW)",
                "Centrosomes (C)",
                "Chloroplasts (CHL)",
                "Chromosomes (CHR)",
                "Cilia (CI)",
                "Cytoskeleton (CS)",
                "Endoplasmic Reticulum (ER)",
                "Flagella (F)",
                "Golgi Apparatus (GA)",
                "Intermediate Filaments (IF)",
                "Lysosomes (L)",
                "Microfilaments (MF)",
                "Microtubules (MT)",
                "Mitochondria (M)",
                "Nuclear Envelope (NE)",
                "Nuclear Pores (NP)",
                "Nucleolus (NL)",
                "Nucleus (N)",
                "Peroxisomes (P)",
                "Plastids (PL)",
                "Ribosomes (R)",
                "Vacuoles (V)",
                "Vesicles (VE)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus",
            "Mitochondria",
            "Chloroplast",
            "Endoplasmic reticulum",
            "Golgi apparatus",
            "Lysosome",
            "Vacuole",
            "Ribosome",
            "Cytoskeleton",
            "Cell membrane",
            "Cell wall",
            "Centriole",
            "Peroxisome",
            "Flagellum",
            "Cilia",
            "Microvilli",
            "Nucleolus",
            "Nuclear envelope",
            "Nuclear pore",
            "Nuclear lamina",
            "Nuclear matrix",
            "Nuclear speckles",
            "Nuclear bodies",
            "Nucleoplasm"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus",
                "Mitochondria",
                "Chloroplast",
                "Endoplasmic reticulum",
                "Golgi apparatus",
                "Lysosome",
                "Vacuole",
                "Ribosome",
                "Cytoskeleton",
                "Cell membrane",
                "Cell wall",
                "Centriole",
                "Peroxisome",
                "Flagellum",
                "Cilia",
                "Microvilli",
                "Nucleolus",
                "Nuclear envelope",
                "Nuclear pore",
                "Nuclear lamina",
                "Nuclear matrix",
                "Nuclear speckles",
                "Nuclear bodies",
                "Nucleoplasm"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell membrane",
                "Cell wall",
                "Centriole",
                "Chloroplast",
                "Cilia",
                "Cytoskeleton",
                "Endoplasmic reticulum",
                "Flagellum",
                "Golgi apparatus",
                "Lysosome",
                "Microvilli",
                "Mitochondria",
                "Nuclear bodies",
                "Nuclear envelope",
                "Nuclear lamina",
                "Nuclear matrix",
                "Nuclear pore",
                "Nuclear speckles",
                "Nucleolus",
                "Nucleoplasm",
                "Nucleus",
                "Peroxisome",
                "Ribosome",
                "Vacuole"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (N)",
            "Mitochondrion (M)",
            "Rough Endoplasmic Reticulum (RER)",
            "Smooth Endoplasmic Reticulum (SER)",
            "Golgi Apparatus (GA)",
            "Lysosome (Ly)",
            "Peroxisome (Px)",
            "Ribosome (Rib)",
            "Cytoskeleton (CSK)",
            "Centrosome (CEN)",
            "Vacuole (Vac)",
            "Chloroplast (Chl)",
            "Plasma Membrane (PM)",
            "Cilia (cil)",
            "Flagella (flg)",
            "Vesicle (Ves)",
            "Microtubule (MT)",
            "Actin Filament (AF)",
            "Intermediate Filament (IF)",
            "Nuclear Pore Complex (NPC)",
            "Nucleolus (Nu)",
            "Mitochondrial Matrix (MM)",
            "Lipid Droplet (LD)",
            "Nuclear Envelope (NE)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (N)",
                "Mitochondrion (M)",
                "Rough Endoplasmic Reticulum (RER)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Golgi Apparatus (GA)",
                "Lysosome (Ly)",
                "Peroxisome (Px)",
                "Ribosome (Rib)",
                "Cytoskeleton (CSK)",
                "Centrosome (CEN)",
                "Vacuole (Vac)",
                "Chloroplast (Chl)",
                "Plasma Membrane (PM)",
                "Cilia (cil)",
                "Flagella (flg)",
                "Vesicle (Ves)",
                "Microtubule (MT)",
                "Actin Filament (AF)",
                "Intermediate Filament (IF)",
                "Nuclear Pore Complex (NPC)",
                "Nucleolus (Nu)",
                "Mitochondrial Matrix (MM)",
                "Lipid Droplet (LD)",
                "Nuclear Envelope (NE)"
            ],
            "mismatches": [],
            "true_referents": [
                "Actin Filament (AF)",
                "Centrosome (CEN)",
                "Chloroplast (Chl)",
                "Cilia (cil)",
                "Cytoskeleton (CSK)",
                "Flagella (flg)",
                "Golgi Apparatus (GA)",
                "Intermediate Filament (IF)",
                "Lipid Droplet (LD)",
                "Lysosome (Ly)",
                "Microtubule (MT)",
                "Mitochondrial Matrix (MM)",
                "Mitochondrion (M)",
                "Nuclear Envelope (NE)",
                "Nuclear Pore Complex (NPC)",
                "Nucleolus (Nu)",
                "Nucleus (N)",
                "Peroxisome (Px)",
                "Plasma Membrane (PM)",
                "Ribosome (Rib)",
                "Rough Endoplasmic Reticulum (RER)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Vacuole (Vac)",
                "Vesicle (Ves)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (N)",
            "Mitochondrion (M)",
            "Endoplasmic reticulum (ER)",
            "Golgi apparatus (GA)",
            "Lysosome (L)",
            "Peroxisome (P)",
            "Chloroplast (C)",
            "Vacuole (V)",
            "Centriole (Ce)",
            "Ribosome (R)",
            "Nucleolus (Nu)",
            "Plasma membrane (PM)",
            "Cytoskeleton (CS)",
            "Flagellum (F)",
            "Cilium (Ci)",
            "Nuclear envelope (NE)",
            "Chromatin (Ch)",
            "Microtubule (MT)",
            "Microfilament (MF)",
            "Intermediate filament (IF)",
            "Vesicle (Ve)",
            "Nuclear pore complex (NPC)",
            "Desmosome (D)",
            "Gap junction (GJ)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (N)",
                "Mitochondrion (M)",
                "Endoplasmic reticulum (ER)",
                "Golgi apparatus (GA)",
                "Lysosome (L)",
                "Peroxisome (P)",
                "Chloroplast (C)",
                "Vacuole (V)",
                "Centriole (Ce)",
                "Ribosome (R)",
                "Nucleolus (Nu)",
                "Plasma membrane (PM)",
                "Cytoskeleton (CS)",
                "Flagellum (F)",
                "Cilium (Ci)",
                "Nuclear envelope (NE)",
                "Chromatin (Ch)",
                "Microtubule (MT)",
                "Microfilament (MF)",
                "Intermediate filament (IF)",
                "Vesicle (Ve)",
                "Nuclear pore complex (NPC)",
                "Desmosome (D)",
                "Gap junction (GJ)"
            ],
            "mismatches": [],
            "true_referents": [
                "Centriole (Ce)",
                "Chloroplast (C)",
                "Chromatin (Ch)",
                "Cilium (Ci)",
                "Cytoskeleton (CS)",
                "Desmosome (D)",
                "Endoplasmic reticulum (ER)",
                "Flagellum (F)",
                "Gap junction (GJ)",
                "Golgi apparatus (GA)",
                "Intermediate filament (IF)",
                "Lysosome (L)",
                "Microfilament (MF)",
                "Microtubule (MT)",
                "Mitochondrion (M)",
                "Nuclear envelope (NE)",
                "Nuclear pore complex (NPC)",
                "Nucleolus (Nu)",
                "Nucleus (N)",
                "Peroxisome (P)",
                "Plasma membrane (PM)",
                "Ribosome (R)",
                "Vacuole (V)",
                "Vesicle (Ve)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (Nu)",
            "Mitochondrion (Mt)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosome (Ly)",
            "Peroxisome (Px)",
            "Ribosome (Rb)",
            "Centrosome (Cs)",
            "Chloroplast (Cp)",
            "Vacuole (Vc)",
            "Cytoskeleton (Ck)",
            "Plasma Membrane (PM)",
            "Nucleolus (No)",
            "Smooth Endoplasmic Reticulum (SER)",
            "Rough Endoplasmic Reticulum (RER)",
            "Centriole (Ct)",
            "Autophagosome (Ap)",
            "Proteasome (Pt)",
            "Microfilament (Mf)",
            "Intermediate Filament (IF)",
            "Microtubule (Mt)",
            "Flagellum (Fl)",
            "Cilium (Ci)",
            "Glycosome (Gl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (Nu)",
                "Mitochondrion (Mt)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosome (Ly)",
                "Peroxisome (Px)",
                "Ribosome (Rb)",
                "Centrosome (Cs)",
                "Chloroplast (Cp)",
                "Vacuole (Vc)",
                "Cytoskeleton (Ck)",
                "Plasma Membrane (PM)",
                "Nucleolus (No)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Rough Endoplasmic Reticulum (RER)",
                "Centriole (Ct)",
                "Autophagosome (Ap)",
                "Proteasome (Pt)",
                "Microfilament (Mf)",
                "Intermediate Filament (IF)",
                "Microtubule (Mt)",
                "Flagellum (Fl)",
                "Cilium (Ci)",
                "Glycosome (Gl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Autophagosome (Ap)",
                "Centriole (Ct)",
                "Centrosome (Cs)",
                "Chloroplast (Cp)",
                "Cilium (Ci)",
                "Cytoskeleton (Ck)",
                "Endoplasmic Reticulum (ER)",
                "Flagellum (Fl)",
                "Glycosome (Gl)",
                "Golgi Apparatus (GA)",
                "Intermediate Filament (IF)",
                "Lysosome (Ly)",
                "Microfilament (Mf)",
                "Microtubule (Mt)",
                "Mitochondrion (Mt)",
                "Nucleolus (No)",
                "Nucleus (Nu)",
                "Peroxisome (Px)",
                "Plasma Membrane (PM)",
                "Proteasome (Pt)",
                "Ribosome (Rb)",
                "Rough Endoplasmic Reticulum (RER)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Vacuole (Vc)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Nucleus (nu)",
            "Mitochondrion (mt)",
            "Endoplasmic reticulum (ER)",
            "Golgi apparatus (GA)",
            "Lysosome (ly)",
            "Peroxisome (po)",
            "Ribosome (rb)",
            "Cytoskeleton (cy)",
            "Vacuole (va)",
            "Chloroplast (cp)",
            "Glyoxysome (gx)",
            "Centriole (ce)",
            "Cilium (ci)",
            "Flagellum (fl)",
            "Cell membrane (cm)",
            "Cell wall (cw)",
            "Nucleolus (nl)",
            "Rough endoplasmic reticulum (RER)",
            "Smooth endoplasmic reticulum (SER)",
            "Cis Golgi network (CGN)",
            "Trans Golgi network (TGN)",
            "Microbody (mb)",
            "Microsome (ms)",
            "Thylakoid (th)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Nucleus (nu)",
                "Mitochondrion (mt)",
                "Endoplasmic reticulum (ER)",
                "Golgi apparatus (GA)",
                "Lysosome (ly)",
                "Peroxisome (po)",
                "Ribosome (rb)",
                "Cytoskeleton (cy)",
                "Vacuole (va)",
                "Chloroplast (cp)",
                "Glyoxysome (gx)",
                "Centriole (ce)",
                "Cilium (ci)",
                "Flagellum (fl)",
                "Cell membrane (cm)",
                "Cell wall (cw)",
                "Nucleolus (nl)",
                "Rough endoplasmic reticulum (RER)",
                "Smooth endoplasmic reticulum (SER)",
                "Cis Golgi network (CGN)",
                "Trans Golgi network (TGN)",
                "Microbody (mb)",
                "Microsome (ms)",
                "Thylakoid (th)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell membrane (cm)",
                "Cell wall (cw)",
                "Centriole (ce)",
                "Chloroplast (cp)",
                "Cilium (ci)",
                "Cis Golgi network (CGN)",
                "Cytoskeleton (cy)",
                "Endoplasmic reticulum (ER)",
                "Flagellum (fl)",
                "Glyoxysome (gx)",
                "Golgi apparatus (GA)",
                "Lysosome (ly)",
                "Microbody (mb)",
                "Microsome (ms)",
                "Mitochondrion (mt)",
                "Nucleolus (nl)",
                "Nucleus (nu)",
                "Peroxisome (po)",
                "Ribosome (rb)",
                "Rough endoplasmic reticulum (RER)",
                "Smooth endoplasmic reticulum (SER)",
                "Thylakoid (th)",
                "Trans Golgi network (TGN)",
                "Vacuole (va)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Mitochondrion (MT)",
            "Chloroplast (CP)",
            "Nucleus (NC)",
            "Endoplasmic Reticulum (ER)",
            "Golgi Apparatus (GA)",
            "Lysosome (LY)",
            "Peroxisome (PX)",
            "Ribosome (RB)",
            "Centrosome (CN)",
            "Centriole (CE)",
            "Flagellum (FL)",
            "Cilium (CI)",
            "Vacuole (VC)",
            "Contractile Vacuole (CV)",
            "Microtubule (MT)",
            "Microfilament (MF)",
            "Intermediate Filament (IF)",
            "Cell Membrane (CM)",
            "Nuclear Envelope (NE)",
            "Nuclear Pore Complex (NPC)",
            "Nucleolus (NL)",
            "Rough Endoplasmic Reticulum (RER)",
            "Smooth Endoplasmic Reticulum (SER)",
            "Synaptic Vesicle (SV)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Mitochondrion (MT)",
                "Chloroplast (CP)",
                "Nucleus (NC)",
                "Endoplasmic Reticulum (ER)",
                "Golgi Apparatus (GA)",
                "Lysosome (LY)",
                "Peroxisome (PX)",
                "Ribosome (RB)",
                "Centrosome (CN)",
                "Centriole (CE)",
                "Flagellum (FL)",
                "Cilium (CI)",
                "Vacuole (VC)",
                "Contractile Vacuole (CV)",
                "Microtubule (MT)",
                "Microfilament (MF)",
                "Intermediate Filament (IF)",
                "Cell Membrane (CM)",
                "Nuclear Envelope (NE)",
                "Nuclear Pore Complex (NPC)",
                "Nucleolus (NL)",
                "Rough Endoplasmic Reticulum (RER)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Synaptic Vesicle (SV)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cell Membrane (CM)",
                "Centriole (CE)",
                "Centrosome (CN)",
                "Chloroplast (CP)",
                "Cilium (CI)",
                "Contractile Vacuole (CV)",
                "Endoplasmic Reticulum (ER)",
                "Flagellum (FL)",
                "Golgi Apparatus (GA)",
                "Intermediate Filament (IF)",
                "Lysosome (LY)",
                "Microfilament (MF)",
                "Microtubule (MT)",
                "Mitochondrion (MT)",
                "Nuclear Envelope (NE)",
                "Nuclear Pore Complex (NPC)",
                "Nucleolus (NL)",
                "Nucleus (NC)",
                "Peroxisome (PX)",
                "Ribosome (RB)",
                "Rough Endoplasmic Reticulum (RER)",
                "Smooth Endoplasmic Reticulum (SER)",
                "Synaptic Vesicle (SV)",
                "Vacuole (VC)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Mitochondrion (Mit)",
            "Centriole",
            "Golgi apparatus",
            "Lysosome",
            "Endoplasmic reticulum (ER)",
            "Ribosome",
            "Peroxisome",
            "Cytoskeleton",
            "Nucleolus",
            "Nucleus",
            "Cilia",
            "Flagellum",
            "Microtubule",
            "Microfilament",
            "Intermediate filament",
            "Centrosome",
            "Mitochondrial DNA",
            "Chloroplast",
            "Plastid",
            "Vacuole",
            "Chromatin",
            "Chromatid",
            "Telomere",
            "Centromere",
            "Kinetochores"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Mitochondrion (Mit)",
                "Centriole",
                "Golgi apparatus",
                "Lysosome",
                "Endoplasmic reticulum (ER)",
                "Ribosome",
                "Peroxisome",
                "Cytoskeleton",
                "Nucleolus",
                "Nucleus",
                "Cilia",
                "Flagellum",
                "Microtubule",
                "Microfilament",
                "Intermediate filament",
                "Centrosome",
                "Mitochondrial DNA",
                "Chloroplast",
                "Plastid",
                "Vacuole",
                "Chromatin",
                "Chromatid",
                "Telomere",
                "Centromere"
            ],
            "mismatches": [
                "Kinetochores"
            ],
            "true_referents": [
                "Centriole",
                "Centromere",
                "Centrosome",
                "Chloroplast",
                "Chromatid",
                "Chromatin",
                "Cilia",
                "Cytoskeleton",
                "Endoplasmic reticulum (ER)",
                "Flagellum",
                "Golgi apparatus",
                "Intermediate filament",
                "Lysosome",
                "Microfilament",
                "Microtubule",
                "Mitochondrial DNA",
                "Mitochondrion (Mit)",
                "Nucleolus",
                "Nucleus",
                "Peroxisome",
                "Plastid",
                "Ribosome",
                "Telomere",
                "Vacuole"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            "Mitochondria (mt)",
            "Golgi apparatus (GA)",
            "Lysosome (Ly)",
            "Endoplasmic reticulum (ER)",
            "Ribosome (Rb)",
            "Cytoskeleton (CS)",
            "Nucleus (N)",
            "Centriole (Cn)",
            "Peroxisome (Px)",
            "Cilium (Cm)",
            "Flagellum (Fl)",
            "Centromere (Cm)",
            "Chloroplast (Chl)",
            "Vacuole (V)",
            "Glyoxysome (Gx)",
            "Autophagosome (Ap)",
            "Phagosome (Ps)",
            "Acrosome (Acs)",
            "Melanosome (Ml)",
            "Weibel-Palade body (WP)",
            "Punctum adhaerens (PA)",
            "Focal adhesion (FA)",
            "Tight junction (TJ)",
            "Adherens junction (AJ)",
            "Gap junction (Gj)",
            "Desmosome (Dm)",
            "Hemidesmosome (Hd)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Mitochondria (mt)",
                "Golgi apparatus (GA)",
                "Lysosome (Ly)",
                "Endoplasmic reticulum (ER)",
                "Ribosome (Rb)",
                "Cytoskeleton (CS)",
                "Nucleus (N)",
                "Centriole (Cn)",
                "Peroxisome (Px)",
                "Cilium (Cm)",
                "Flagellum (Fl)",
                "Centromere (Cm)",
                "Chloroplast (Chl)",
                "Vacuole (V)",
                "Glyoxysome (Gx)",
                "Autophagosome (Ap)",
                "Phagosome (Ps)",
                "Acrosome (Acs)",
                "Melanosome (Ml)",
                "Weibel-Palade body (WP)",
                "Punctum adhaerens (PA)",
                "Focal adhesion (FA)",
                "Tight junction (TJ)",
                "Adherens junction (AJ)"
            ],
            "mismatches": [
                "Gap junction (Gj)",
                "Desmosome (Dm)",
                "Hemidesmosome (Hd)"
            ],
            "true_referents": [
                "Acrosome (Acs)",
                "Adherens junction (AJ)",
                "Autophagosome (Ap)",
                "Centriole (Cn)",
                "Centromere (Cm)",
                "Chloroplast (Chl)",
                "Cilium (Cm)",
                "Cytoskeleton (CS)",
                "Endoplasmic reticulum (ER)",
                "Flagellum (Fl)",
                "Focal adhesion (FA)",
                "Glyoxysome (Gx)",
                "Golgi apparatus (GA)",
                "Lysosome (Ly)",
                "Melanosome (Ml)",
                "Mitochondria (mt)",
                "Nucleus (N)",
                "Peroxisome (Px)",
                "Phagosome (Ps)",
                "Punctum adhaerens (PA)",
                "Ribosome (Rb)",
                "Tight junction (TJ)",
                "Vacuole (V)",
                "Weibel-Palade body (WP)"
            ],
            "TP": 24,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "organelle",
        "domain": "biology",
        "response": [
            {
                "Referent": "cell membrane",
                "Canonical Name": "cell membrane"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            },
            {
                "Referent": "cell wall",
                "Canonical Name": "cell wall"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cell membrane",
                "cell wall"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"cell membrane\", \"Canonical Name\": \"cell membrane\"}",
                "{\"Referent\": \"cell wall\", \"Canonical Name\": \"cell wall\"}"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    }
]