[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Huntington's disease (HD)",
            "Tay-Sachs disease (TSD)",
            "Cystic fibrosis (CF)",
            "Sickle cell anemia",
            "Hemochromatosis (HHC)",
            "Duchenne muscular dystrophy (DMD)",
            "Thalassemia",
            "Familial hypercholesterolemia (FH)",
            "Marfan syndrome",
            "Hemophilia A",
            "Hereditary nonpolyposis colorectal cancer (HNPCC)",
            "Fragile X syndrome",
            "Gaucher disease",
            "Lactose intolerance",
            "Hypertrophic cardiomyopathy (HCM)",
            "Neurofibromatosis type 1 (NF1)",
            "Polycystic kidney disease (PKD)",
            "Hereditary breast and ovarian cancer syndrome (HBOC)",
            "Ataxia telangiectasia (A-T)",
            "Adrenoleukodystrophy (ALD)",
            "Retinitis pigmentosa (RP)",
            "Long QT syndrome (LQTS)",
            "Fabry disease",
            "Alzheimer's disease (early-onset form)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Huntington's disease (HD)",
                "Tay-Sachs disease (TSD)",
                "Cystic fibrosis (CF)",
                "Sickle cell anemia",
                "Hemochromatosis (HHC)",
                "Duchenne muscular dystrophy (DMD)",
                "Thalassemia",
                "Familial hypercholesterolemia (FH)",
                "Marfan syndrome",
                "Hemophilia A",
                "Hereditary nonpolyposis colorectal cancer (HNPCC)",
                "Fragile X syndrome",
                "Gaucher disease",
                "Lactose intolerance",
                "Hypertrophic cardiomyopathy (HCM)",
                "Neurofibromatosis type 1 (NF1)",
                "Polycystic kidney disease (PKD)",
                "Hereditary breast and ovarian cancer syndrome (HBOC)",
                "Ataxia telangiectasia (A-T)",
                "Adrenoleukodystrophy (ALD)",
                "Retinitis pigmentosa (RP)",
                "Long QT syndrome (LQTS)",
                "Fabry disease",
                "Alzheimer's disease (early-onset form)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenoleukodystrophy (ALD)",
                "Alzheimer's disease (early-onset form)",
                "Ataxia telangiectasia (A-T)",
                "Cystic fibrosis (CF)",
                "Duchenne muscular dystrophy (DMD)",
                "Fabry disease",
                "Familial hypercholesterolemia (FH)",
                "Fragile X syndrome",
                "Gaucher disease",
                "Hemochromatosis (HHC)",
                "Hemophilia A",
                "Hereditary breast and ovarian cancer syndrome (HBOC)",
                "Hereditary nonpolyposis colorectal cancer (HNPCC)",
                "Huntington's disease (HD)",
                "Hypertrophic cardiomyopathy (HCM)",
                "Lactose intolerance",
                "Long QT syndrome (LQTS)",
                "Marfan syndrome",
                "Neurofibromatosis type 1 (NF1)",
                "Polycystic kidney disease (PKD)",
                "Retinitis pigmentosa (RP)",
                "Sickle cell anemia",
                "Tay-Sachs disease (TSD)",
                "Thalassemia"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CFTR gene mutation)",
            "Sickle Cell Disease (HBB gene mutation)",
            "Huntington's Disease (HTT gene mutation)",
            "Duchenne Muscular Dystrophy (DMD gene mutation)",
            "Fragile X Syndrome (FMR1 gene mutation)",
            "Tay-Sachs Disease (HEXA gene mutation)",
            "Tuberous Sclerosis (TSC1 or TSC2 gene mutation)",
            "Marfan Syndrome (FBN1 gene mutation)",
            "Hemophilia A (F8 gene mutation)",
            "Hemophilia B (F9 gene mutation)",
            "Phenylketonuria (PAH gene mutation)",
            "Wilson's Disease (ATP7B gene mutation)",
            "Osteogenesis Imperfecta (COL1A1 or COL1A2 gene mutation)",
            "Familial Hypercholesterolemia (LDLR gene mutation)",
            "Neurofibromatosis Type 1 (NF1 gene mutation)",
            "Neurofibromatosis Type 2 (NF2 gene mutation)",
            "Alport Syndrome (COL4A3, COL4A4, or COL4A5 gene mutation)",
            "Retinitis Pigmentosa (various gene mutations)",
            "Charcot-Marie-Tooth Disease (various gene mutations)",
            "Carpal Tunnel Syndrome (SCN9A gene mutation)",
            "Familial Hyperinsulinemic Hypoglycemia (ABCC8 or KCNJ11 gene mutation)",
            "Adrenoleukodystrophy (ABCD1 gene mutation)",
            "Bardet-Biedl Syndrome (various gene mutations)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CFTR gene mutation)",
                "Sickle Cell Disease (HBB gene mutation)",
                "Huntington's Disease (HTT gene mutation)",
                "Duchenne Muscular Dystrophy (DMD gene mutation)",
                "Fragile X Syndrome (FMR1 gene mutation)",
                "Tay-Sachs Disease (HEXA gene mutation)",
                "Tuberous Sclerosis (TSC1 or TSC2 gene mutation)",
                "Marfan Syndrome (FBN1 gene mutation)",
                "Hemophilia A (F8 gene mutation)",
                "Hemophilia B (F9 gene mutation)",
                "Phenylketonuria (PAH gene mutation)",
                "Wilson's Disease (ATP7B gene mutation)",
                "Osteogenesis Imperfecta (COL1A1 or COL1A2 gene mutation)",
                "Familial Hypercholesterolemia (LDLR gene mutation)",
                "Neurofibromatosis Type 1 (NF1 gene mutation)",
                "Neurofibromatosis Type 2 (NF2 gene mutation)",
                "Alport Syndrome (COL4A3, COL4A4, or COL4A5 gene mutation)",
                "Retinitis Pigmentosa (various gene mutations)",
                "Charcot-Marie-Tooth Disease (various gene mutations)",
                "Carpal Tunnel Syndrome (SCN9A gene mutation)",
                "Familial Hyperinsulinemic Hypoglycemia (ABCC8 or KCNJ11 gene mutation)",
                "Adrenoleukodystrophy (ABCD1 gene mutation)",
                "Bardet-Biedl Syndrome (various gene mutations)"
            ],
            "mismatches": [],
            "true_referents": [
                "Adrenoleukodystrophy (ABCD1 gene mutation)",
                "Alport Syndrome (COL4A3, COL4A4, or COL4A5 gene mutation)",
                "Bardet-Biedl Syndrome (various gene mutations)",
                "Carpal Tunnel Syndrome (SCN9A gene mutation)",
                "Charcot-Marie-Tooth Disease (various gene mutations)",
                "Cystic Fibrosis (CFTR gene mutation)",
                "Duchenne Muscular Dystrophy (DMD gene mutation)",
                "Familial Hypercholesterolemia (LDLR gene mutation)",
                "Familial Hyperinsulinemic Hypoglycemia (ABCC8 or KCNJ11 gene mutation)",
                "Fragile X Syndrome (FMR1 gene mutation)",
                "Hemophilia A (F8 gene mutation)",
                "Hemophilia B (F9 gene mutation)",
                "Huntington's Disease (HTT gene mutation)",
                "Marfan Syndrome (FBN1 gene mutation)",
                "Neurofibromatosis Type 1 (NF1 gene mutation)",
                "Neurofibromatosis Type 2 (NF2 gene mutation)",
                "Osteogenesis Imperfecta (COL1A1 or COL1A2 gene mutation)",
                "Phenylketonuria (PAH gene mutation)",
                "Retinitis Pigmentosa (various gene mutations)",
                "Sickle Cell Disease (HBB gene mutation)",
                "Tay-Sachs Disease (HEXA gene mutation)",
                "Tuberous Sclerosis (TSC1 or TSC2 gene mutation)",
                "Wilson's Disease (ATP7B gene mutation)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Sickle Cell Anemia (SCA)",
            "Huntington's Disease (HD)",
            "Tay-Sachs Disease",
            "Phenylketonuria (PKU)",
            "Duchenne Muscular Dystrophy (DMD)",
            "Fragile X Syndrome (FXS)",
            "Marfan Syndrome",
            "Neurofibromatosis Type 1 (NF1)",
            "Neurofibromatosis Type 2 (NF2)",
            "Hemophilia A",
            "Hemophilia B",
            "Von Willebrand Disease",
            "Familial Hypercholesterolemia (FH)",
            "Polycystic Kidney Disease (PKD)",
            "Hereditary Spherocytosis (HS)",
            "Gaucher Disease",
            "Fabry Disease",
            "Krabbe Disease",
            "Metachromatic Leukodystrophy",
            "Niemann-Pick Disease",
            "Wilson's Disease",
            "Tuberous Sclerosis Complex (TSC)",
            "Alpha-1 Antitrypsin Deficiency (A1AD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Sickle Cell Anemia (SCA)",
                "Huntington's Disease (HD)",
                "Tay-Sachs Disease",
                "Phenylketonuria (PKU)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Fragile X Syndrome (FXS)",
                "Marfan Syndrome",
                "Neurofibromatosis Type 1 (NF1)",
                "Neurofibromatosis Type 2 (NF2)",
                "Hemophilia A",
                "Hemophilia B",
                "Von Willebrand Disease",
                "Familial Hypercholesterolemia (FH)",
                "Polycystic Kidney Disease (PKD)",
                "Hereditary Spherocytosis (HS)",
                "Gaucher Disease",
                "Fabry Disease",
                "Krabbe Disease",
                "Metachromatic Leukodystrophy",
                "Niemann-Pick Disease",
                "Wilson's Disease",
                "Tuberous Sclerosis Complex (TSC)",
                "Alpha-1 Antitrypsin Deficiency (A1AD)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alpha-1 Antitrypsin Deficiency (A1AD)",
                "Cystic Fibrosis (CF)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Fabry Disease",
                "Familial Hypercholesterolemia (FH)",
                "Fragile X Syndrome (FXS)",
                "Gaucher Disease",
                "Hemophilia A",
                "Hemophilia B",
                "Hereditary Spherocytosis (HS)",
                "Huntington's Disease (HD)",
                "Krabbe Disease",
                "Marfan Syndrome",
                "Metachromatic Leukodystrophy",
                "Neurofibromatosis Type 1 (NF1)",
                "Neurofibromatosis Type 2 (NF2)",
                "Niemann-Pick Disease",
                "Phenylketonuria (PKU)",
                "Polycystic Kidney Disease (PKD)",
                "Sickle Cell Anemia (SCA)",
                "Tay-Sachs Disease",
                "Tuberous Sclerosis Complex (TSC)",
                "Von Willebrand Disease",
                "Wilson's Disease"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Sickle Cell Anemia (SCA)",
            "Phenylketonuria (PKU)",
            "Tay-Sachs Disease (TSD)",
            "Huntington's Disease (HD)",
            "Familial Hypercholesterolemia (FH)",
            "Alpha-1 Antitrypsin Deficiency (AATD)",
            "Galactosemia (GAL)",
            "Maple Syrup Urine Disease (MSUD)",
            "Hereditary Hemochromatosis (HHC)",
            "Wilson's Disease (WD)",
            "Gaucher Disease (GD)",
            "Niemann-Pick Disease Type C (NPC)",
            "Bloom Syndrome (BS)",
            "Fanconi Anemia (FA)",
            "Ataxia-Telangiectasia (AT)",
            "Retinitis Pigmentosa (RP) - certain subtypes",
            "Neurofibromatosis Type 1 (NF1)",
            "Marfan Syndrome (MFS)",
            "Ehlers-Danlos Syndrome - certain subtypes (EDS)",
            "Polycystic Kidney Disease - Autosomal Dominant (ADPKD)",
            "Hereditary Spherocytosis (HS)",
            "Glucose-6-Phosphate Dehydrogenase Deficiency (G6PD)",
            "Alpha Thalassemia (\u03b1-Thal)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Sickle Cell Anemia (SCA)",
                "Phenylketonuria (PKU)",
                "Tay-Sachs Disease (TSD)",
                "Huntington's Disease (HD)",
                "Familial Hypercholesterolemia (FH)",
                "Alpha-1 Antitrypsin Deficiency (AATD)",
                "Galactosemia (GAL)",
                "Maple Syrup Urine Disease (MSUD)",
                "Hereditary Hemochromatosis (HHC)",
                "Wilson's Disease (WD)",
                "Gaucher Disease (GD)",
                "Niemann-Pick Disease Type C (NPC)",
                "Bloom Syndrome (BS)",
                "Fanconi Anemia (FA)",
                "Ataxia-Telangiectasia (AT)",
                "Retinitis Pigmentosa (RP) - certain subtypes",
                "Neurofibromatosis Type 1 (NF1)",
                "Marfan Syndrome (MFS)",
                "Ehlers-Danlos Syndrome - certain subtypes (EDS)",
                "Polycystic Kidney Disease - Autosomal Dominant (ADPKD)",
                "Hereditary Spherocytosis (HS)",
                "Glucose-6-Phosphate Dehydrogenase Deficiency (G6PD)",
                "Alpha Thalassemia (\u03b1-Thal)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alpha Thalassemia (\u03b1-Thal)",
                "Alpha-1 Antitrypsin Deficiency (AATD)",
                "Ataxia-Telangiectasia (AT)",
                "Bloom Syndrome (BS)",
                "Cystic Fibrosis (CF)",
                "Ehlers-Danlos Syndrome - certain subtypes (EDS)",
                "Familial Hypercholesterolemia (FH)",
                "Fanconi Anemia (FA)",
                "Galactosemia (GAL)",
                "Gaucher Disease (GD)",
                "Glucose-6-Phosphate Dehydrogenase Deficiency (G6PD)",
                "Hereditary Hemochromatosis (HHC)",
                "Hereditary Spherocytosis (HS)",
                "Huntington's Disease (HD)",
                "Maple Syrup Urine Disease (MSUD)",
                "Marfan Syndrome (MFS)",
                "Neurofibromatosis Type 1 (NF1)",
                "Niemann-Pick Disease Type C (NPC)",
                "Phenylketonuria (PKU)",
                "Polycystic Kidney Disease - Autosomal Dominant (ADPKD)",
                "Retinitis Pigmentosa (RP) - certain subtypes",
                "Sickle Cell Anemia (SCA)",
                "Tay-Sachs Disease (TSD)",
                "Wilson's Disease (WD)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Sickle Cell Disease (SCD)",
            "Huntington's Disease (HD)",
            "Marfan Syndrome (MFS)",
            "Neurofibromatosis Type 1 (NF1)",
            "Polycystic Kidney Disease (PKD)",
            "Familial Hypercholesterolemia (FH)",
            "Tuberous Sclerosis Complex (TSC)",
            "Hereditary Hemochromatosis (HH)",
            "Alpha-1 Antitrypsin Deficiency (AATD)",
            "Phenylketonuria (PKU)",
            "Duchenne Muscular Dystrophy (DMD)",
            "Myotonic Dystrophy (DM)",
            "Fragile X Syndrome (FXS)",
            "X-linked Agammaglobulinemia (XLA)",
            "Beta Thalassemia",
            "Hemophilia A",
            "Hemophilia B",
            "Rett Syndrome",
            "Achondroplasia",
            "Osteogenesis Imperfecta",
            "Noonan Syndrome",
            "Congenital Adrenal Hyperplasia (CAH)",
            "Wilson's Disease"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Sickle Cell Disease (SCD)",
                "Huntington's Disease (HD)",
                "Marfan Syndrome (MFS)",
                "Neurofibromatosis Type 1 (NF1)",
                "Polycystic Kidney Disease (PKD)",
                "Familial Hypercholesterolemia (FH)",
                "Tuberous Sclerosis Complex (TSC)",
                "Hereditary Hemochromatosis (HH)",
                "Alpha-1 Antitrypsin Deficiency (AATD)",
                "Phenylketonuria (PKU)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Myotonic Dystrophy (DM)",
                "Fragile X Syndrome (FXS)",
                "X-linked Agammaglobulinemia (XLA)",
                "Beta Thalassemia",
                "Hemophilia A",
                "Hemophilia B",
                "Rett Syndrome",
                "Achondroplasia",
                "Osteogenesis Imperfecta",
                "Noonan Syndrome",
                "Congenital Adrenal Hyperplasia (CAH)",
                "Wilson's Disease"
            ],
            "mismatches": [],
            "true_referents": [
                "Achondroplasia",
                "Alpha-1 Antitrypsin Deficiency (AATD)",
                "Beta Thalassemia",
                "Congenital Adrenal Hyperplasia (CAH)",
                "Cystic Fibrosis (CF)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Familial Hypercholesterolemia (FH)",
                "Fragile X Syndrome (FXS)",
                "Hemophilia A",
                "Hemophilia B",
                "Hereditary Hemochromatosis (HH)",
                "Huntington's Disease (HD)",
                "Marfan Syndrome (MFS)",
                "Myotonic Dystrophy (DM)",
                "Neurofibromatosis Type 1 (NF1)",
                "Noonan Syndrome",
                "Osteogenesis Imperfecta",
                "Phenylketonuria (PKU)",
                "Polycystic Kidney Disease (PKD)",
                "Rett Syndrome",
                "Sickle Cell Disease (SCD)",
                "Tuberous Sclerosis Complex (TSC)",
                "Wilson's Disease",
                "X-linked Agammaglobulinemia (XLA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Sickle Cell Anemia (SCA)",
            "Huntington's Disease (HD)",
            "Duchenne Muscular Dystrophy (DMD)",
            "Hemophilia A (HA)",
            "Phenylketonuria (PKU)",
            "Marfan Syndrome (MS)",
            "Neurofibromatosis Type 1 (NF1)",
            "Tay-Sachs Disease (TSD)",
            "Wilson's Disease (WD)",
            "Spinal Muscular Atrophy (SMA)",
            "Thalassemia (THAL)",
            "Achondroplasia (ACH)",
            "Gaucher Disease (GD)",
            "Albinism (ALB)",
            "Familial Hypercholesterolemia (FH)",
            "Myotonic Dystrophy (MD)",
            "Congenital Adrenal Hyperplasia (CAH)",
            "Oculocutaneous Albinism (OCA)",
            "Long QT Syndrome (LQTS)",
            "Beta Thalassemia (BT)",
            "Usher Syndrome (US)",
            "Smith-Lemli-Opitz Syndrome (SLOS)",
            "Ehlers-Danlos Syndrome (EDS)",
            "Bardet-Biedl Syndrome (BBS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Sickle Cell Anemia (SCA)",
                "Huntington's Disease (HD)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Hemophilia A (HA)",
                "Phenylketonuria (PKU)",
                "Marfan Syndrome (MS)",
                "Neurofibromatosis Type 1 (NF1)",
                "Tay-Sachs Disease (TSD)",
                "Wilson's Disease (WD)",
                "Spinal Muscular Atrophy (SMA)",
                "Thalassemia (THAL)",
                "Achondroplasia (ACH)",
                "Gaucher Disease (GD)",
                "Albinism (ALB)",
                "Familial Hypercholesterolemia (FH)",
                "Myotonic Dystrophy (MD)",
                "Congenital Adrenal Hyperplasia (CAH)",
                "Oculocutaneous Albinism (OCA)",
                "Long QT Syndrome (LQTS)",
                "Beta Thalassemia (BT)",
                "Usher Syndrome (US)",
                "Smith-Lemli-Opitz Syndrome (SLOS)",
                "Ehlers-Danlos Syndrome (EDS)"
            ],
            "mismatches": [
                "Bardet-Biedl Syndrome (BBS)"
            ],
            "true_referents": [
                "Achondroplasia (ACH)",
                "Albinism (ALB)",
                "Beta Thalassemia (BT)",
                "Congenital Adrenal Hyperplasia (CAH)",
                "Cystic Fibrosis (CF)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Ehlers-Danlos Syndrome (EDS)",
                "Familial Hypercholesterolemia (FH)",
                "Gaucher Disease (GD)",
                "Hemophilia A (HA)",
                "Huntington's Disease (HD)",
                "Long QT Syndrome (LQTS)",
                "Marfan Syndrome (MS)",
                "Myotonic Dystrophy (MD)",
                "Neurofibromatosis Type 1 (NF1)",
                "Oculocutaneous Albinism (OCA)",
                "Phenylketonuria (PKU)",
                "Sickle Cell Anemia (SCA)",
                "Smith-Lemli-Opitz Syndrome (SLOS)",
                "Spinal Muscular Atrophy (SMA)",
                "Tay-Sachs Disease (TSD)",
                "Thalassemia (THAL)",
                "Usher Syndrome (US)",
                "Wilson's Disease (WD)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Huntington's Disease (HD)",
            "Sickle Cell Anemia (SCA)",
            "Hemophilia A (HA)",
            "Duchenne Muscular Dystrophy (DMD)",
            "Phenylketonuria (PKU)",
            "Polycystic Kidney Disease (PKD)",
            "Marfan Syndrome (MFS)",
            "Fragile X Syndrome (FXS)",
            "Tay-Sachs Disease (TSD)",
            "Neurofibromatosis (NF)",
            "Wilson's Disease (WD)",
            "Alpha-1 Antitrypsin Deficiency (AATD)",
            "Hereditary Hemochromatosis (HH)",
            "Fabry Disease (FD)",
            "Gaucher's Disease (GD)",
            "Osteogenesis Imperfecta (OI)",
            "Retinoblastoma (RB)",
            "Li-Fraumeni Syndrome (LFS)",
            "Von Hippel-Lindau Syndrome (VHL)",
            "Alkaptonuria (AKU)",
            "Hereditary Spherocytosis (HS)",
            "Congenital Adrenal Hyperplasia (CAH)",
            "Maple Syrup Urine Disease (MSUD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Huntington's Disease (HD)",
                "Sickle Cell Anemia (SCA)",
                "Hemophilia A (HA)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Phenylketonuria (PKU)",
                "Polycystic Kidney Disease (PKD)",
                "Marfan Syndrome (MFS)",
                "Fragile X Syndrome (FXS)",
                "Tay-Sachs Disease (TSD)",
                "Neurofibromatosis (NF)",
                "Wilson's Disease (WD)",
                "Alpha-1 Antitrypsin Deficiency (AATD)",
                "Hereditary Hemochromatosis (HH)",
                "Fabry Disease (FD)",
                "Gaucher's Disease (GD)",
                "Osteogenesis Imperfecta (OI)",
                "Retinoblastoma (RB)",
                "Li-Fraumeni Syndrome (LFS)",
                "Von Hippel-Lindau Syndrome (VHL)",
                "Alkaptonuria (AKU)",
                "Hereditary Spherocytosis (HS)",
                "Congenital Adrenal Hyperplasia (CAH)",
                "Maple Syrup Urine Disease (MSUD)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkaptonuria (AKU)",
                "Alpha-1 Antitrypsin Deficiency (AATD)",
                "Congenital Adrenal Hyperplasia (CAH)",
                "Cystic Fibrosis (CF)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Fabry Disease (FD)",
                "Fragile X Syndrome (FXS)",
                "Gaucher's Disease (GD)",
                "Hemophilia A (HA)",
                "Hereditary Hemochromatosis (HH)",
                "Hereditary Spherocytosis (HS)",
                "Huntington's Disease (HD)",
                "Li-Fraumeni Syndrome (LFS)",
                "Maple Syrup Urine Disease (MSUD)",
                "Marfan Syndrome (MFS)",
                "Neurofibromatosis (NF)",
                "Osteogenesis Imperfecta (OI)",
                "Phenylketonuria (PKU)",
                "Polycystic Kidney Disease (PKD)",
                "Retinoblastoma (RB)",
                "Sickle Cell Anemia (SCA)",
                "Tay-Sachs Disease (TSD)",
                "Von Hippel-Lindau Syndrome (VHL)",
                "Wilson's Disease (WD)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic fibrosis",
            "Huntington's disease",
            "Sickle cell anemia",
            "Duchenne muscular dystrophy",
            "Fragile X syndrome",
            "Spinal muscular atrophy",
            "Tay-Sachs disease",
            "Polycystic kidney disease",
            "Marfan syndrome",
            "Hemophilia A",
            "Hemophilia B",
            "Williams syndrome",
            "Neurofibromatosis type 1",
            "Rett syndrome",
            "Myotonic dystrophy",
            "Familial hypercholesterolemia",
            "Charcot-Marie-Tooth disease",
            "Friedreich's ataxia",
            "Hereditary spherocytosis",
            "Autosomal dominant polycystic kidney disease",
            "Autosomal recessive polycystic kidney disease",
            "X-linked agammaglobulinemia",
            "Alkaptonuria",
            "Oculocutaneous albinism"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic fibrosis",
                "Huntington's disease",
                "Sickle cell anemia",
                "Duchenne muscular dystrophy",
                "Fragile X syndrome",
                "Spinal muscular atrophy",
                "Tay-Sachs disease",
                "Polycystic kidney disease",
                "Marfan syndrome",
                "Hemophilia A",
                "Hemophilia B",
                "Williams syndrome",
                "Neurofibromatosis type 1",
                "Rett syndrome",
                "Myotonic dystrophy",
                "Familial hypercholesterolemia",
                "Charcot-Marie-Tooth disease",
                "Friedreich's ataxia",
                "Hereditary spherocytosis",
                "Autosomal dominant polycystic kidney disease",
                "Autosomal recessive polycystic kidney disease",
                "X-linked agammaglobulinemia",
                "Alkaptonuria",
                "Oculocutaneous albinism"
            ],
            "mismatches": [],
            "true_referents": [
                "Alkaptonuria",
                "Autosomal dominant polycystic kidney disease",
                "Autosomal recessive polycystic kidney disease",
                "Charcot-Marie-Tooth disease",
                "Cystic fibrosis",
                "Duchenne muscular dystrophy",
                "Familial hypercholesterolemia",
                "Fragile X syndrome",
                "Friedreich's ataxia",
                "Hemophilia A",
                "Hemophilia B",
                "Hereditary spherocytosis",
                "Huntington's disease",
                "Marfan syndrome",
                "Myotonic dystrophy",
                "Neurofibromatosis type 1",
                "Oculocutaneous albinism",
                "Polycystic kidney disease",
                "Rett syndrome",
                "Sickle cell anemia",
                "Spinal muscular atrophy",
                "Tay-Sachs disease",
                "Williams syndrome",
                "X-linked agammaglobulinemia"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic fibrosis (CF)",
            "Huntington disease (HD)",
            "Sickle cell disease (SCD)",
            "Phenylketonuria (PKU)",
            "Hemophilia A",
            "Hemophilia B",
            "Marfan syndrome",
            "Tay-Sachs disease",
            "Duchenne muscular dystrophy (DMD)",
            "Familial hypercholesterolemia",
            "Neurofibromatosis type 1 (NF1)",
            "Osteogenesis imperfecta",
            "Myotonic dystrophy",
            "Retinitis pigmentosa",
            "Gaucher disease",
            "Wilson disease",
            "Charcot-Marie-Tooth disease",
            "Fragile X syndrome",
            "von Willebrand disease",
            "Alpha-1 antitrypsin deficiency",
            "G6PD deficiency",
            "Tuberous sclerosis",
            "Prader-Willi syndrome",
            "Becker muscular dystrophy"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic fibrosis (CF)",
                "Huntington disease (HD)",
                "Sickle cell disease (SCD)",
                "Phenylketonuria (PKU)",
                "Hemophilia A",
                "Hemophilia B",
                "Marfan syndrome",
                "Tay-Sachs disease",
                "Duchenne muscular dystrophy (DMD)",
                "Familial hypercholesterolemia",
                "Neurofibromatosis type 1 (NF1)",
                "Osteogenesis imperfecta",
                "Myotonic dystrophy",
                "Retinitis pigmentosa",
                "Gaucher disease",
                "Wilson disease",
                "Charcot-Marie-Tooth disease",
                "Fragile X syndrome",
                "von Willebrand disease",
                "Alpha-1 antitrypsin deficiency",
                "G6PD deficiency",
                "Tuberous sclerosis",
                "Prader-Willi syndrome",
                "Becker muscular dystrophy"
            ],
            "mismatches": [],
            "true_referents": [
                "Alpha-1 antitrypsin deficiency",
                "Becker muscular dystrophy",
                "Charcot-Marie-Tooth disease",
                "Cystic fibrosis (CF)",
                "Duchenne muscular dystrophy (DMD)",
                "Familial hypercholesterolemia",
                "Fragile X syndrome",
                "G6PD deficiency",
                "Gaucher disease",
                "Hemophilia A",
                "Hemophilia B",
                "Huntington disease (HD)",
                "Marfan syndrome",
                "Myotonic dystrophy",
                "Neurofibromatosis type 1 (NF1)",
                "Osteogenesis imperfecta",
                "Phenylketonuria (PKU)",
                "Prader-Willi syndrome",
                "Retinitis pigmentosa",
                "Sickle cell disease (SCD)",
                "Tay-Sachs disease",
                "Tuberous sclerosis",
                "Wilson disease",
                "von Willebrand disease"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic fibrosis (CF)",
            "Sickle cell disease (SCD)",
            "Huntington's disease (HD)",
            "Duchenne muscular dystrophy (DMD)",
            "Hemophilia A",
            "Fragile X syndrome (FXS)",
            "Neurofibromatosis type 1 (NF1)",
            "Marfan syndrome",
            "Phenylketonuria (PKU)",
            "Tay-Sachs disease",
            "Familial hypercholesterolemia (FH)",
            "Hereditary hemochromatosis",
            "Spinal muscular atrophy (SMA)",
            "Myotonic dystrophy type 1 (DM1)",
            "Polycystic kidney disease (PKD)",
            "Familial adenomatous polyposis (FAP)",
            "Retinitis pigmentosa",
            "Osteogenesis imperfecta",
            "Friedreich's ataxia (FA)",
            "Tuberous sclerosis complex (TSC)",
            "Angelman syndrome",
            "Prader-Willi syndrome",
            "Rett syndrome",
            "Wilson's disease"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic fibrosis (CF)",
                "Sickle cell disease (SCD)",
                "Huntington's disease (HD)",
                "Duchenne muscular dystrophy (DMD)",
                "Hemophilia A",
                "Fragile X syndrome (FXS)",
                "Neurofibromatosis type 1 (NF1)",
                "Marfan syndrome",
                "Phenylketonuria (PKU)",
                "Tay-Sachs disease",
                "Familial hypercholesterolemia (FH)",
                "Hereditary hemochromatosis",
                "Spinal muscular atrophy (SMA)",
                "Myotonic dystrophy type 1 (DM1)",
                "Polycystic kidney disease (PKD)",
                "Familial adenomatous polyposis (FAP)",
                "Retinitis pigmentosa",
                "Osteogenesis imperfecta",
                "Friedreich's ataxia (FA)",
                "Tuberous sclerosis complex (TSC)",
                "Angelman syndrome",
                "Prader-Willi syndrome",
                "Rett syndrome",
                "Wilson's disease"
            ],
            "mismatches": [],
            "true_referents": [
                "Angelman syndrome",
                "Cystic fibrosis (CF)",
                "Duchenne muscular dystrophy (DMD)",
                "Familial adenomatous polyposis (FAP)",
                "Familial hypercholesterolemia (FH)",
                "Fragile X syndrome (FXS)",
                "Friedreich's ataxia (FA)",
                "Hemophilia A",
                "Hereditary hemochromatosis",
                "Huntington's disease (HD)",
                "Marfan syndrome",
                "Myotonic dystrophy type 1 (DM1)",
                "Neurofibromatosis type 1 (NF1)",
                "Osteogenesis imperfecta",
                "Phenylketonuria (PKU)",
                "Polycystic kidney disease (PKD)",
                "Prader-Willi syndrome",
                "Retinitis pigmentosa",
                "Rett syndrome",
                "Sickle cell disease (SCD)",
                "Spinal muscular atrophy (SMA)",
                "Tay-Sachs disease",
                "Tuberous sclerosis complex (TSC)",
                "Wilson's disease"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic fibrosis (CF)",
            "Sickle cell anemia (SCA)",
            "Huntington's disease (HD)",
            "Duchenne muscular dystrophy (DMD)",
            "Fragile X syndrome (FXS)",
            "Tay-Sachs disease (TSD)",
            "Hemophilia A (HA)",
            "Marfan syndrome (MFS)",
            "Neurofibromatosis type 1 (NF1)",
            "Phenylketonuria (PKU)",
            "Spinal muscular atrophy (SMA)",
            "Myotonic dystrophy type 1 (DM1)",
            "Polycystic kidney disease (PKD)",
            "Familial hypercholesterolemia (FH)",
            "Achondroplasia (ACH)",
            "Osteogenesis imperfecta (OI)",
            "Retinitis pigmentosa (RP)",
            "Hemochromatosis (HFE)",
            "Fabry disease (FD)",
            "Gaucher disease (GD)",
            "Pompe disease (PD)",
            "Charcot-Marie-Tooth disease (CMT)",
            "Hereditary spherocytosis (HS)",
            "Wilson's disease (WD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic fibrosis (CF)",
                "Sickle cell anemia (SCA)",
                "Huntington's disease (HD)",
                "Duchenne muscular dystrophy (DMD)",
                "Fragile X syndrome (FXS)",
                "Tay-Sachs disease (TSD)",
                "Hemophilia A (HA)",
                "Marfan syndrome (MFS)",
                "Neurofibromatosis type 1 (NF1)",
                "Phenylketonuria (PKU)",
                "Spinal muscular atrophy (SMA)",
                "Myotonic dystrophy type 1 (DM1)",
                "Polycystic kidney disease (PKD)",
                "Familial hypercholesterolemia (FH)",
                "Achondroplasia (ACH)",
                "Osteogenesis imperfecta (OI)",
                "Retinitis pigmentosa (RP)",
                "Hemochromatosis (HFE)",
                "Fabry disease (FD)",
                "Gaucher disease (GD)",
                "Pompe disease (PD)",
                "Charcot-Marie-Tooth disease (CMT)",
                "Hereditary spherocytosis (HS)",
                "Wilson's disease (WD)"
            ],
            "mismatches": [],
            "true_referents": [
                "Achondroplasia (ACH)",
                "Charcot-Marie-Tooth disease (CMT)",
                "Cystic fibrosis (CF)",
                "Duchenne muscular dystrophy (DMD)",
                "Fabry disease (FD)",
                "Familial hypercholesterolemia (FH)",
                "Fragile X syndrome (FXS)",
                "Gaucher disease (GD)",
                "Hemochromatosis (HFE)",
                "Hemophilia A (HA)",
                "Hereditary spherocytosis (HS)",
                "Huntington's disease (HD)",
                "Marfan syndrome (MFS)",
                "Myotonic dystrophy type 1 (DM1)",
                "Neurofibromatosis type 1 (NF1)",
                "Osteogenesis imperfecta (OI)",
                "Phenylketonuria (PKU)",
                "Polycystic kidney disease (PKD)",
                "Pompe disease (PD)",
                "Retinitis pigmentosa (RP)",
                "Sickle cell anemia (SCA)",
                "Spinal muscular atrophy (SMA)",
                "Tay-Sachs disease (TSD)",
                "Wilson's disease (WD)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic fibrosis (CF)",
            "Sickle cell disease (SCD)",
            "Huntington's disease (HD)",
            "Hemophilia A (FVIII deficiency)",
            "Hemophilia B (FIX deficiency)",
            "Duchenne muscular dystrophy (DMD)",
            "Marfan syndrome (MFS)",
            "Neurofibromatosis type 1 (NF1)",
            "Familial hypercholesterolemia (FH)",
            "Phenylketonuria (PKU)",
            "Galactosemia",
            "Maple syrup urine disease (MSUD)",
            "Tay-Sachs disease",
            "Niemann-Pick disease",
            "Gaucher disease",
            "Fabry disease",
            "Pompe disease",
            "Mucopolysaccharidosis I (MPS I)",
            "Mucopolysaccharidosis II (MPS II)",
            "Mucopolysaccharidosis III (MPS III)",
            "Mucopolysaccharidosis IV (MPS IV)",
            "Mucopolysaccharidosis VI (MPS VI)",
            "Mucopolysaccharidosis VII (MPS VII)",
            "Wilson's disease"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic fibrosis (CF)",
                "Sickle cell disease (SCD)",
                "Huntington's disease (HD)",
                "Hemophilia A (FVIII deficiency)",
                "Hemophilia B (FIX deficiency)",
                "Duchenne muscular dystrophy (DMD)",
                "Marfan syndrome (MFS)",
                "Neurofibromatosis type 1 (NF1)",
                "Familial hypercholesterolemia (FH)",
                "Phenylketonuria (PKU)",
                "Galactosemia",
                "Maple syrup urine disease (MSUD)",
                "Tay-Sachs disease",
                "Niemann-Pick disease",
                "Gaucher disease",
                "Fabry disease",
                "Pompe disease",
                "Mucopolysaccharidosis I (MPS I)",
                "Mucopolysaccharidosis II (MPS II)",
                "Mucopolysaccharidosis III (MPS III)",
                "Mucopolysaccharidosis IV (MPS IV)",
                "Mucopolysaccharidosis VI (MPS VI)",
                "Mucopolysaccharidosis VII (MPS VII)",
                "Wilson's disease"
            ],
            "mismatches": [],
            "true_referents": [
                "Cystic fibrosis (CF)",
                "Duchenne muscular dystrophy (DMD)",
                "Fabry disease",
                "Familial hypercholesterolemia (FH)",
                "Galactosemia",
                "Gaucher disease",
                "Hemophilia A (FVIII deficiency)",
                "Hemophilia B (FIX deficiency)",
                "Huntington's disease (HD)",
                "Maple syrup urine disease (MSUD)",
                "Marfan syndrome (MFS)",
                "Mucopolysaccharidosis I (MPS I)",
                "Mucopolysaccharidosis II (MPS II)",
                "Mucopolysaccharidosis III (MPS III)",
                "Mucopolysaccharidosis IV (MPS IV)",
                "Mucopolysaccharidosis VI (MPS VI)",
                "Mucopolysaccharidosis VII (MPS VII)",
                "Neurofibromatosis type 1 (NF1)",
                "Niemann-Pick disease",
                "Phenylketonuria (PKU)",
                "Pompe disease",
                "Sickle cell disease (SCD)",
                "Tay-Sachs disease",
                "Wilson's disease"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Sickle Cell Anemia (SCA)",
            "Huntington's Disease (HD)",
            "Duchenne Muscular Dystrophy (DMD)",
            "Phenylketonuria (PKU)",
            "Maple Syrup Urine Disease (MSUD)",
            "Homocystinuria (HCU)",
            "Galactosemia (GAL)",
            "Niemann-Pick Disease (NPD)",
            "Gaucher Disease (GD)",
            "Fabry Disease (FD)",
            "Pompe Disease (PD)",
            "Lesch-Nyhan Syndrome (LNS)",
            "Familial Hypercholesterolemia (FH)",
            "Familial Amyloid Polyneuropathy (FAP)",
            "Marfan Syndrome (MFS)",
            "Neurofibromatosis Type 1 (NF1)",
            "Tuberous Sclerosis (TS)",
            "Polycystic Kidney Disease (PKD)",
            "Familial Adenomatous Polyposis (FAP)",
            "Ataxia-Telangiectasia (AT)",
            "Xeroderma Pigmentosum (XP)",
            "Fanconi Anemia (FA)",
            "Homozygous Familial Hypercholesterolemia (HoFH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Sickle Cell Anemia (SCA)",
                "Huntington's Disease (HD)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Phenylketonuria (PKU)",
                "Maple Syrup Urine Disease (MSUD)",
                "Homocystinuria (HCU)",
                "Galactosemia (GAL)",
                "Niemann-Pick Disease (NPD)",
                "Gaucher Disease (GD)",
                "Fabry Disease (FD)",
                "Pompe Disease (PD)",
                "Lesch-Nyhan Syndrome (LNS)",
                "Familial Hypercholesterolemia (FH)",
                "Familial Amyloid Polyneuropathy (FAP)",
                "Marfan Syndrome (MFS)",
                "Neurofibromatosis Type 1 (NF1)",
                "Tuberous Sclerosis (TS)",
                "Polycystic Kidney Disease (PKD)",
                "Familial Adenomatous Polyposis (FAP)",
                "Ataxia-Telangiectasia (AT)",
                "Xeroderma Pigmentosum (XP)",
                "Fanconi Anemia (FA)",
                "Homozygous Familial Hypercholesterolemia (HoFH)"
            ],
            "mismatches": [],
            "true_referents": [
                "Ataxia-Telangiectasia (AT)",
                "Cystic Fibrosis (CF)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Fabry Disease (FD)",
                "Familial Adenomatous Polyposis (FAP)",
                "Familial Amyloid Polyneuropathy (FAP)",
                "Familial Hypercholesterolemia (FH)",
                "Fanconi Anemia (FA)",
                "Galactosemia (GAL)",
                "Gaucher Disease (GD)",
                "Homocystinuria (HCU)",
                "Homozygous Familial Hypercholesterolemia (HoFH)",
                "Huntington's Disease (HD)",
                "Lesch-Nyhan Syndrome (LNS)",
                "Maple Syrup Urine Disease (MSUD)",
                "Marfan Syndrome (MFS)",
                "Neurofibromatosis Type 1 (NF1)",
                "Niemann-Pick Disease (NPD)",
                "Phenylketonuria (PKU)",
                "Polycystic Kidney Disease (PKD)",
                "Pompe Disease (PD)",
                "Sickle Cell Anemia (SCA)",
                "Tuberous Sclerosis (TS)",
                "Xeroderma Pigmentosum (XP)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Fragile X Syndrome (FXS)",
            "Huntington's Disease (HD)",
            "Friedreich's Ataxia (FRDA)",
            "Cystic Fibrosis (CF)",
            "Sickle Cell Anemia (SCA)",
            "Tay-Sachs Disease (TSD)",
            "Muscular Dystrophy (MD)",
            "Hemophilia A (HA)",
            "Hemophilia B (HB)",
            "Thalassemia Major (TM)",
            "Thalassemia Minor (TMn)",
            "Sickle Cell Trait (SCT)",
            "Mucopolysaccharidosis Type I (MPS I)",
            "Mucopolysaccharidosis Type II (MPS II)",
            "Mucopolysaccharidosis Type III (MPS III)",
            "Mucopolysaccharidosis Type IV (MPS IV)",
            "Mucopolysaccharidosis Type VI (MPS VI)",
            "Mucopolysaccharidosis Type VII (MPS VII)",
            "Mucopolysaccharidosis Type IX (MPS IX)",
            "Fabry Disease (FD)",
            "Gaucher Disease (GD)",
            "Niemann-Pick Disease (NPD)",
            "Torsion Dystonia (TD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Fragile X Syndrome (FXS)",
                "Huntington's Disease (HD)",
                "Friedreich's Ataxia (FRDA)",
                "Cystic Fibrosis (CF)",
                "Sickle Cell Anemia (SCA)",
                "Tay-Sachs Disease (TSD)",
                "Muscular Dystrophy (MD)",
                "Hemophilia A (HA)",
                "Hemophilia B (HB)",
                "Thalassemia Major (TM)",
                "Thalassemia Minor (TMn)",
                "Sickle Cell Trait (SCT)",
                "Mucopolysaccharidosis Type I (MPS I)",
                "Mucopolysaccharidosis Type II (MPS II)",
                "Mucopolysaccharidosis Type III (MPS III)",
                "Mucopolysaccharidosis Type IV (MPS IV)",
                "Mucopolysaccharidosis Type VI (MPS VI)",
                "Mucopolysaccharidosis Type VII (MPS VII)",
                "Mucopolysaccharidosis Type IX (MPS IX)",
                "Fabry Disease (FD)",
                "Gaucher Disease (GD)",
                "Niemann-Pick Disease (NPD)",
                "Torsion Dystonia (TD)"
            ],
            "mismatches": [],
            "true_referents": [
                "Cystic Fibrosis (CF)",
                "Fabry Disease (FD)",
                "Fragile X Syndrome (FXS)",
                "Friedreich's Ataxia (FRDA)",
                "Gaucher Disease (GD)",
                "Hemophilia A (HA)",
                "Hemophilia B (HB)",
                "Huntington's Disease (HD)",
                "Mucopolysaccharidosis Type I (MPS I)",
                "Mucopolysaccharidosis Type II (MPS II)",
                "Mucopolysaccharidosis Type III (MPS III)",
                "Mucopolysaccharidosis Type IV (MPS IV)",
                "Mucopolysaccharidosis Type IX (MPS IX)",
                "Mucopolysaccharidosis Type VI (MPS VI)",
                "Mucopolysaccharidosis Type VII (MPS VII)",
                "Muscular Dystrophy (MD)",
                "Niemann-Pick Disease (NPD)",
                "Sickle Cell Anemia (SCA)",
                "Sickle Cell Trait (SCT)",
                "Tay-Sachs Disease (TSD)",
                "Thalassemia Major (TM)",
                "Thalassemia Minor (TMn)",
                "Torsion Dystonia (TD)"
            ],
            "TP": 23,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": [
            "Cystic Fibrosis (CF)",
            "Sickle Cell Anemia (HbS)",
            "Marfan Syndrome (MFS)",
            "Huntington's Disease (HD)",
            "Muscular Dystrophy (MD)",
            "Tay-Sachs Disease (TSD)",
            "Phenylketonuria (PKU)",
            "Thalassemia (THAL)",
            "Familial Hypercholesterolemia (FH)",
            "Achondroplasia (ACH)",
            "Ehlers-Danlos Syndrome (EDS)",
            "Osteogenesis Imperfecta (OI)",
            "Fragile X Syndrome (FXS)",
            "Spinal Muscular Atrophy (SMA)",
            "Duchenne Muscular Dystrophy (DMD)",
            "Becker Muscular Dystrophy (BMD)",
            "Myotonic Dystrophy (DM)",
            "Niemann-Pick Disease (NPD)",
            "Maple Syrup Urine Disease (MSUD)",
            "Homocystinuria (HCU)",
            "Crouzon Syndrome (CS)",
            "Apert Syndrome (AS)",
            "Pfeiffer Syndrome (PS)",
            "Mucopolysaccharidosis (MPS)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cystic Fibrosis (CF)",
                "Sickle Cell Anemia (HbS)",
                "Marfan Syndrome (MFS)",
                "Huntington's Disease (HD)",
                "Muscular Dystrophy (MD)",
                "Tay-Sachs Disease (TSD)",
                "Phenylketonuria (PKU)",
                "Thalassemia (THAL)",
                "Familial Hypercholesterolemia (FH)",
                "Achondroplasia (ACH)",
                "Ehlers-Danlos Syndrome (EDS)",
                "Osteogenesis Imperfecta (OI)",
                "Fragile X Syndrome (FXS)",
                "Spinal Muscular Atrophy (SMA)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Becker Muscular Dystrophy (BMD)",
                "Myotonic Dystrophy (DM)",
                "Niemann-Pick Disease (NPD)",
                "Maple Syrup Urine Disease (MSUD)",
                "Homocystinuria (HCU)",
                "Crouzon Syndrome (CS)",
                "Apert Syndrome (AS)",
                "Pfeiffer Syndrome (PS)",
                "Mucopolysaccharidosis (MPS)"
            ],
            "mismatches": [],
            "true_referents": [
                "Achondroplasia (ACH)",
                "Apert Syndrome (AS)",
                "Becker Muscular Dystrophy (BMD)",
                "Crouzon Syndrome (CS)",
                "Cystic Fibrosis (CF)",
                "Duchenne Muscular Dystrophy (DMD)",
                "Ehlers-Danlos Syndrome (EDS)",
                "Familial Hypercholesterolemia (FH)",
                "Fragile X Syndrome (FXS)",
                "Homocystinuria (HCU)",
                "Huntington's Disease (HD)",
                "Maple Syrup Urine Disease (MSUD)",
                "Marfan Syndrome (MFS)",
                "Mucopolysaccharidosis (MPS)",
                "Muscular Dystrophy (MD)",
                "Myotonic Dystrophy (DM)",
                "Niemann-Pick Disease (NPD)",
                "Osteogenesis Imperfecta (OI)",
                "Pfeiffer Syndrome (PS)",
                "Phenylketonuria (PKU)",
                "Sickle Cell Anemia (HbS)",
                "Spinal Muscular Atrophy (SMA)",
                "Tay-Sachs Disease (TSD)",
                "Thalassemia (THAL)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "monogenic disease with high (1>20000) prevalence in human",
        "domain": "medicine",
        "response": "[\"it is a disease\", \"it has a prevalence of greater than 1 in 20,000 individuals in the human population\"]}\n{\"Referent\": \"Huntington's disease\", \"Canonical Name\": \"Huntington's disease\", \"Definition\": [\"it is a disease\", \"it has a prevalence of greater than 1 in 20,000 individuals in the human population\"]",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]