[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Estrogen (E2)",
            "Testosterone",
            "Progesterone",
            "Cortisol",
            "Dexamethasone",
            "Prednisone",
            "Androstenedione",
            "Dehydroepiandrosterone (DHEA)",
            "Allopregnanolone",
            "Estradiol",
            "Estrone",
            "Androsterone",
            "Epiandrosterone",
            "11-Deoxycortisol",
            "Androstanediol",
            "Estrone sulfate",
            "Pregnenolone",
            "17-Hydroxyprogesterone",
            "11-Dehydrocorticosterone",
            "Dihydrotestosterone",
            "17-Ketosteroids",
            "17-Hydroxycorticosteroids",
            "17-OH-progesterone",
            "Androstenediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone",
                "Cortisol",
                "Dexamethasone",
                "Prednisone",
                "11-Deoxycortisol"
            ],
            "mismatches": [
                "Estrogen (E2)",
                "Testosterone",
                "Androstenedione",
                "Dehydroepiandrosterone (DHEA)",
                "Allopregnanolone",
                "Estradiol",
                "Estrone",
                "Androsterone",
                "Epiandrosterone",
                "Androstanediol",
                "Estrone sulfate",
                "Pregnenolone",
                "17-Hydroxyprogesterone",
                "11-Dehydrocorticosterone",
                "Dihydrotestosterone",
                "17-Ketosteroids",
                "17-Hydroxycorticosteroids",
                "17-OH-progesterone",
                "Androstenediol"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "18-hydroxycortisol",
                "21-Deoxycortisone",
                "3alpha,17alpha-dihydroxy-5beta-pregnan-20-one",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "anabolic androgenic steroid",
                "boldenone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisol 17-valerate",
                "dexamethasone",
                "dexamethasone dipropionate",
                "fluoxymesterone",
                "nandrolone",
                "norgesterone",
                "oxandrolone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "trenbolone"
            ],
            "TP": 5,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Cortisol (C21H30O5)",
            "Aldosterone (C21H28O5)",
            "Testosterone (C19H28O2)",
            "Estradiol (C18H24O2)",
            "Progesterone (C21H30O2)",
            "Dihydrotestosterone (DHT) (C19H30O2)",
            "Dehydroepiandrosterone (DHEA) (C19H28O2)",
            "Androstenedione (C19H26O2)",
            "Epiandrosterone (C19H30O2)",
            "Pregnenolone (C21H32O2)",
            "Cholesterol (C27H46O)",
            "Deoxycorticosterone (DOC) (C21H30O3)",
            "11-deoxycortisol (C21H30O4)",
            "Cortisone (C21H28O5)",
            "Estrone (C18H22O2)",
            "Estriol (C18H24O3)",
            "Ethyne (C2H2)",
            "Thyroxine (T4) (C15H11I4NO4)",
            "Triiodothyronine (T3) (C15H12I3NO4)",
            "Catecholamines (e.g., Epinephrine, Norepinephrine)",
            "Melatonin (C13H16N2O2)",
            "Vitamin D3 (Cholecalciferol) (C27H44O)",
            "Retinoic Acid (C20H28O2)",
            "Vitamin D2 (Ergocalciferol) (C28H44O)",
            "Bile Acids (e.g., Cholic Acid, Chenodeoxycholic Acid)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "cortisol",
                "aldosterone",
                "progesterone",
                "11-deoxycortisol",
                "cortisone"
            ],
            "mismatches": [
                "Cortisol (C21H30O5)",
                "Aldosterone (C21H28O5)",
                "Testosterone (C19H28O2)",
                "Estradiol (C18H24O2)",
                "Progesterone (C21H30O2)",
                "Dihydrotestosterone (DHT) (C19H30O2)",
                "Dehydroepiandrosterone (DHEA) (C19H28O2)",
                "Androstenedione (C19H26O2)",
                "Epiandrosterone (C19H30O2)",
                "Pregnenolone (C21H32O2)",
                "Cholesterol (C27H46O)",
                "Deoxycorticosterone (DOC) (C21H30O3)",
                "11-deoxycortisol (C21H30O4)",
                "Cortisone (C21H28O5)",
                "Estrone (C18H22O2)",
                "Estriol (C18H24O3)",
                "Ethyne (C2H2)",
                "Thyroxine (T4) (C15H11I4NO4)",
                "Triiodothyronine (T3) (C15H12I3NO4)",
                "Catecholamines (e.g., Epinephrine, Norepinephrine)",
                "Melatonin (C13H16N2O2)",
                "Vitamin D3 (Cholecalciferol) (C27H44O)",
                "Retinoic Acid (C20H28O2)",
                "Vitamin D2 (Ergocalciferol) (C28H44O)",
                "Bile Acids (e.g., Cholic Acid, Chenodeoxycholic Acid)"
            ],
            "true_referents": [
                "(3a,5b,6a)- 17-(acetyloxy)-3-hydroxy-6-methyl- Pregnan-20-one",
                "(5alpha)-3-oxocholestan-26-oic acid",
                "(5alpha,25S)-3-oxocholestan-26-oic acid",
                "11-deoxycorticosterone",
                "11-deoxycortisol",
                "11alpha-Hydroxy-12alpha-methyl-pregn-4-ene-3,20-dione",
                "11alpha-Hydroxy-5beta-pregnane-3,20-dione",
                "11beta,21-Dihydroxypregn-4-ene-3,20-dione 21-acetate",
                "11beta-Hydroxy-6alpha,11-dimethylpregn-4-ene-3,20-dione",
                "12beta-hydroxy-24-norcholesta-1,4,22E-trien-3-one",
                "16-a-Hydroxypregnenolone",
                "16-alpha,17-Epoxypregn-4-ene-3,20-dione",
                "16alpha,17-Isopropylidenedioxy-6alpha-methylprogesterone",
                "17,20,21-trihydroxypregn-1-ene-3,11-dione",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "18-hydroxycortisol",
                "18-oxocortisol",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "21-Deoxycortisone",
                "24-Nor-5beta-chol-22-ene-3alpha,7alpha,12alpha-triol",
                "24-Nor-5beta-cholane-3alpha,7alpha,12alpha-triol",
                "2alpha-Methylpregn-4-ene-3,11,20-trione",
                "3alpha,12alpha-Dihydroxy-5beta-pregnan-20-one",
                "3alpha,17alpha-Dihydroxy-5beta-pregnane-11,20-dione",
                "3alpha,6alpha-Dihydroxy-5beta-pregnan-20-one",
                "3beta,14beta-dihydroxy-5beta-pregnane-20-one",
                "5alpha-dihydrodeoxycorticosterone",
                "6alpha-Chloro-17-acetoxyprogesterone",
                "7alpha-Methyl-4-pregnene-3,20-dione",
                "C21-steroid hormone",
                "Cortisone acetate",
                "Delta(1)-dihydrotestosterone",
                "Deoxycorticosterone acetate",
                "Dexamethasone 21-(4-Pyridinecarboxylate)",
                "Ethyltestosterone",
                "Pregn-5-ene-3beta,20beta-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "clobetasol propionate",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "progesterone"
            ],
            "TP": 5,
            "FP": 25,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Cortisol (Hydrocortisone)",
            "Aldosterone",
            "Testosterone",
            "Estradiol",
            "Progesterone",
            "Corticosterone",
            "Dehydroepiandrosterone (DHEA)",
            "Androstenedione",
            "Dihydrotestosterone (DHT)",
            "Prednisone",
            "Prednisolone",
            "Methylprednisolone",
            "Cortisone",
            "17-Hydroxyprogesterone",
            "Pregnenolone",
            "11-Deoxycortisol",
            "17-Hydroxypregnenolone",
            "11-Deoxycorticosterone",
            "Androsterone",
            "Etiolcholanolone",
            "Cortisyl",
            "Corticosterone acetate",
            "Cortisone acetate",
            "Estriol",
            "19-Nortestosterone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aldosterone",
                "Progesterone",
                "Corticosterone",
                "Prednisone",
                "Prednisolone",
                "Cortisone",
                "11-Deoxycortisol",
                "11-Deoxycorticosterone",
                "Cortisone acetate"
            ],
            "mismatches": [
                "Cortisol (Hydrocortisone)",
                "Testosterone",
                "Estradiol",
                "Dehydroepiandrosterone (DHEA)",
                "Androstenedione",
                "Dihydrotestosterone (DHT)",
                "Methylprednisolone",
                "17-Hydroxyprogesterone",
                "Pregnenolone",
                "17-Hydroxypregnenolone",
                "Androsterone",
                "Etiolcholanolone",
                "Cortisyl",
                "Corticosterone acetate",
                "Estriol",
                "19-Nortestosterone"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "21-Deoxycortisone",
                "5alpha-dihydrodeoxycorticosterone",
                "Alphaxolone",
                "Cortisone acetate",
                "Delta(1)-dihydrotestosterone",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "Prednisolone acetate",
                "aldosterone",
                "anabolic androgenic steroid",
                "clocortolone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "methylprednisolone acetate",
                "mineralocorticoid",
                "nandrolone",
                "norethandrolone",
                "norgesterone",
                "oxandrolone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "trenbolone"
            ],
            "TP": 9,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Cortisol (COR)",
            "Testosterone (TEST)",
            "Estradiol (E2)",
            "Progesterone (PROG)",
            "Aldosterone (ALDO)",
            "Corticosterone (CORT)",
            "Dehydroepiandrosterone (DHEA)",
            "Androstenedione (ANDRO)",
            "Estriol (E3)",
            "Estrone (E1)",
            "Pregnenolone (PREG)",
            "Dihydrotestosterone (DHT)",
            "Prednisone (PRED)",
            "Prednisolone (PREDL)",
            "Methylprednisolone (MPRED)",
            "Dexamethasone (DEX)",
            "Triamcinolone (TRIAM)",
            "Betamethasone (BETA)",
            "Hydrocortisone (HYDRO)",
            "Spironolactone (SPIR)",
            "Mifepristone (MIFE)",
            "Fludrocortisone (FLUD)",
            "Drospirenone (DROSP)",
            "Gestrinone (GEST)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cortisol (COR)",
                "Progesterone (PROG)",
                "Aldosterone (ALDO)",
                "Corticosterone (CORT)",
                "Prednisone (PRED)",
                "Prednisolone (PREDL)",
                "Dexamethasone (DEX)",
                "Triamcinolone (TRIAM)",
                "Betamethasone (BETA)",
                "Fludrocortisone (FLUD)"
            ],
            "mismatches": [
                "Testosterone (TEST)",
                "Estradiol (E2)",
                "Dehydroepiandrosterone (DHEA)",
                "Androstenedione (ANDRO)",
                "Estriol (E3)",
                "Estrone (E1)",
                "Pregnenolone (PREG)",
                "Dihydrotestosterone (DHT)",
                "Methylprednisolone (MPRED)",
                "Hydrocortisone (HYDRO)",
                "Spironolactone (SPIR)",
                "Mifepristone (MIFE)",
                "Drospirenone (DROSP)",
                "Gestrinone (GEST)"
            ],
            "true_referents": [
                "15beta-hydroxycyproterone acetate",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "19-Norprogesterone",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Delta(6)-prednisolone",
                "Delta(6)-prednisone",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydrocortisone cypionate",
                "Prednisolone acetate",
                "Pregn-5-ene-3beta,20alpha-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "betamethasone",
                "clocortolone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "dexamethasone dipropionate",
                "estetrol",
                "fludrocortisone",
                "fludrocortisone acetate",
                "flumethasone",
                "gestonorone",
                "hydrocortisone aceponate",
                "methylprednisolone aceponate",
                "methylprednisolone acetate",
                "mineralocorticoid",
                "norethandrolone",
                "norgesterone",
                "oxandrolone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "trenbolone",
                "triamcinolone",
                "triamcinolone acetonide"
            ],
            "TP": 10,
            "FP": 14,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Testosterone (T)",
            "Estradiol (E2)",
            "Cortisol (F)",
            "Aldosterone (Aldo)",
            "Progesterone (P4)",
            "Dehydroepiandrosterone (DHEA)",
            "Androstenedione (A4)",
            "Estrone (E1)",
            "Estriol (E3)",
            "Corticosterone (B)",
            "17\u03b1-Hydroxyprogesterone (17-OHP)",
            "Dihydrotestosterone (DHT)",
            "11-Deoxycorticosterone (DOC)",
            "11-Deoxycortisol (S)",
            "Calcitriol (1,25(OH)2D3)",
            "Dehydroepiandrosterone sulfate (DHEA-S)",
            "Pregnenolone (P5)",
            "17\u03b1-Estradiol (17\u03b1-E2)",
            "Tetrahydrocorticosterone (THB)",
            "Tetrahydrocortisol (THF)",
            "5-Androstenediol",
            "11\u03b2-Hydroxyandrostenedione",
            "17\u03b1-Hydroxypregnenolone",
            "5\u03b1-Androstanediol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cortisol (F)",
                "Aldosterone (Aldo)",
                "Progesterone (P4)",
                "Corticosterone (B)",
                "11-Deoxycorticosterone (DOC)",
                "11-Deoxycortisol (S)",
                "Tetrahydrocorticosterone (THB)",
                "Tetrahydrocortisol (THF)"
            ],
            "mismatches": [
                "Testosterone (T)",
                "Estradiol (E2)",
                "Dehydroepiandrosterone (DHEA)",
                "Androstenedione (A4)",
                "Estrone (E1)",
                "Estriol (E3)",
                "17\u03b1-Hydroxyprogesterone (17-OHP)",
                "Dihydrotestosterone (DHT)",
                "Calcitriol (1,25(OH)2D3)",
                "Dehydroepiandrosterone sulfate (DHEA-S)",
                "Pregnenolone (P5)",
                "17\u03b1-Estradiol (17\u03b1-E2)",
                "5-Androstenediol",
                "11\u03b2-Hydroxyandrostenedione",
                "17\u03b1-Hydroxypregnenolone",
                "5\u03b1-Androstanediol"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "11a-Hydroxyprogesterone",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "21-Deoxycortisone",
                "24-Nor-5beta-chol-22-ene-3alpha,12alpha-diol",
                "3alpha,17alpha-dihydroxy-5beta-pregnan-20-one",
                "4-Chloroprogesterone",
                "5a-Tetrahydrocorticosterone",
                "5a-Tetrahydrocortisol",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Deoxycorticosterone acetate",
                "Ethyltestosterone",
                "Pregn-5-ene-3beta,20alpha-diol",
                "Pregn-5-ene-3beta,20beta-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "estetrol",
                "fludrocortisone",
                "mineralocorticoid",
                "norgesterone",
                "progesterone",
                "tetrahydrocortisol",
                "trenbolone"
            ],
            "TP": 8,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Testosterone (T)",
            "Estrogen (E)",
            "Progesterone (P)",
            "Cortisol (C)",
            "Aldosterone (A)",
            "Dihydrotestosterone (DHT)",
            "Dehydroepiandrosterone (DHEA)",
            "Androstenedione (A4)",
            "Estradiol (E2)",
            "Estrone (E1)",
            "Hydrocortisone (HC)",
            "Norethindrone (NET)",
            "Methyltestosterone (MT)",
            "Prednisone (PD)",
            "Fludrocortisone (FC)",
            "Cholesterol (Ch)",
            "Androsterone (A)",
            "Bile acids (BA)",
            "Calcitriol (CT)",
            "Vitamin D3 (D3)",
            "Thyroid hormones (TH)",
            "Pregnenolone (P5)",
            "Corticosterone (CST)",
            "Corticotropin-releasing hormone (CRH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone",
                "Cortisol",
                "Aldosterone",
                "Prednisone",
                "Fludrocortisone",
                "Corticosterone"
            ],
            "mismatches": [
                "Testosterone (T)",
                "Estrogen (E)",
                "Dihydrotestosterone (DHT)",
                "Dehydroepiandrosterone (DHEA)",
                "Androstenedione (A4)",
                "Estradiol (E2)",
                "Estrone (E1)",
                "Hydrocortisone (HC)",
                "Norethindrone (NET)",
                "Methyltestosterone (MT)",
                "Cholesterol (Ch)",
                "Androsterone (A)",
                "Bile acids (BA)",
                "Calcitriol (CT)",
                "Vitamin D3 (D3)",
                "Thyroid hormones (TH)",
                "Pregnenolone (P5)",
                "Corticotropin-releasing hormone (CRH)"
            ],
            "true_referents": [
                "(5alpha)-3-oxocholestan-26-oic acid",
                "(5alpha,25S)-3-oxocholestan-26-oic acid",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "19-Norprogesterone",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "24-Nor-5beta-chol-22-ene-3alpha,12alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,6alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,7alpha,12alpha-triol",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Delta(6)-prednisone",
                "Ethyltestosterone",
                "Hydrocortisone cypionate",
                "Pregn-5-ene-3beta,20alpha-diol",
                "Pregn-5-ene-3beta,20beta-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "fludrocortisone",
                "fludrocortisone acetate",
                "flumethasone",
                "hydrocortisone aceponate",
                "hydrocortisone caproate",
                "mineralocorticoid",
                "norethandrolone",
                "norgesterone",
                "norvinisterone",
                "oxandrolone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "selenium (75Se) tauroselcholic acid",
                "trenbolone"
            ],
            "TP": 6,
            "FP": 18,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Cortisol (COR)",
            "Testosterone (T)",
            "Estradiol (E2)",
            "Progesterone (P4)",
            "Aldosterone (ALD)",
            "Dehydroepiandrosterone (DHEA)",
            "Estriol (E3)",
            "Estrone (E1)",
            "17\u03b1-Hydroxyprogesterone (17\u03b1-OHP)",
            "Corticosterone (CORT)",
            "Prednisone (PRD)",
            "Prednisolone (PRDL)",
            "Dexamethasone (DXM)",
            "Betamethasone (BET)",
            "Triamcinolone (TRIAM)",
            "Hydrocortisone (HC)",
            "Fludrocortisone (FLU)",
            "Desoxycorticosterone (DOC)",
            "11-Deoxycortisol (S)",
            "17\u03b1-Hydroxypregnenolone (17P)",
            "Pregnenolone (P5)",
            "17\u03b1-Hydroxyprogesterone (17-OHP)",
            "Cholesterol (CHOL)",
            "Vitamin D (Vit D)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Corticosterone",
                "Prednisone",
                "Prednisolone",
                "Dexamethasone",
                "Betamethasone",
                "Triamcinolone",
                "Fludrocortisone",
                "Aldosterone",
                "11-Deoxycortisol"
            ],
            "mismatches": [
                "Cortisol (COR)",
                "Testosterone (T)",
                "Estradiol (E2)",
                "Progesterone (P4)",
                "Dehydroepiandrosterone (DHEA)",
                "Estriol (E3)",
                "Estrone (E1)",
                "17\u03b1-Hydroxyprogesterone (17\u03b1-OHP)",
                "Hydrocortisone (HC)",
                "Desoxycorticosterone (DOC)",
                "17\u03b1-Hydroxypregnenolone (17P)",
                "Pregnenolone (P5)",
                "17\u03b1-Hydroxyprogesterone (17-OHP)",
                "Cholesterol (CHOL)",
                "Vitamin D (Vit D)"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycortisol",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "21-Deoxycortisone",
                "24-Nor-5beta-chol-22-ene-3alpha,12alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,6alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,7alpha,12alpha-triol",
                "4-Chloroprogesterone",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Delta(6)-prednisolone",
                "Delta(6)-prednisone",
                "Deoxycorticosterone acetate",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydrocortisone cypionate",
                "Hydroxyprogesterone acetate",
                "Prednisolone acetate",
                "Pregn-5-ene-3beta,20alpha-diol",
                "Pregn-5-ene-3beta,20beta-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "betamethasone",
                "betamethasone butyrate propionate",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "dexamethasone dipropionate",
                "estetrol",
                "fludrocortisone",
                "fludrocortisone acetate",
                "flumethasone",
                "hydrocortisone aceponate",
                "hydrocortisone caproate",
                "mineralocorticoid",
                "norgesterone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "trenbolone",
                "triamcinolone",
                "triamcinolone acetonide"
            ],
            "TP": 9,
            "FP": 15,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Cortisol",
            "Estrogen",
            "Progesterone",
            "Testosterone",
            "Aldosterone",
            "Dexamethasone",
            "Cortisone",
            "Androstenedione",
            "Dihydrotestosterone",
            "Estradiol",
            "Estrone",
            "Dehydroepiandrosterone",
            "Corticosterone",
            "Prednisone",
            "Prednisolone",
            "Fludrocortisone",
            "Spironolactone",
            "Hydrocortisone",
            "Drospirenone",
            "Methylprednisolone",
            "Betamethasone",
            "Triamcinolone",
            "Desoxycorticosterone",
            "Mineralocorticoid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Cortisol",
                "Progesterone",
                "Aldosterone",
                "Dexamethasone",
                "Cortisone",
                "Corticosterone",
                "Prednisone",
                "Prednisolone",
                "Fludrocortisone",
                "Betamethasone",
                "Triamcinolone",
                "Mineralocorticoid"
            ],
            "mismatches": [
                "Estrogen",
                "Testosterone",
                "Androstenedione",
                "Dihydrotestosterone",
                "Estradiol",
                "Estrone",
                "Dehydroepiandrosterone",
                "Spironolactone",
                "Hydrocortisone",
                "Drospirenone",
                "Methylprednisolone",
                "Desoxycorticosterone"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "5alpha-dihydrodeoxycorticosterone",
                "Delta(1)-dihydrotestosterone",
                "Deoxycorticosterone acetate",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "Prednisolone acetate",
                "aldosterone",
                "anabolic androgenic steroid",
                "betamethasone",
                "boldenone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "dexamethasone dipropionate",
                "fludrocortisone",
                "fludrocortisone acetate",
                "flumethasone",
                "hydrocortisone aceponate",
                "methylprednisolone acetate",
                "mineralocorticoid",
                "norgesterone",
                "oxandrolone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "trenbolone",
                "triamcinolone",
                "triamcinolone acetonide"
            ],
            "TP": 12,
            "FP": 12,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Testosterone (Testo)",
            "Estradiol (E2)",
            "Estrone (E1)",
            "Estriol (E3)",
            "Progesterone",
            "Cortisol (Hydrocortisone)",
            "Aldosterone",
            "Prednisone",
            "Prednisolone",
            "Dexamethasone",
            "Cortisone",
            "Androstenedione",
            "Dehydroepiandrosterone (DHEA)",
            "Dehydroepiandrosterone sulfate (DHEA-S)",
            "Pregnenolone",
            "17-Hydroxyprogesterone",
            "Androsterone",
            "Epiandrosterone",
            "11-Deoxycorticosterone",
            "11-Deoxycortisol",
            "Etiocholanolone",
            "Nandrolone (19-Nortestosterone)",
            "Methandrostenolone",
            "Boldenone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone",
                "Cortisol (Hydrocortisone)",
                "Aldosterone",
                "Prednisone",
                "Prednisolone",
                "Dexamethasone",
                "Cortisone",
                "11-Deoxycorticosterone",
                "11-Deoxycortisol",
                "Nandrolone (19-Nortestosterone)",
                "Boldenone"
            ],
            "mismatches": [
                "Testosterone (Testo)",
                "Estradiol (E2)",
                "Estrone (E1)",
                "Estriol (E3)",
                "Androstenedione",
                "Dehydroepiandrosterone (DHEA)",
                "Dehydroepiandrosterone sulfate (DHEA-S)",
                "Pregnenolone",
                "17-Hydroxyprogesterone",
                "Androsterone",
                "Epiandrosterone",
                "Etiocholanolone",
                "Methandrostenolone"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "21-Deoxycortisone",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "Alphaxolone",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "Prednisolone acetate",
                "aldosterone",
                "anabolic androgenic steroid",
                "boldenone",
                "clocortolone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "dexamethasone dipropionate",
                "estetrol",
                "mineralocorticoid",
                "nandrolone",
                "norgesterone",
                "oxandrolone",
                "oxymetholone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "stanozolol",
                "trenbolone"
            ],
            "TP": 11,
            "FP": 13,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Testosterone (T)",
            "Estradiol (E2)",
            "Progesterone (P4)",
            "Cortisol",
            "Aldosterone",
            "Estrone (E1)",
            "Estriol (E3)",
            "Androstenedione",
            "Dehydroepiandrosterone (DHEA)",
            "Corticosterone",
            "11-Deoxycorticosterone (DOC)",
            "17\u03b1-Hydroxyprogesterone",
            "Dihydrotestosterone (DHT)",
            "Pregnenolone",
            "Ecdysone",
            "20-Hydroxyecdysone",
            "Cortisone",
            "11-Deoxycortisol",
            "18-Hydroxycorticosterone",
            "Androsterone",
            "Etiocholanolone",
            "17\u03b2-Estradiol",
            "Estradiol valerate",
            "Medroxyprogesterone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone (P4)",
                "Cortisol",
                "Aldosterone",
                "Corticosterone",
                "11-Deoxycorticosterone (DOC)",
                "Cortisone",
                "11-Deoxycortisol"
            ],
            "mismatches": [
                "Testosterone (T)",
                "Estradiol (E2)",
                "Estrone (E1)",
                "Estriol (E3)",
                "Androstenedione",
                "Dehydroepiandrosterone (DHEA)",
                "17\u03b1-Hydroxyprogesterone",
                "Dihydrotestosterone (DHT)",
                "Pregnenolone",
                "Ecdysone",
                "20-Hydroxyecdysone",
                "18-Hydroxycorticosterone",
                "Androsterone",
                "Etiocholanolone",
                "17\u03b2-Estradiol",
                "Estradiol valerate",
                "Medroxyprogesterone"
            ],
            "true_referents": [
                "1-beta-hydroxymedroxyprogesterone",
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "18-hydroxycortisol",
                "21-Deoxycortisone",
                "3alpha,17alpha-Dihydroxy-5beta-pregnane-11,20-dione",
                "3alpha,6alpha-Dihydroxy-5beta-pregnan-20-one",
                "3beta,14beta-dihydroxy-5beta-pregnane-20-one",
                "4-Chloroprogesterone",
                "5alpha-dihydrodeoxycorticosterone",
                "5alpha-pregnane-3,20-dione",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "Alphaxolone",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Deoxycorticosterone acetate",
                "Diflucortolone valerate",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "aldosterone",
                "anabolic androgenic steroid",
                "clocortolone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisol 17-valerate",
                "cortisone",
                "estetrol",
                "mineralocorticoid",
                "nandrolone",
                "norgesterone",
                "oxandrolone",
                "prednisolone valerate acetate",
                "progesterone",
                "trenbolone"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Testosterone",
            "Estradiol (E2)",
            "Progesterone",
            "Cortisol",
            "Aldosterone",
            "Dehydroepiandrosterone (DHEA)",
            "Androstenedione",
            "Corticosterone",
            "11-Deoxycorticosterone",
            "11-Deoxycortisol",
            "Estrone (E1)",
            "Estriol (E3)",
            "Dihydrotestosterone (DHT)",
            "Pregnenolone",
            "17\u03b1-Hydroxypregnenolone",
            "17\u03b1-Hydroxyprogesterone",
            "Dehydroepiandrosterone sulfate (DHEA-S)",
            "Androstenediol",
            "Androsterone",
            "Epiandrosterone",
            "Allopregnanolone",
            "Tetrahydrocorticosterone",
            "Tetrahydrodeoxycorticosterone",
            "Tetrahydrocortisol"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone",
                "Cortisol",
                "Aldosterone",
                "Corticosterone",
                "11-Deoxycorticosterone",
                "11-Deoxycortisol",
                "Tetrahydrocortisol"
            ],
            "mismatches": [
                "Testosterone",
                "Estradiol (E2)",
                "Dehydroepiandrosterone (DHEA)",
                "Androstenedione",
                "Estrone (E1)",
                "Estriol (E3)",
                "Dihydrotestosterone (DHT)",
                "Pregnenolone",
                "17\u03b1-Hydroxypregnenolone",
                "17\u03b1-Hydroxyprogesterone",
                "Dehydroepiandrosterone sulfate (DHEA-S)",
                "Androstenediol",
                "Androsterone",
                "Epiandrosterone",
                "Allopregnanolone",
                "Tetrahydrocorticosterone",
                "Tetrahydrodeoxycorticosterone"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "21-Deoxycortisone",
                "3alpha,17alpha-dihydroxy-5beta-pregnan-20-one",
                "5a-Tetrahydrocorticosterone",
                "5a-Tetrahydrocortisol",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "aldosterone",
                "anabolic androgenic steroid",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "estetrol",
                "mineralocorticoid",
                "nandrolone",
                "norgesterone",
                "oxandrolone",
                "progesterone",
                "tetrahydrocortisol",
                "trenbolone"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Cholesterol (C27H46O)",
            "Cortisol (C21H30O5)",
            "Aldosterone (C21H28O5)",
            "Testosterone (C19H28O2)",
            "Estradiol (C18H24O2)",
            "Progesterone (C21H30O2)",
            "Vitamin D3 (C27H44O)",
            "Ecdysone (C27H44O7)",
            "Brassinolide (C28H48O6)",
            "Ergocalciferol (C28H44O)",
            "Androstenedione (C19H26O2)",
            "Dehydroepiandrosterone (C19H28O2)",
            "Corticosterone (C21H30O4)",
            "Pregnenolone (C21H32O2)",
            "Calcitriol (C27H44O3)",
            "Diosgenin (C27H42O3)",
            "Ecdysterone (C27H44O7)",
            "Ergosterol (C28H44O)",
            "Stigmasterol (C29H48O)",
            "Campesterol (C28H48O)",
            "Brassinolide (C28H48O6)",
            "Castasterone (C28H48O6)",
            "Teasterone (C19H28O2)",
            "Boldenone (C19H26O2)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aldosterone (C21H28O5)",
                "Progesterone (C21H30O2)",
                "Corticosterone (C21H30O4)",
                "Boldenone (C19H26O2)"
            ],
            "mismatches": [
                "Cholesterol (C27H46O)",
                "Cortisol (C21H30O5)",
                "Testosterone (C19H28O2)",
                "Estradiol (C18H24O2)",
                "Vitamin D3 (C27H44O)",
                "Ecdysone (C27H44O7)",
                "Brassinolide (C28H48O6)",
                "Ergocalciferol (C28H44O)",
                "Androstenedione (C19H26O2)",
                "Dehydroepiandrosterone (C19H28O2)",
                "Pregnenolone (C21H32O2)",
                "Calcitriol (C27H44O3)",
                "Diosgenin (C27H42O3)",
                "Ecdysterone (C27H44O7)",
                "Ergosterol (C28H44O)",
                "Stigmasterol (C29H48O)",
                "Campesterol (C28H48O)",
                "Castasterone (C28H48O6)",
                "Teasterone (C19H28O2)"
            ],
            "true_referents": [
                "(3a,5b,6a)- 17-(acetyloxy)-3-hydroxy-6-methyl- Pregnan-20-one",
                "(5alpha)-3-oxocholestan-26-oic acid",
                "(5alpha,25S)-3-oxocholestan-26-oic acid",
                "11,17-Dihydroxy-3,20-dioxopregn-4-en-21-yl acetate",
                "11alpha,15alpha-Dihydroxypregn-4-ene-3,20-dione",
                "11alpha-Hydroxy-5beta-pregnane-3,20-dione",
                "11beta,21-Dihydroxypregn-4-ene-3,20-dione 21-acetate",
                "11beta-Hydroxy-6alpha,11-dimethylpregn-4-ene-3,20-dione",
                "12alpha-Bromo-11beta-hydroxypregn-4-ene-3,20-dione",
                "12beta-hydroxy-24-norcholesta-1,4,22E-trien-3-one",
                "16-a-Hydroxypregnenolone",
                "16-alpha,17-Epoxypregn-4-ene-3,20-dione",
                "16alpha,17-Dihydroxypregn-4-ene-3,20-dione cyclic acetal with 2-furyl methyl ketone",
                "16alpha,17-Isopropylidenedioxy-6alpha-methylprogesterone",
                "17,20,21-trihydroxypregn-1-ene-3,11-dione",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "18-hydroxypregna-1,4,20-trien-3-one",
                "18-oxocortisol",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "21-Deoxycortisone",
                "22,23-epoxy-5beta-campestan-3beta-ol",
                "24-Nor-5beta-chol-22-ene-3alpha,6alpha-diol",
                "3alpha,17alpha-Dihydroxy-5beta-pregnane-11,20-dione",
                "3beta,14beta-dihydroxy-5beta-pregnane-20-one",
                "5alpha-dihydrodeoxycorticosterone",
                "6alpha-Chloro-17-acetoxyprogesterone",
                "9-Bromo-11beta-hydroxy-16alpha-methylpregn-4-ene-3,20-dione",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Ethyltestosterone",
                "Pregnane-3,3-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "boldenone",
                "corticosteroid hormone",
                "corticosterone",
                "progesterone"
            ],
            "TP": 4,
            "FP": 19,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Testosterone (T)",
            "Estradiol (E2)",
            "Progesterone (P4)",
            "Cortisol (CORT)",
            "Aldosterone (ALDO)",
            "Cholesterol (CHOL)",
            "Dehydroepiandrosterone (DHEA)",
            "Pregnenolone (PREG)",
            "Corticosterone (CORT)",
            "Androstenedione (A4)",
            "Dihydrotestosterone (DHT)",
            "Estriol (E3)",
            "Estrone (E1)",
            "Hydrocortisone (HCORT)",
            "Dexamethasone (DEX)",
            "Prednisone (PRED)",
            "Prednisolone (PREDL)",
            "Fludrocortisone (FLUDC)",
            "Spironolactone (SPIRO)",
            "Etiocholanolone (ETIO)",
            "Androsterone (ANDRO)",
            "Allopregnanolone (ALLO)",
            "Pregnanolone (PREG-OL)",
            "Hydroxyprogesterone (17OHP)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone (P4)",
                "Corticosterone (CORT)",
                "Aldosterone (ALDO)",
                "Dexamethasone (DEX)",
                "Prednisone (PRED)",
                "Prednisolone (PREDL)",
                "Fludrocortisone (FLUDC)"
            ],
            "mismatches": [
                "Testosterone (T)",
                "Estradiol (E2)",
                "Cortisol (CORT)",
                "Cholesterol (CHOL)",
                "Dehydroepiandrosterone (DHEA)",
                "Pregnenolone (PREG)",
                "Androstenedione (A4)",
                "Dihydrotestosterone (DHT)",
                "Estriol (E3)",
                "Estrone (E1)",
                "Hydrocortisone (HCORT)",
                "Spironolactone (SPIRO)",
                "Etiocholanolone (ETIO)",
                "Androsterone (ANDRO)",
                "Allopregnanolone (ALLO)",
                "Pregnanolone (PREG-OL)",
                "Hydroxyprogesterone (17OHP)"
            ],
            "true_referents": [
                "15alpha-Hydroxyprogesterone",
                "16-Hydroxyprogesterone",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "24-Nor-5beta-chol-22-ene-3alpha,12alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,6alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,7alpha,12alpha-triol",
                "3alpha,12alpha-Dihydroxy-5beta-pregnan-20-one",
                "4-Chloroprogesterone",
                "5alpha-Pregnan-20alpha-ol-3-one",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "Alphaxolone",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Delta(6)-prednisolone",
                "Delta(6)-prednisone",
                "Dexamethasone acetate",
                "Ethyltestosterone",
                "Hydrocortisone cypionate",
                "Hydroxyprogesterone acetate",
                "Prednisolone acetate",
                "Pregn-5-ene-3beta,20alpha-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "clocortolone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "dexamethasone dipropionate",
                "estetrol",
                "fludrocortisone",
                "fludrocortisone acetate",
                "flumethasone",
                "hydrocortisone aceponate",
                "hydrocortisone caproate",
                "mineralocorticoid",
                "norethandrolone",
                "norgesterone",
                "oxandrolone",
                "prednisolone",
                "prednisone",
                "progesterone",
                "trenbolone"
            ],
            "TP": 7,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Estradiol (E2)",
            "Testosterone",
            "Progesterone",
            "Cortisol",
            "Aldosterone",
            "Androstenedione",
            "Dihydrotestosterone (DHT)",
            "Estriol",
            "Pregnenolone",
            "Dehydroepiandrosterone (DHEA)",
            "Cholesterol",
            "Pregnanediol",
            "Androstenone",
            "Estriol",
            "Pregnanolone",
            "Dehydroisoandrosterone (DHEA-S)",
            "Cortisone",
            "Allopregnanolone",
            "Epitestosterone",
            "Pregnanetriol",
            "Dehydroandrosterone (DHA)",
            "Pregnanolone",
            "Cortisol",
            "Androstenedione",
            "Estrone"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Progesterone",
                "Cortisol",
                "Aldosterone",
                "Pregnanediol",
                "Cortisone"
            ],
            "mismatches": [
                "Estradiol (E2)",
                "Testosterone",
                "Androstenedione",
                "Dihydrotestosterone (DHT)",
                "Estriol",
                "Pregnenolone",
                "Dehydroepiandrosterone (DHEA)",
                "Cholesterol",
                "Androstenone",
                "Pregnanolone",
                "Dehydroisoandrosterone (DHEA-S)",
                "Allopregnanolone",
                "Epitestosterone",
                "Pregnanetriol",
                "Dehydroandrosterone (DHA)",
                "Estrone"
            ],
            "true_referents": [
                "15beta-hydroxycyproterone acetate",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxyandrostan-1,3-dione",
                "24-Nor-5beta-chol-22-ene-3alpha,12alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,7alpha,12alpha-triol",
                "3a,20b-Pregnanediol",
                "3alpha,17alpha-Dihydroxy-5beta-pregnane-11,20-dione",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Ethyltestosterone",
                "Hydroxyprogesterone acetate",
                "Pregnane-3,3-diol",
                "Pregnanediol",
                "aldosterone",
                "anabolic androgenic steroid",
                "clocortolone",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "mineralocorticoid",
                "nandrolone",
                "norethandrolone",
                "norgesterone",
                "prednisolone",
                "progesterone",
                "trenbolone"
            ],
            "TP": 5,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            "Aldosterone (ALD)",
            "Androstenedione (AND)",
            "Androsterone (ADT)",
            "Cholecalciferol (Vitamin D3)",
            "Cholesterol",
            "Corticosterone (B)",
            "Cortisone (E)",
            "Dehydroepiandrosterone (DHEA)",
            "Deoxycorticosterone (DOC)",
            "Dihydrotestosterone (DHT)",
            "Estradiol (E2)",
            "Estrone (E1)",
            "Estriol (E3)",
            "Fludrocortisone (F)",
            "Glucocorticoids",
            "Pregnenolone (P5)",
            "Progesterone (P4)",
            "Testosterone (T)",
            "Triamcinolone (T)",
            "Aldosterone (ALD)",
            "11-Deoxycortisol (CDF)",
            "Cortisol (F)",
            "11-Deoxycorticosterone (DOC)",
            "Dihydroandrosterone (DHAD)",
            "Androstanedione (5-Dione)",
            "Androstenetriol (AT)",
            "Pregnanetriol (PT)",
            "Pregnanedione (PD)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aldosterone (ALD)",
                "Corticosterone (B)",
                "Cortisone (E)",
                "Deoxycorticosterone (DOC)",
                "Fludrocortisone (F)",
                "Glucocorticoids",
                "Progesterone (P4)",
                "Triamcinolone (T)",
                "11-Deoxycortisol (CDF)",
                "Cortisol (F)",
                "11-Deoxycorticosterone (DOC)"
            ],
            "mismatches": [
                "Androstenedione (AND)",
                "Androsterone (ADT)",
                "Cholecalciferol (Vitamin D3)",
                "Cholesterol",
                "Dehydroepiandrosterone (DHEA)",
                "Dihydrotestosterone (DHT)",
                "Estradiol (E2)",
                "Estrone (E1)",
                "Estriol (E3)",
                "Pregnenolone (P5)",
                "Testosterone (T)",
                "Dihydroandrosterone (DHAD)",
                "Androstanedione (5-Dione)",
                "Androstenetriol (AT)",
                "Pregnanetriol (PT)",
                "Pregnanedione (PD)"
            ],
            "true_referents": [
                "11-deoxycorticosterone",
                "11-deoxycorticosterone pivalate",
                "11-deoxycortisol",
                "16-a-Hydroxypregnenolone",
                "17beta-hydroxy-17-methylestra-4,9,11-trien-3-one",
                "17beta-hydroxyandrostan-1,3-dione",
                "1alpha,2beta,25-trihydroxy vitamin D3",
                "21-Deoxycortisone",
                "24-Nor-5beta-chol-22-ene-3alpha,12alpha-diol",
                "24-Nor-5beta-chol-22-ene-3alpha,7alpha,12alpha-triol",
                "4-Chloroprogesterone",
                "5alpha-dihydrodeoxycorticosterone",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol",
                "5beta-Pregnane-3alpha,17alpha,20alpha-triol-11-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Deoxycorticosterone acetate",
                "Ethyltestosterone",
                "Pregn-5-ene-3beta,20alpha-diol",
                "Pregn-5-ene-3beta,20beta-diol",
                "aldosterone",
                "anabolic androgenic steroid",
                "corticosteroid hormone",
                "corticosterone",
                "cortisol",
                "cortisone",
                "estetrol",
                "fludrocortisone",
                "fludrocortisone acetate",
                "flumethasone",
                "glucocorticoid",
                "mineralocorticoid",
                "norgesterone",
                "oxandrolone",
                "progesterone",
                "trenbolone",
                "triamcinolone",
                "triamcinolone acetonide"
            ],
            "TP": 11,
            "FP": 16,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "steroid hormone",
        "domain": "biology",
        "response": [
            {
                "Referent": "corticosteroids",
                "Canonical name": "corticosteroids"
            },
            {
                "Referent": "testosterone",
                "Canonical name": "testosterone"
            },
            {
                "Referent": "progesterone",
                "Canonical name": "progesterone"
            },
            {
                "Referent": "estrogen",
                "Canonical name": "estrogen"
            },
            {
                "Referent": "glucocorticoids",
                "Canonical name": "glucocorticoids"
            },
            {
                "Referent": "corticosteroid",
                "Canonical name": "corticosteroid"
            },
            {
                "Referent": "androgen",
                "Canonical name": "androgen"
            },
            {
                "Referent": "corticotropin",
                "Canonical name": "corticotropin"
            },
            {
                "Referent": "glucocorticoid",
                "Canonical name": "glucocorticoid"
            },
            {
                "Referent": "glucocorticoid hormone",
                "Canonical name": "glucocorticoid hormone"
            },
            {
                "Referent": "glucocorticoid receptor",
                "Canonical name": "glucocorticoid receptor"
            },
            {
                "Referent": "glucocorticoid receptor agonist",
                "Canonical name": "glucocorticoid receptor agonist"
            },
            {
                "Referent": "glucocorticoid receptor antagonist",
                "Canonical name": "glucocorticoid receptor antagonist"
            },
            {
                "Referent": "glucocorticoid receptor agonist",
                "Canonical name": "glucocorticoid receptor agonist"
            },
            {
                "Referent": "glucocorticoid receptor antagonist",
                "Canonical name": "glucocorticoid receptor antagonist"
            },
            {
                "Referent": "glucocorticoid receptor",
                "Canonical name": "glucocorticoid receptor"
            },
            {
                "Referent": "glucocorticoid receptor agonist",
                "Canonical name": "glucocorticoid receptor agonist"
            },
            {
                "Referent": "glucocorticoid receptor antagonist",
                "Canonical name": "glucocorticoid receptor antagonist"
            },
            {
                "Referent": "glucocorticoid receptor",
                "Canonical name": "glucocorticoid receptor"
            },
            {
                "Referent": "glucocorticoid receptor agonist",
                "Canonical name": "glucocorticoid receptor agonist"
            },
            {
                "Referent": "glucocorticoid receptor antagonist",
                "Canonical name": "glucocorticoid receptor antagonist"
            },
            {
                "Referent": "glucocorticoid receptor",
                "Canonical name": "glucocorticoid receptor"
            },
            {
                "Referent": "glucocorticoid receptor agonist",
                "Canonical name": "glucocorticoid receptor agonist"
            },
            {
                "Referent": "glucocorticoid receptor antagonist",
                "Canonical name": "glucocorticoid receptor antagonist"
            },
            {
                "Referent": "glucocorticoid receptor",
                "Canonical name": "glucocorticoid receptor"
            },
            {
                "Referent": "glucocorticoid receptor agonist",
                "Canonical name": "glucocorticoid receptor agonist"
            },
            {
                "Referent": "glucocorticoid receptor antagonist",
                "Canonical name": "glucocorticoid receptor antagonist"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "progesterone",
                "glucocorticoid"
            ],
            "mismatches": [
                "corticosteroids",
                "testosterone",
                "estrogen",
                "corticosteroid",
                "androgen",
                "corticotropin",
                "glucocorticoid hormone",
                "glucocorticoid receptor",
                "glucocorticoid receptor agonist",
                "glucocorticoid receptor antagonist"
            ],
            "true_referents": [
                "21-Deoxycortisone",
                "3alpha,11beta,17alpha-Trihydroxy-5beta-pregnan-20-one",
                "3alpha,12alpha-Dihydroxy-5beta-pregnan-20-one",
                "3alpha,6alpha-Dihydroxy-5beta-pregnan-20-one",
                "C21-steroid hormone",
                "Delta(1)-dihydrotestosterone",
                "Ethyltestosterone",
                "anabolic androgenic steroid",
                "corticosteroid hormone",
                "cortisol",
                "cortisone",
                "dexamethasone",
                "glucocorticoid",
                "prednisone",
                "progesterone"
            ],
            "TP": 2,
            "FP": 10,
            "FN": 0
        }
    }
]