[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Phosphoserine",
            "Phosphothreonine",
            "Phosphotyrosine",
            "Homocysteic acid",
            "Selenocysteine",
            "5-Hydroxytryptophan",
            "3-Methylhistidine",
            "Homoserine",
            "Homoglutamic acid",
            "Dehydroalanine",
            "Dehydrobutyrine",
            "Norvaline",
            "Norleucine",
            "Penicillamine",
            "Pyrrolysine",
            "Thioctic acid",
            "Thioctic acid (alpha-lipoic acid)",
            "Taurine",
            "Cysteic acid",
            "Homocysteine",
            "Homoserine lactone",
            "Sulfadiazine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Phosphoserine",
                "Phosphothreonine",
                "Phosphotyrosine",
                "Homocysteic acid",
                "Selenocysteine",
                "5-Hydroxytryptophan",
                "3-Methylhistidine",
                "Homoserine",
                "Homoglutamic acid",
                "Dehydroalanine",
                "Dehydrobutyrine",
                "Norvaline",
                "Norleucine",
                "Penicillamine",
                "Pyrrolysine",
                "Thioctic acid",
                "Thioctic acid (alpha-lipoic acid)",
                "Taurine",
                "Cysteic acid",
                "Homocysteine",
                "Homoserine lactone",
                "Sulfadiazine"
            ],
            "mismatches": [],
            "true_referents": [
                "3-Methylhistidine",
                "5-Hydroxytryptophan",
                "Aspartic acid (Asp)",
                "Cysteic acid",
                "Dehydroalanine",
                "Dehydrobutyrine",
                "Glutamic acid (Glu)",
                "Homocysteic acid",
                "Homocysteine",
                "Homoglutamic acid",
                "Homoserine",
                "Homoserine lactone",
                "Norleucine",
                "Norvaline",
                "Penicillamine",
                "Phosphoserine",
                "Phosphothreonine",
                "Phosphotyrosine",
                "Pyrrolysine",
                "Selenocysteine",
                "Sulfadiazine",
                "Taurine",
                "Thioctic acid",
                "Thioctic acid (alpha-lipoic acid)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp, D)",
            "Glutamic acid (Glu, E)",
            "Asparagine (Asn, N)",
            "Glutamine (Gln, Q)",
            "Cysteine (Cys, C)",
            "Tyrosine (Tyr, Y)",
            "Histidine (His, H)",
            "Phenylalanine (Phe, F)",
            "Tryptophan (Trp, W)",
            "Proline (Pro, P)",
            "Valine (Val, V)",
            "Leucine (Leu, L)",
            "Isoleucine (Ile, I)",
            "Methionine (Met, M)",
            "Lysine (Lys, K)",
            "Arginine (Arg, R)",
            "Alanine (Ala, A)",
            "Serine (Ser, S)",
            "Threonine (Thr, T)",
            "Glycine (Gly, G)",
            "Cystine (Cys2, C)",
            "Selenocysteine (Sec, U)",
            "Pyroglutamic acid (pGlu, pE)",
            "N-Methylglutamic acid (NMeGlu)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp, D)",
                "Glutamic acid (Glu, E)",
                "Asparagine (Asn, N)",
                "Glutamine (Gln, Q)",
                "Cysteine (Cys, C)",
                "Tyrosine (Tyr, Y)",
                "Histidine (His, H)",
                "Phenylalanine (Phe, F)",
                "Tryptophan (Trp, W)",
                "Proline (Pro, P)",
                "Valine (Val, V)",
                "Leucine (Leu, L)",
                "Isoleucine (Ile, I)",
                "Methionine (Met, M)",
                "Lysine (Lys, K)",
                "Arginine (Arg, R)",
                "Alanine (Ala, A)",
                "Serine (Ser, S)",
                "Threonine (Thr, T)",
                "Glycine (Gly, G)",
                "Cystine (Cys2, C)",
                "Selenocysteine (Sec, U)",
                "Pyroglutamic acid (pGlu, pE)",
                "N-Methylglutamic acid (NMeGlu)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala, A)",
                "Arginine (Arg, R)",
                "Asparagine (Asn, N)",
                "Aspartic acid (Asp, D)",
                "Cysteine (Cys, C)",
                "Cystine (Cys2, C)",
                "Glutamic acid (Glu, E)",
                "Glutamine (Gln, Q)",
                "Glycine (Gly, G)",
                "Histidine (His, H)",
                "Isoleucine (Ile, I)",
                "Leucine (Leu, L)",
                "Lysine (Lys, K)",
                "Methionine (Met, M)",
                "N-Methylglutamic acid (NMeGlu)",
                "Phenylalanine (Phe, F)",
                "Proline (Pro, P)",
                "Pyroglutamic acid (pGlu, pE)",
                "Selenocysteine (Sec, U)",
                "Serine (Ser, S)",
                "Threonine (Thr, T)",
                "Tryptophan (Trp, W)",
                "Tyrosine (Tyr, Y)",
                "Valine (Val, V)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp, D)",
            "Glutamic acid (Glu, E)",
            "Aspartate",
            "Glutamate",
            "D-Aspartic acid",
            "D-Glutamic acid",
            "Cysteine (Cys, C)",
            "Tyrosine (Tyr, Y)",
            "Histidine (His, H)",
            "Acidic amino acid residue in proteins",
            "Aspartate anion",
            "Glutamate anion",
            "N-Acetylaspartic acid",
            "N-Acetylglutamic acid",
            "N-Methylaspartic acid",
            "N-Methylglutamic acid",
            "\u03b1-Aminoadipic acid",
            "\u03b1-Aminopimelic acid",
            "\u03b3-Aminobutyric acid (GABA)",
            "Homoglutamic acid",
            "Homocysteic acid",
            "Iminodipropionic acid",
            "Sulfocysteine",
            "Thiocysteine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp, D)",
                "Glutamic acid (Glu, E)",
                "Aspartate",
                "Glutamate",
                "D-Aspartic acid",
                "D-Glutamic acid",
                "Cysteine (Cys, C)",
                "Tyrosine (Tyr, Y)",
                "Histidine (His, H)",
                "Acidic amino acid residue in proteins",
                "Aspartate anion",
                "Glutamate anion",
                "N-Acetylaspartic acid",
                "N-Acetylglutamic acid",
                "N-Methylaspartic acid",
                "N-Methylglutamic acid",
                "\u03b1-Aminoadipic acid",
                "\u03b1-Aminopimelic acid",
                "\u03b3-Aminobutyric acid (GABA)",
                "Homoglutamic acid",
                "Homocysteic acid",
                "Iminodipropionic acid",
                "Sulfocysteine",
                "Thiocysteine"
            ],
            "mismatches": [],
            "true_referents": [
                "Acidic amino acid residue in proteins",
                "Aspartate",
                "Aspartate anion",
                "Aspartic acid (Asp, D)",
                "Cysteine (Cys, C)",
                "D-Aspartic acid",
                "D-Glutamic acid",
                "Glutamate",
                "Glutamate anion",
                "Glutamic acid (Glu, E)",
                "Histidine (His, H)",
                "Homocysteic acid",
                "Homoglutamic acid",
                "Iminodipropionic acid",
                "N-Acetylaspartic acid",
                "N-Acetylglutamic acid",
                "N-Methylaspartic acid",
                "N-Methylglutamic acid",
                "Sulfocysteine",
                "Thiocysteine",
                "Tyrosine (Tyr, Y)",
                "\u03b1-Aminoadipic acid",
                "\u03b1-Aminopimelic acid",
                "\u03b3-Aminobutyric acid (GABA)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Aspartate",
            "Aspartic acid residue in a protein",
            "Aspartyl tRNA synthetase substrate",
            "N-formylaspartate",
            "Aspartyl-phosphate",
            "O-Aspartyl-homoserine",
            "Aspartate aminotransferase substrate",
            "Fumarate (product of aspartate degradation)",
            "Oxaloacetate (intermediate in aspartate synthesis)",
            "L-Aspartic acid \u03b1-ester",
            "D-Aspartic acid",
            "Isoaspartic acid",
            "Glutamic acid (Glu)",
            "Glutamate",
            "Glutamic acid residue in a protein",
            "Glutamyl tRNA synthetase substrate",
            "\u03b1-Ketoglutarate (intermediate in glutamate metabolism)",
            "Glutathione (containing glutamate)",
            "Pyroglutamic acid",
            "Glutamyl-peptide",
            "Glutamate dehydrogenase substrate",
            "Glutamine (precursor to glutamate)",
            "5-Glutamylpolypeptides"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Aspartate",
                "Aspartic acid residue in a protein",
                "Aspartyl tRNA synthetase substrate",
                "N-formylaspartate",
                "Aspartyl-phosphate",
                "O-Aspartyl-homoserine",
                "Aspartate aminotransferase substrate",
                "Fumarate (product of aspartate degradation)",
                "Oxaloacetate (intermediate in aspartate synthesis)",
                "L-Aspartic acid \u03b1-ester",
                "D-Aspartic acid",
                "Isoaspartic acid",
                "Glutamic acid (Glu)",
                "Glutamate",
                "Glutamic acid residue in a protein",
                "Glutamyl tRNA synthetase substrate",
                "\u03b1-Ketoglutarate (intermediate in glutamate metabolism)",
                "Glutathione (containing glutamate)",
                "Pyroglutamic acid",
                "Glutamyl-peptide",
                "Glutamate dehydrogenase substrate",
                "Glutamine (precursor to glutamate)",
                "5-Glutamylpolypeptides"
            ],
            "mismatches": [],
            "true_referents": [
                "5-Glutamylpolypeptides",
                "Aspartate",
                "Aspartate aminotransferase substrate",
                "Aspartic acid (Asp)",
                "Aspartic acid residue in a protein",
                "Aspartyl tRNA synthetase substrate",
                "Aspartyl-phosphate",
                "D-Aspartic acid",
                "Fumarate (product of aspartate degradation)",
                "Glutamate",
                "Glutamate dehydrogenase substrate",
                "Glutamic acid (Glu)",
                "Glutamic acid residue in a protein",
                "Glutamine (precursor to glutamate)",
                "Glutamyl tRNA synthetase substrate",
                "Glutamyl-peptide",
                "Glutathione (containing glutamate)",
                "Isoaspartic acid",
                "L-Aspartic acid \u03b1-ester",
                "N-formylaspartate",
                "O-Aspartyl-homoserine",
                "Oxaloacetate (intermediate in aspartate synthesis)",
                "Pyroglutamic acid",
                "\u03b1-Ketoglutarate (intermediate in glutamate metabolism)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Histidine (His)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Methionine (Met)",
            "Proline (Pro)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Phenylalanine (Phe)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Valine (Val)",
            "Tryptophan (Trp)",
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Glutathione (GSH)",
            "Lactic acid (C3H6O3)",
            "Citric acid (C6H8O7)",
            "Acetic acid (C2H4O2)",
            "Formic acid (HCOOH)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Histidine (His)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Methionine (Met)",
                "Proline (Pro)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Phenylalanine (Phe)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Valine (Val)",
                "Tryptophan (Trp)",
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Glutathione (GSH)",
                "Lactic acid (C3H6O3)",
                "Citric acid (C6H8O7)",
                "Acetic acid (C2H4O2)"
            ],
            "mismatches": [
                "Formic acid (HCOOH)"
            ],
            "true_referents": [
                "Acetic acid (C2H4O2)",
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Citric acid (C6H8O7)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glutathione (GSH)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Lactic acid (C3H6O3)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 24,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Glutamic Acid (Glu)",
            "Aspartic Acid (Asp)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glutamic Acid (Glu)",
                "Aspartic Acid (Asp)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aspartic Acid (Asp)",
                "Glutamic Acid (Glu)"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Aspartate (Asp-)",
            "Glutamate (Glu-)",
            "Isoaspartate (isoAsp)",
            "Homocysteic acid (Hcys)",
            "Homocysteine (Hcys-)",
            "Phosphoserine (pSer)",
            "Phosphothreonine (pThr)",
            "Phosphotyrosine (pTyr)",
            "3-Phosphohistidine (3pHis)",
            "4-Phosphohistidine (4pHis)",
            "5-Phosphohistidine (5pHis)",
            "6-Phosphohistidine (6pHis)",
            "7-Phosphohistidine (7pHis)",
            "8-Phosphohistidine (8pHis)",
            "9-Phosphohistidine (9pHis)",
            "10-Phosphohistidine (10pHis)",
            "11-Phosphohistidine (11pHis)",
            "12-Phosphohistidine (12pHis)",
            "13-Phosphohistidine (13pHis)",
            "14-Phosphohistidine (14pHis)",
            "15-Phosphohistidine (15pHis)",
            "16-Phosphohistidine (16pHis)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Aspartate (Asp-)",
                "Glutamate (Glu-)",
                "Isoaspartate (isoAsp)",
                "Homocysteic acid (Hcys)",
                "Homocysteine (Hcys-)",
                "Phosphoserine (pSer)",
                "Phosphothreonine (pThr)",
                "Phosphotyrosine (pTyr)",
                "3-Phosphohistidine (3pHis)",
                "4-Phosphohistidine (4pHis)",
                "5-Phosphohistidine (5pHis)",
                "6-Phosphohistidine (6pHis)",
                "7-Phosphohistidine (7pHis)",
                "8-Phosphohistidine (8pHis)",
                "9-Phosphohistidine (9pHis)",
                "10-Phosphohistidine (10pHis)",
                "11-Phosphohistidine (11pHis)",
                "12-Phosphohistidine (12pHis)",
                "13-Phosphohistidine (13pHis)",
                "14-Phosphohistidine (14pHis)",
                "15-Phosphohistidine (15pHis)",
                "16-Phosphohistidine (16pHis)"
            ],
            "mismatches": [],
            "true_referents": [
                "10-Phosphohistidine (10pHis)",
                "11-Phosphohistidine (11pHis)",
                "12-Phosphohistidine (12pHis)",
                "13-Phosphohistidine (13pHis)",
                "14-Phosphohistidine (14pHis)",
                "15-Phosphohistidine (15pHis)",
                "16-Phosphohistidine (16pHis)",
                "3-Phosphohistidine (3pHis)",
                "4-Phosphohistidine (4pHis)",
                "5-Phosphohistidine (5pHis)",
                "6-Phosphohistidine (6pHis)",
                "7-Phosphohistidine (7pHis)",
                "8-Phosphohistidine (8pHis)",
                "9-Phosphohistidine (9pHis)",
                "Aspartate (Asp-)",
                "Aspartic acid (Asp)",
                "Glutamate (Glu-)",
                "Glutamic acid (Glu)",
                "Homocysteic acid (Hcys)",
                "Homocysteine (Hcys-)",
                "Isoaspartate (isoAsp)",
                "Phosphoserine (pSer)",
                "Phosphothreonine (pThr)",
                "Phosphotyrosine (pTyr)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp, D)",
            "Glutamic acid (Glu, E)",
            "Phosphoserine (pSer)",
            "Phosphothreonine (pThr)",
            "Gamma-carboxyglutamic acid (Gla)",
            "Sulfoglutamic acid",
            "Sulfodiaminoglutaric acid",
            "3-Methylaspartic acid",
            "4-Methylglutamic acid",
            "3,4-Dehydroaspartic acid",
            "Selenoaspartic acid",
            "Phosphoaspartic acid",
            "Phosphoglutamic acid",
            "3-Phosphoglutamic acid",
            "Beta-Carboxyaspartic acid",
            "Gamma-Aminobutyric acid",
            "Phosphorylated aspartate",
            "Phosphorylated glutamate",
            "Hydroxylated aspartic acid",
            "Hydroxylated glutamic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp, D)",
                "Glutamic acid (Glu, E)",
                "Phosphoserine (pSer)",
                "Phosphothreonine (pThr)",
                "Gamma-carboxyglutamic acid (Gla)",
                "Sulfoglutamic acid",
                "Sulfodiaminoglutaric acid",
                "3-Methylaspartic acid",
                "4-Methylglutamic acid",
                "3,4-Dehydroaspartic acid",
                "Selenoaspartic acid",
                "Phosphoaspartic acid",
                "Phosphoglutamic acid",
                "3-Phosphoglutamic acid",
                "Beta-Carboxyaspartic acid",
                "Gamma-Aminobutyric acid",
                "Phosphorylated aspartate",
                "Phosphorylated glutamate",
                "Hydroxylated aspartic acid",
                "Hydroxylated glutamic acid"
            ],
            "mismatches": [],
            "true_referents": [
                "3,4-Dehydroaspartic acid",
                "3-Methylaspartic acid",
                "3-Phosphoglutamic acid",
                "4-Methylglutamic acid",
                "Aspartic acid (Asp, D)",
                "Beta-Carboxyaspartic acid",
                "Gamma-Aminobutyric acid",
                "Gamma-carboxyglutamic acid (Gla)",
                "Glutamic acid (Glu, E)",
                "Hydroxylated aspartic acid",
                "Hydroxylated glutamic acid",
                "Phosphoaspartic acid",
                "Phosphoglutamic acid",
                "Phosphorylated aspartate",
                "Phosphorylated glutamate",
                "Phosphoserine (pSer)",
                "Phosphothreonine (pThr)",
                "Selenoaspartic acid",
                "Sulfodiaminoglutaric acid",
                "Sulfoglutamic acid"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp, D)",
            "Glutamic acid (Glu, E)",
            "Phosphoserine",
            "Phosphothreonine",
            "Phosphotyrosine",
            "\u03b3-Carboxyglutamic acid",
            "Cysteic acid",
            "Homocysteic acid",
            "2-Aminoadipic acid",
            "3-Sulfoalanine",
            "O-Sulfotyrosine",
            "Pyroglutamic acid",
            "N-Methyl-D-aspartic acid",
            "\u03b1-Aminoadipic acid",
            "\u03b2-Hydroxyaspartic acid",
            "Cysteine sulfinic acid",
            "Selenocysteine (when oxidized)",
            "3-Nitrotyrosine",
            "4-Carboxyglutamic acid",
            "5-Hydroxy-2-aminovaleric acid",
            "2,3-Diaminopropanoic acid (when carboxylated)",
            "4-Hydroxyproline (when carboxylated)",
            "Homoserine (when phosphorylated)",
            "Citrulline (when carboxylated)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp, D)",
                "Glutamic acid (Glu, E)",
                "Phosphoserine",
                "Phosphothreonine",
                "Phosphotyrosine",
                "\u03b3-Carboxyglutamic acid",
                "Cysteic acid",
                "Homocysteic acid",
                "2-Aminoadipic acid",
                "3-Sulfoalanine",
                "O-Sulfotyrosine",
                "Pyroglutamic acid",
                "N-Methyl-D-aspartic acid",
                "\u03b1-Aminoadipic acid",
                "\u03b2-Hydroxyaspartic acid",
                "Cysteine sulfinic acid",
                "Selenocysteine (when oxidized)",
                "3-Nitrotyrosine",
                "4-Carboxyglutamic acid",
                "5-Hydroxy-2-aminovaleric acid",
                "2,3-Diaminopropanoic acid (when carboxylated)",
                "4-Hydroxyproline (when carboxylated)",
                "Homoserine (when phosphorylated)",
                "Citrulline (when carboxylated)"
            ],
            "mismatches": [],
            "true_referents": [
                "2,3-Diaminopropanoic acid (when carboxylated)",
                "2-Aminoadipic acid",
                "3-Nitrotyrosine",
                "3-Sulfoalanine",
                "4-Carboxyglutamic acid",
                "4-Hydroxyproline (when carboxylated)",
                "5-Hydroxy-2-aminovaleric acid",
                "Aspartic acid (Asp, D)",
                "Citrulline (when carboxylated)",
                "Cysteic acid",
                "Cysteine sulfinic acid",
                "Glutamic acid (Glu, E)",
                "Homocysteic acid",
                "Homoserine (when phosphorylated)",
                "N-Methyl-D-aspartic acid",
                "O-Sulfotyrosine",
                "Phosphoserine",
                "Phosphothreonine",
                "Phosphotyrosine",
                "Pyroglutamic acid",
                "Selenocysteine (when oxidized)",
                "\u03b1-Aminoadipic acid",
                "\u03b2-Hydroxyaspartic acid",
                "\u03b3-Carboxyglutamic acid"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Cysteic acid",
            "Homocysteic acid",
            "3-Sulfinoalanine (Cys-SO2H)",
            "3-Sulfino-\u03b2-alanine",
            "2-Aminoadipic acid",
            "\u03b1-Aminoadipic acid",
            "3-Hydroxyaspartic acid",
            "4-Hydroxyglutamic acid",
            "N-Methylaspartic acid",
            "N-Methylglutamic acid",
            "\u03b2-Methylaspartic acid",
            "\u03b3-Carboxyglutamic acid (Gla)",
            "Phosphoaspartic acid",
            "Phosphohomoserine",
            "Phosphoserine (Sep)",
            "Phosphothreonine (Tpo)",
            "Phosphotyrosine (Ptr)",
            "S-Sulfo-L-cysteine",
            "3-Sulfinoalanine",
            "2-Aminomalonic acid",
            "Isoglutamic acid",
            "Pyrrolysine (Pyl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Cysteic acid",
                "Homocysteic acid",
                "3-Sulfinoalanine (Cys-SO2H)",
                "3-Sulfino-\u03b2-alanine",
                "2-Aminoadipic acid",
                "\u03b1-Aminoadipic acid",
                "3-Hydroxyaspartic acid",
                "4-Hydroxyglutamic acid",
                "N-Methylaspartic acid",
                "N-Methylglutamic acid",
                "\u03b2-Methylaspartic acid",
                "\u03b3-Carboxyglutamic acid (Gla)",
                "Phosphoaspartic acid",
                "Phosphohomoserine",
                "Phosphoserine (Sep)",
                "Phosphothreonine (Tpo)",
                "Phosphotyrosine (Ptr)",
                "S-Sulfo-L-cysteine",
                "3-Sulfinoalanine",
                "2-Aminomalonic acid",
                "Isoglutamic acid",
                "Pyrrolysine (Pyl)"
            ],
            "mismatches": [],
            "true_referents": [
                "2-Aminoadipic acid",
                "2-Aminomalonic acid",
                "3-Hydroxyaspartic acid",
                "3-Sulfino-\u03b2-alanine",
                "3-Sulfinoalanine",
                "3-Sulfinoalanine (Cys-SO2H)",
                "4-Hydroxyglutamic acid",
                "Aspartic acid (Asp)",
                "Cysteic acid",
                "Glutamic acid (Glu)",
                "Homocysteic acid",
                "Isoglutamic acid",
                "N-Methylaspartic acid",
                "N-Methylglutamic acid",
                "Phosphoaspartic acid",
                "Phosphohomoserine",
                "Phosphoserine (Sep)",
                "Phosphothreonine (Tpo)",
                "Phosphotyrosine (Ptr)",
                "Pyrrolysine (Pyl)",
                "S-Sulfo-L-cysteine",
                "\u03b1-Aminoadipic acid",
                "\u03b2-Methylaspartic acid",
                "\u03b3-Carboxyglutamic acid (Gla)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Histidine (His)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Arginine (Arg)",
            "Lysine (Lys)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Proline (Pro)",
            "Phenylalanine (Phe)",
            "Tryptophan (Trp)",
            "Methionine (Met)",
            "Homoserine (Hse)",
            "Hydroxyproline (Hyp)",
            "Norleucine (Nle)",
            "Ornithine (Orn)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Histidine (His)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Arginine (Arg)",
                "Lysine (Lys)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Proline (Pro)",
                "Phenylalanine (Phe)",
                "Tryptophan (Trp)",
                "Methionine (Met)",
                "Homoserine (Hse)",
                "Hydroxyproline (Hyp)",
                "Norleucine (Nle)",
                "Ornithine (Orn)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Homoserine (Hse)",
                "Hydroxyproline (Hyp)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Norleucine (Nle)",
                "Ornithine (Orn)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic Acid (Asp, D)",
            "Glutamic Acid (Glu, E)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic Acid (Asp, D)",
                "Glutamic Acid (Glu, E)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aspartic Acid (Asp, D)",
                "Glutamic Acid (Glu, E)"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (Asp)",
            "Aspartate",
            "Asp",
            "Glu",
            "Glutamic acid",
            "Glutamate",
            "Glutamic acid (Glu)",
            "Glutamate (Glu)",
            "Glutamic",
            "Glutamic acid, L-",
            "Glutamic acid, D-",
            "Glutamic acid, DL-",
            "Glutamic acid, L- (Glu)",
            "Glutamic acid, D- (Glu)",
            "Glutamic acid, DL- (Glu)",
            "Glutamate, L-",
            "Glutamate, D-",
            "Glutamate, DL-",
            "Glutamate, L- (Glu)",
            "Glutamate, D- (Glu)",
            "Glutamate, DL- (Glu)",
            "Glutamic acid, L- (Asp)",
            "Glutamic acid, D- (Asp)",
            "Glutamic acid, DL- (Asp)",
            "Glutamate, L- (Asp)",
            "Glutamate, D- (Asp)",
            "Glutamate, DL- (Asp)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (Asp)",
                "Aspartate",
                "Asp",
                "Glu",
                "Glutamic acid",
                "Glutamate",
                "Glutamic acid (Glu)",
                "Glutamate (Glu)",
                "Glutamic",
                "Glutamic acid, L-",
                "Glutamic acid, D-",
                "Glutamic acid, DL-",
                "Glutamic acid, L- (Glu)",
                "Glutamic acid, D- (Glu)",
                "Glutamic acid, DL- (Glu)",
                "Glutamate, L-",
                "Glutamate, D-",
                "Glutamate, DL-",
                "Glutamate, L- (Glu)",
                "Glutamate, D- (Glu)",
                "Glutamate, DL- (Glu)",
                "Glutamic acid, L- (Asp)",
                "Glutamic acid, D- (Asp)",
                "Glutamic acid, DL- (Asp)"
            ],
            "mismatches": [
                "Glutamate, L- (Asp)",
                "Glutamate, D- (Asp)",
                "Glutamate, DL- (Asp)"
            ],
            "true_referents": [
                "Asp",
                "Aspartate",
                "Aspartic acid (Asp)",
                "Glu",
                "Glutamate",
                "Glutamate (Glu)",
                "Glutamate, D-",
                "Glutamate, D- (Glu)",
                "Glutamate, DL-",
                "Glutamate, DL- (Glu)",
                "Glutamate, L-",
                "Glutamate, L- (Glu)",
                "Glutamic",
                "Glutamic acid",
                "Glutamic acid (Glu)",
                "Glutamic acid, D-",
                "Glutamic acid, D- (Asp)",
                "Glutamic acid, D- (Glu)",
                "Glutamic acid, DL-",
                "Glutamic acid, DL- (Asp)",
                "Glutamic acid, DL- (Glu)",
                "Glutamic acid, L-",
                "Glutamic acid, L- (Asp)",
                "Glutamic acid, L- (Glu)"
            ],
            "TP": 24,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            "Aspartic acid (D)",
            "Glutamic acid (E)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid (D)",
                "Glutamic acid (E)"
            ],
            "mismatches": [],
            "true_referents": [
                "Aspartic acid (D)",
                "Glutamic acid (E)"
            ],
            "TP": 2,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "acidic amino acid at physiological pH",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Aspartic acid (Asp)",
                "Canonical name": "Aspartic acid"
            },
            {
                "Referent": "Glutamic acid (Glu)",
                "Canonical name": "Glutamic acid"
            },
            {
                "Referent": "Glutamine (Gln)",
                "Canonical name": "Glutamine"
            },
            {
                "Referent": "Serine (Ser)",
                "Canonical name": "Serine"
            },
            {
                "Referent": "Threonine (Thr)",
                "Canonical name": "Threonine"
            },
            {
                "Referent": "Cysteine (Cys)",
                "Canonical name": "Cysteine"
            },
            {
                "Referent": "Asparagine (Asn)",
                "Canonical name": "Asparagine"
            },
            {
                "Referent": "Glutathione (GSH)",
                "Canonical name": "Glutathione"
            },
            {
                "Referent": "Alanine (Ala)",
                "Canonical name": "Alanine"
            },
            {
                "Referent": "Histidine (His)",
                "Canonical name": "Histidine"
            },
            {
                "Referent": "Arginine (Arg)",
                "Canonical name": "Arginine"
            },
            {
                "Referent": "Lysine (Lys)",
                "Canonical name": "Lysine"
            },
            {
                "Referent": "Methionine (Met)",
                "Canonical name": "Methionine"
            },
            {
                "Referent": "Tryptophan (Trp)",
                "Canonical name": "Tryptophan"
            },
            {
                "Referent": "Proline (Pro)",
                "Canonical name": "Proline"
            },
            {
                "Referent": "Glycine (Gly)",
                "Canonical name": "Glycine"
            },
            {
                "Referent": "Tyrosine (Tyr)",
                "Canonical name": "Tyrosine"
            },
            {
                "Referent": "Phenylalanine (Phe)",
                "Canonical name": "Phenylalanine"
            },
            {
                "Referent": "Leucine (Leu)",
                "Canonical name": "Leucine"
            },
            {
                "Referent": "Isoleucine (Ile)",
                "Canonical name": "Isoleucine"
            },
            {
                "Referent": "Valine (Val)",
                "Canonical name": "Valine"
            },
            {
                "Referent": "Ornithine (Orn)",
                "Canonical name": "Ornithine"
            },
            {
                "Referent": "Citrulline (Cit)",
                "Canonical name": "Citrulline"
            },
            {
                "Referent": "Taurine (Tau)",
                "Canonical name": "Taurine"
            },
            {
                "Referent": "Citric acid (Cit)",
                "Canonical name": "Citric acid"
            },
            {
                "Referent": "Pyruvic acid (Pyr)",
                "Canonical name": "Pyruvic acid"
            },
            {
                "Referent": "Succinic acid (Suc)",
                "Canonical name": "Succinic acid"
            },
            {
                "Referent": "Maleic acid (Mal)",
                "Canonical name": "Maleic acid"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aspartic acid",
                "Glutamic acid",
                "Glutamine",
                "Serine",
                "Threonine",
                "Cysteine",
                "Asparagine",
                "Glutathione",
                "Alanine",
                "Histidine",
                "Arginine",
                "Lysine",
                "Methionine",
                "Tryptophan",
                "Proline",
                "Glycine",
                "Tyrosine",
                "Phenylalanine",
                "Leucine",
                "Isoleucine",
                "Valine",
                "Ornithine",
                "Citrulline",
                "Taurine"
            ],
            "mismatches": [
                "Citric acid",
                "Pyruvic acid",
                "Succinic acid",
                "Maleic acid"
            ],
            "true_referents": [
                "{\"Referent\": \"Alanine (Ala)\", \"Canonical name\": \"Alanine\"}",
                "{\"Referent\": \"Arginine (Arg)\", \"Canonical name\": \"Arginine\"}",
                "{\"Referent\": \"Asparagine (Asn)\", \"Canonical name\": \"Asparagine\"}",
                "{\"Referent\": \"Aspartic acid (Asp)\", \"Canonical name\": \"Aspartic acid\"}",
                "{\"Referent\": \"Citrulline (Cit)\", \"Canonical name\": \"Citrulline\"}",
                "{\"Referent\": \"Cysteine (Cys)\", \"Canonical name\": \"Cysteine\"}",
                "{\"Referent\": \"Glutamic acid (Glu)\", \"Canonical name\": \"Glutamic acid\"}",
                "{\"Referent\": \"Glutamine (Gln)\", \"Canonical name\": \"Glutamine\"}",
                "{\"Referent\": \"Glutathione (GSH)\", \"Canonical name\": \"Glutathione\"}",
                "{\"Referent\": \"Glycine (Gly)\", \"Canonical name\": \"Glycine\"}",
                "{\"Referent\": \"Histidine (His)\", \"Canonical name\": \"Histidine\"}",
                "{\"Referent\": \"Isoleucine (Ile)\", \"Canonical name\": \"Isoleucine\"}",
                "{\"Referent\": \"Leucine (Leu)\", \"Canonical name\": \"Leucine\"}",
                "{\"Referent\": \"Lysine (Lys)\", \"Canonical name\": \"Lysine\"}",
                "{\"Referent\": \"Methionine (Met)\", \"Canonical name\": \"Methionine\"}",
                "{\"Referent\": \"Ornithine (Orn)\", \"Canonical name\": \"Ornithine\"}",
                "{\"Referent\": \"Phenylalanine (Phe)\", \"Canonical name\": \"Phenylalanine\"}",
                "{\"Referent\": \"Proline (Pro)\", \"Canonical name\": \"Proline\"}",
                "{\"Referent\": \"Serine (Ser)\", \"Canonical name\": \"Serine\"}",
                "{\"Referent\": \"Taurine (Tau)\", \"Canonical name\": \"Taurine\"}",
                "{\"Referent\": \"Threonine (Thr)\", \"Canonical name\": \"Threonine\"}",
                "{\"Referent\": \"Tryptophan (Trp)\", \"Canonical name\": \"Tryptophan\"}",
                "{\"Referent\": \"Tyrosine (Tyr)\", \"Canonical name\": \"Tyrosine\"}",
                "{\"Referent\": \"Valine (Val)\", \"Canonical name\": \"Valine\"}"
            ],
            "TP": 24,
            "FP": 4,
            "FN": 0
        }
    }
]