[
    {
        "test": "limited-list-referents",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine",
            "Pyrrolysine",
            "Beta-alanine",
            "Homocysteine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Valine (Val)",
                "Selenocysteine",
                "Pyrrolysine",
                "Beta-alanine",
                "Homocysteine"
            ],
            "mismatches": [
                "Cysteine (Cys)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Lysine (Lys)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "beta-alanine",
                "beta-alanine betaine",
                "beta-alanopine",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "phi-v4",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala, A)",
            "Arginine (Arg, R)",
            "Asparagine (Asn, N)",
            "Aspartic acid (Asp, D)",
            "Cysteine (Cys, C)",
            "Glutamine (Gln, Q)",
            "Glutamic acid (Glu, E)",
            "Glycine (Gly, G)",
            "Histidine (His, H)",
            "Isoleucine (Ile, I)",
            "Leucine (Leu, L)",
            "Lysine (Lys, K)",
            "Methionine (Met, M)",
            "Phenylalanine (Phe, F)",
            "Proline (Pro, P)",
            "Serine (Ser, S)",
            "Threonine (Thr, T)",
            "Tryptophan (Trp, W)",
            "Tyrosine (Tyr, Y)",
            "Valine (Val, V)",
            "Selenocysteine (Sec, U)",
            "Pyrrolysine (Pyl, O)",
            "Homocysteine",
            "Citrulline"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Asparagine (Asn, N)",
                "Cysteine (Cys, C)",
                "Glutamic acid (Glu, E)",
                "Glycine (Gly, G)",
                "Histidine (His, H)",
                "Isoleucine (Ile, I)",
                "Phenylalanine (Phe, F)",
                "Proline (Pro, P)",
                "Serine (Ser, S)",
                "Threonine (Thr, T)",
                "Valine (Val, V)",
                "Selenocysteine (Sec, U)",
                "Pyrrolysine (Pyl, O)",
                "Homocysteine",
                "Citrulline"
            ],
            "mismatches": [
                "Alanine (Ala, A)",
                "Arginine (Arg, R)",
                "Aspartic acid (Asp, D)",
                "Glutamine (Gln, Q)",
                "Leucine (Leu, L)",
                "Lysine (Lys, K)",
                "Methionine (Met, M)",
                "Tryptophan (Trp, W)",
                "Tyrosine (Tyr, Y)"
            ],
            "true_referents": [
                "D-arginine",
                "D-aspartic acid",
                "Glu-Gln",
                "L-alanine",
                "L-asparagine",
                "L-citrulline",
                "L-glutamic acid",
                "L-leucine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "Valine-d8",
                "arginine",
                "asparagine",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glycine",
                "histidine",
                "homocysteine",
                "isoleucine",
                "isoleucine derivative",
                "lysine",
                "methionine",
                "methyl-L-methionine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 15,
            "FP": 9,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "mistral-small-instruct-24B",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic Acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic Acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine",
            "Citrulline"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic Acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic Acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Ornithine",
                "Citrulline"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gemma-3",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic Acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic Acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Homocysteine",
            "Ornithine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic Acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic Acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Ornithine"
            ],
            "mismatches": [
                "Lysine (Lys)",
                "Homocysteine"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine",
            "Citrulline"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Ornithine",
                "Citrulline"
            ],
            "mismatches": [
                "Lysine (Lys)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4o-mini",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Aspartic Acid (Asp)",
            "Glutamic Acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Proline (Pro)",
            "Arginine (Arg)",
            "Lysine (Lys)",
            "Histidine (His)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine (Orn)",
            "Citric Acid (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Cysteine (Cys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Aspartic Acid (Asp)",
                "Glutamic Acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Proline (Pro)",
                "Arginine (Arg)",
                "Lysine (Lys)",
                "Histidine (His)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Ornithine (Orn)"
            ],
            "mismatches": [
                "Citric Acid (Cit)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "cysteic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-4-32k",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala, A)",
            "Arginine (Arg, R)",
            "Asparagine (Asn, N)",
            "Aspartic acid (Asp, D)",
            "Cysteine (Cys, C)",
            "Glutamine (Gln, Q)",
            "Glutamic acid (Glu, E)",
            "Glycine (Gly, G)",
            "Histidine (His, H)",
            "Isoleucine (Ile, I)",
            "Leucine (Leu, L)",
            "Lysine (Lys, K)",
            "Methionine (Met, M)",
            "Phenylalanine (Phe, F)",
            "Proline (Pro, P)",
            "Serine (Ser, S)",
            "Threonine (Thr, T)",
            "Tryptophan (Trp, W)",
            "Tyrosine (Tyr, Y)",
            "Valine (Val, V)",
            "Selenocysteine (Sec, U)",
            "Pyrrolysine (Pyl, O)",
            "Ornithine (Orn)",
            "Citrulline (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Arginine (Arg, R)",
                "Asparagine (Asn, N)",
                "Aspartic acid (Asp, D)",
                "Cysteine (Cys, C)",
                "Glutamic acid (Glu, E)",
                "Glycine (Gly, G)",
                "Histidine (His, H)",
                "Isoleucine (Ile, I)",
                "Leucine (Leu, L)",
                "Lysine (Lys, K)",
                "Methionine (Met, M)",
                "Phenylalanine (Phe, F)",
                "Proline (Pro, P)",
                "Serine (Ser, S)",
                "Threonine (Thr, T)",
                "Tryptophan (Trp, W)",
                "Tyrosine (Tyr, Y)",
                "Valine (Val, V)",
                "Selenocysteine (Sec, U)",
                "Pyrrolysine (Pyl, O)",
                "Ornithine (Orn)",
                "Citrulline (Cit)"
            ],
            "mismatches": [
                "Alanine (Ala, A)",
                "Glutamine (Gln, Q)"
            ],
            "true_referents": [
                "D-arginine",
                "D-aspartic acid",
                "Glu-Gln",
                "L-alanine",
                "L-asparagine",
                "L-citrulline",
                "L-glutamic acid",
                "L-leucine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "Valine-d8",
                "arginine",
                "asparagine",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glycine",
                "histidine",
                "isoleucine",
                "isoleucine derivative",
                "lysine",
                "methionine",
                "methyl-L-methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "gpt-35-turbo-16k",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamine (Gln)",
            "Glutamic acid (Glu)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Norleucine (Nle)",
            "Hydroxyproline (Hyp)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamine (Gln)",
                "Glutamic acid (Glu)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Norleucine (Nle)",
                "Hydroxyproline (Hyp)"
            ],
            "mismatches": [
                "Pyrrolysine (Pyl)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-norleucine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "hydroxyproline",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "o1-mini",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala, A)",
            "Arginine (Arg, R)",
            "Asparagine (Asn, N)",
            "Aspartic acid (Asp, D)",
            "Cysteine (Cys, C)",
            "Glutamine (Gln, Q)",
            "Glutamic acid (Glu, E)",
            "Glycine (Gly, G)",
            "Histidine (His, H)",
            "Isoleucine (Ile, I)",
            "Leucine (Leu, L)",
            "Lysine (Lys, K)",
            "Methionine (Met, M)",
            "Phenylalanine (Phe, F)",
            "Proline (Pro, P)",
            "Serine (Ser, S)",
            "Threonine (Thr, T)",
            "Tryptophan (Trp, W)",
            "Tyrosine (Tyr, Y)",
            "Valine (Val, V)",
            "Selenocysteine (Sec, U)",
            "Pyrrolysine (Pyl, O)",
            "Hydroxyproline (Hyp)",
            "Ornithine (Orn)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Asparagine (Asn, N)",
                "Glutamic acid (Glu, E)",
                "Glycine (Gly, G)",
                "Histidine (His, H)",
                "Ornithine (Orn)",
                "Phenylalanine (Phe, F)",
                "Proline (Pro, P)",
                "Serine (Ser, S)",
                "Threonine (Thr, T)",
                "Valine (Val, V)",
                "Selenocysteine (Sec, U)",
                "Pyrrolysine (Pyl, O)",
                "Hydroxyproline (Hyp)"
            ],
            "mismatches": [
                "Alanine (Ala, A)",
                "Arginine (Arg, R)",
                "Aspartic acid (Asp, D)",
                "Cysteine (Cys, C)",
                "Glutamine (Gln, Q)",
                "Isoleucine (Ile, I)",
                "Leucine (Leu, L)",
                "Lysine (Lys, K)",
                "Methionine (Met, M)",
                "Tryptophan (Trp, W)",
                "Tyrosine (Tyr, Y)"
            ],
            "true_referents": [
                "D-arginine",
                "D-aspartic acid",
                "Glu-Gln",
                "L-alanine",
                "L-asparagine",
                "L-glutamic acid",
                "L-leucine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "Valine-d8",
                "arginine",
                "asparagine",
                "cysteine",
                "glutamic acid",
                "glycine",
                "histidine",
                "hydroxyproline",
                "isoleucine",
                "isoleucine derivative",
                "lysine",
                "methionine",
                "methyl-L-methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 13,
            "FP": 11,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine (Orn)",
            "Citrulline (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Ornithine (Orn)",
                "Citrulline (Cit)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine (Orn)",
            "Citrulline (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Ornithine (Orn)",
                "Citrulline (Cit)"
            ],
            "mismatches": [
                "Pyrrolysine (Pyl)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine (Orn)",
            "Citrulline (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Ornithine (Orn)",
                "Citrulline (Cit)"
            ],
            "mismatches": [
                "Glycine (Gly)",
                "Histidine (His)",
                "Lysine (Lys)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Pyrrolysine (Pyl)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 18,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic Acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic Acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine (Orn)",
            "Citrulline (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic Acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic Acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Ornithine (Orn)",
                "Citrulline (Cit)"
            ],
            "mismatches": [
                "Pyrrolysine (Pyl)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala or A)",
            "Arginine (Arg or R)",
            "Asparagine (Asn or N)",
            "Aspartic acid (Asp or D)",
            "Cysteine (Cys or C)",
            "Cystine (Cys2)",
            "Glycine (Gly or G)",
            "Glutamic acid (Glu or E)",
            "Glutamine (Gln or Q)",
            "Histidine (His or H)",
            "Isoleucine (Ile or I)",
            "Leucine (Leu or L)",
            "Leucyl-tRNA synthetase",
            "Lysine (Lys or K)",
            "Methionine (Met or M)",
            "Phenylalanine (Phe or F)",
            "Proline (Pro or P)",
            "Protease",
            "Proteomics",
            "Serine (Ser or S)",
            "Threonine (Thr or T)",
            "Thrombin",
            "Tyrosine (Tyr or Y)",
            "Valine (Val or V)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Arginine (Arg or R)",
                "Asparagine (Asn or N)",
                "Aspartic acid (Asp or D)",
                "Cysteine (Cys or C)",
                "Cystine (Cys2)",
                "Glutamic acid (Glu or E)",
                "Glutamine (Gln or Q)",
                "Isoleucine (Ile or I)",
                "Leucine (Leu or L)",
                "Lysine (Lys or K)",
                "Phenylalanine (Phe or F)",
                "Proline (Pro or P)",
                "Serine (Ser or S)",
                "Threonine (Thr or T)",
                "Tyrosine (Tyr or Y)",
                "Valine (Val or V)"
            ],
            "mismatches": [
                "Alanine (Ala or A)",
                "Glycine (Gly or G)",
                "Histidine (His or H)",
                "Leucyl-tRNA synthetase",
                "Methionine (Met or M)",
                "Protease",
                "Proteomics",
                "Thrombin"
            ],
            "true_referents": [
                "Amicoumacin B",
                "Arginine glutamate",
                "D-aspartic acid",
                "L-alanine",
                "L-asparagine",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "Leu-Thr-Gln",
                "Peptidyl-L-lysine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "cystine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "methyl-L-methionine",
                "peptidyl-glycine",
                "peptidyl-proline",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tyrosine",
                "valine"
            ],
            "TP": 16,
            "FP": 8,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala or A)",
            "Arginine (Arg or R)",
            "Asparagine (Asn or N)",
            "Aspartic acid (Asp or D)",
            "Cysteine (Cys or C)",
            "Glutamic acid (Glu or E)",
            "Glutamine (Gln or Q)",
            "Glycine (Gly or G)",
            "Histidine (His or H)",
            "Isoleucine (Ile or I)",
            "Leucine (Leu or L)",
            "Lysine (Lys or K)",
            "Methionine (Met or M)",
            "Phenylalanine (Phe or F)",
            "Proline (Pro or P)",
            "Serine (Ser or S)",
            "Threonine (Thr or T)",
            "Tyrosine (Tyr or Y)",
            "Valine (Val or V)",
            "Triiodothyronine (T3)",
            "Thyroxine (T4)",
            "Homoarginine",
            "Ornithine",
            "Citrulline",
            "Sarcosine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Arginine (Arg or R)",
                "Asparagine (Asn or N)",
                "Aspartic acid (Asp or D)",
                "Cysteine (Cys or C)",
                "Glutamic acid (Glu or E)",
                "Glutamine (Gln or Q)",
                "Isoleucine (Ile or I)",
                "Leucine (Leu or L)",
                "Phenylalanine (Phe or F)",
                "Proline (Pro or P)",
                "Serine (Ser or S)",
                "Threonine (Thr or T)",
                "Valine (Val or V)",
                "Tyrosine (Tyr or Y)",
                "Alanine (Ala or A)",
                "Glycine (Gly or G)",
                "Histidine (His or H)",
                "Lysine (Lys or K)",
                "Methionine (Met or M)",
                "Thyroxine (T4)",
                "Homoarginine",
                "Ornithine",
                "Citrulline"
            ],
            "mismatches": [
                "Triiodothyronine (T3)",
                "Sarcosine"
            ],
            "true_referents": [
                "3,3',5'-triiodothyronine",
                "Arginine glutamate",
                "D-aspartic acid",
                "L-alanine",
                "L-asparagine",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-homoarginine",
                "L-isoleucine",
                "L-leucine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homoarginine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "methyl-L-methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "thyroxine",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents",
        "responder": "amazon.titan-text-express-v1",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Alanine (Ala)",
                "Canonical Name": "Alanine"
            },
            {
                "Referent": "Arginine (Arg)",
                "Canonical Name": "Arginine"
            },
            {
                "Referent": "Asparagine (Asn)",
                "Canonical Name": "Asparagine"
            },
            {
                "Referent": "Aspartic acid (Asp)",
                "Canonical Name": "Aspartic acid"
            },
            {
                "Referent": "Cysteine (Cys)",
                "Canonical Name": "Cysteine"
            },
            {
                "Referent": "Glutamic acid (Glu)",
                "Canonical Name": "Glutamic acid"
            },
            {
                "Referent": "Glutamine (Gln)",
                "Canonical Name": "Glutamine"
            },
            {
                "Referent": "Glycine (Gly)",
                "Canonical Name": "Glycine"
            },
            {
                "Referent": "Histidine (His)",
                "Canonical Name": "Histidine"
            },
            {
                "Referent": "Isoleucine (Ile)",
                "Canonical Name": "Isoleucine"
            },
            {
                "Referent": "Leucine (Leu)",
                "Canonical Name": "Leucine"
            },
            {
                "Referent": "Lysine (Lys)",
                "Canonical Name": "Lysine"
            },
            {
                "Referent": "Methionine (Met)",
                "Canonical Name": "Methionine"
            },
            {
                "Referent": "Phenylalanine (Phe)",
                "Canonical Name": "Phenylalanine"
            },
            {
                "Referent": "Proline (Pro)",
                "Canonical Name": "Proline"
            },
            {
                "Referent": "Serine (Ser)",
                "Canonical Name": "Serine"
            },
            {
                "Referent": "Threonine (Thr)",
                "Canonical Name": "Threonine"
            },
            {
                "Referent": "Tryptophan (Trp)",
                "Canonical Name": "Tryptophan"
            },
            {
                "Referent": "Tyrosine (Tyr)",
                "Canonical Name": "Tyrosine"
            },
            {
                "Referent": "Valine (Val)",
                "Canonical Name": "Valine"
            },
            {
                "Referent": "Citrulline (Cit)",
                "Canonical Name": "Citrulline"
            },
            {
                "Referent": "Ornithine (Orn)",
                "Canonical Name": "Ornithine"
            },
            {
                "Referent": "Selenocysteine (Sec)",
                "Canonical Name": "Selenocysteine"
            },
            {
                "Referent": "Taurine (Tau)",
                "Canonical Name": "Taurine"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Asparagine",
                "Aspartic acid",
                "Cysteine",
                "Glutamic acid",
                "Glutamine",
                "Glycine",
                "Histidine",
                "Isoleucine",
                "Lysine",
                "Methionine",
                "Phenylalanine",
                "Proline",
                "Serine",
                "Threonine",
                "Tryptophan",
                "Tyrosine",
                "Citrulline",
                "Ornithine",
                "Selenocysteine"
            ],
            "mismatches": [
                "Alanine",
                "Arginine",
                "Leucine",
                "Valine",
                "Taurine"
            ],
            "true_referents": [
                "(-)-jasmonyl-(S)-valine",
                "(S)-beta-alanopine",
                "Arg-Lys-Cys-Gly",
                "L-alanine-2,3,3,3-d4",
                "L-citrulline",
                "L-isoleucine",
                "L-methionine",
                "L-ornithine",
                "L-proline",
                "L-selenocysteine",
                "L-threonine",
                "L-valine",
                "Phenylalanine-13C9",
                "alanine-2,3,3,3-d4",
                "asparagine",
                "aspartate family amino acid",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glutamine family amino acid",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "selenocysteine",
                "serine",
                "serine family amino acid",
                "threonine",
                "tryptophan",
                "tyrosine"
            ],
            "TP": 19,
            "FP": 5,
            "FN": 0
        }
    }
]