[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Tryptophan (Trp)",
            "Threonine (Thr)",
            "Histidine (His)",
            "Arginine (Arg)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Alanine (Ala)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Tryptophan (Trp)",
                "Threonine (Thr)",
                "Histidine (His)",
                "Arginine (Arg)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Alanine (Ala)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Proline (Pro)",
                "Serine (Ser)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "mismatches": [],
            "true_referents": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "TP": 9,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Threonine",
            "Arginine",
            "Serine",
            "Tryptophan"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Threonine",
                "Arginine",
                "Serine",
                "Tryptophan"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Arginine",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine",
                "Serine (Ser)",
                "Threonine",
                "Threonine (Thr)",
                "Tryptophan",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)",
            "Arginine (Arg)",
            "Histidine (His) - infants",
            "Isoleucine (Ile) - premature infants",
            "Leucine (Leu) - growing children",
            "Lysine (Lys) - individuals with limited protein sources",
            "Methionine (Met) - individuals with certain metabolic disorders",
            "Phenylalanine (Phe) - individuals with PKU (under controlled conditions)",
            "Threonine (Thr) - individuals recovering from burns",
            "Tryptophan (Trp) - individuals with limited dietary access",
            "Valine (Val) - athletes during intense training",
            "Arginine (Arg) - during periods of rapid growth",
            "Histidine (His) - during tissue repair",
            "Isoleucine (Ile) - muscle protein synthesis",
            "Leucine (Leu) - stimulating muscle growth",
            "Lysine (Lys) - calcium absorption"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)",
                "Arginine (Arg)",
                "Histidine (His) - infants",
                "Isoleucine (Ile) - premature infants",
                "Leucine (Leu) - growing children",
                "Lysine (Lys) - individuals with limited protein sources",
                "Methionine (Met) - individuals with certain metabolic disorders",
                "Phenylalanine (Phe) - individuals with PKU (under controlled conditions)",
                "Threonine (Thr) - individuals recovering from burns",
                "Tryptophan (Trp) - individuals with limited dietary access",
                "Valine (Val) - athletes during intense training",
                "Arginine (Arg) - during periods of rapid growth",
                "Histidine (His) - during tissue repair",
                "Isoleucine (Ile) - muscle protein synthesis",
                "Leucine (Leu) - stimulating muscle growth",
                "Lysine (Lys) - calcium absorption"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine (Arg)",
                "Arginine (Arg) - during periods of rapid growth",
                "Histidine (His)",
                "Histidine (His) - during tissue repair",
                "Histidine (His) - infants",
                "Isoleucine (Ile)",
                "Isoleucine (Ile) - muscle protein synthesis",
                "Isoleucine (Ile) - premature infants",
                "Leucine (Leu)",
                "Leucine (Leu) - growing children",
                "Leucine (Leu) - stimulating muscle growth",
                "Lysine (Lys)",
                "Lysine (Lys) - calcium absorption",
                "Lysine (Lys) - individuals with limited protein sources",
                "Methionine (Met)",
                "Methionine (Met) - individuals with certain metabolic disorders",
                "Phenylalanine (Phe)",
                "Phenylalanine (Phe) - individuals with PKU (under controlled conditions)",
                "Threonine (Thr)",
                "Threonine (Thr) - individuals recovering from burns",
                "Tryptophan (Trp)",
                "Tryptophan (Trp) - individuals with limited dietary access",
                "Valine (Val)",
                "Valine (Val) - athletes during intense training"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)",
            "Arginine (Arg)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)",
                "Arginine (Arg)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine (Arg)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "TP": 10,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Lysine (Lys)",
            "Methionine (Met)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Histidine (His)",
            "Phenylalanine (Phe)",
            "Arginine (Arg)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Glutamine (Gln)",
            "Asparagine (Asn)",
            "Serine (Ser)",
            "Proline (Pro)",
            "Alanine (Ala)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Glycine (Gly)",
            "Ornithine (Orn)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Dihydroxyphenylalanine (DOPA)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lysine (Lys)",
                "Methionine (Met)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Histidine (His)",
                "Phenylalanine (Phe)",
                "Arginine (Arg)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Glutamine (Gln)",
                "Asparagine (Asn)",
                "Serine (Ser)",
                "Proline (Pro)",
                "Alanine (Ala)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Glycine (Gly)",
                "Ornithine (Orn)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Dihydroxyphenylalanine (DOPA)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Dihydroxyphenylalanine (DOPA)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Ornithine (Orn)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Pyrrolysine (Pyl)",
                "Selenocysteine (Sec)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Arginine (Arg)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Alanine (Ala)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)",
            "Ornithine (Orn)",
            "Citrulline (Cit)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Arginine (Arg)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Alanine (Ala)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)",
                "Ornithine (Orn)",
                "Citrulline (Cit)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Citrulline (Cit)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Ornithine (Orn)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Pyrrolysine (Pyl)",
                "Selenocysteine (Sec)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine",
            "Arginine",
            "Asparagine",
            "Aspartic acid",
            "Cysteine",
            "Glutamic acid",
            "Glutamine",
            "Glycine",
            "Histidine",
            "Isoleucine",
            "Leucine",
            "Lysine",
            "Methionine",
            "Phenylalanine",
            "Proline",
            "Serine",
            "Threonine",
            "Tryptophan",
            "Tyrosine",
            "Valine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine",
                "Arginine",
                "Asparagine",
                "Aspartic acid",
                "Cysteine",
                "Glutamic acid",
                "Glutamine",
                "Glycine",
                "Histidine",
                "Isoleucine",
                "Leucine",
                "Lysine",
                "Methionine",
                "Phenylalanine",
                "Proline",
                "Serine",
                "Threonine",
                "Tryptophan",
                "Tyrosine",
                "Valine"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine",
                "Arginine",
                "Asparagine",
                "Aspartic acid",
                "Cysteine",
                "Glutamic acid",
                "Glutamine",
                "Glycine",
                "Histidine",
                "Isoleucine",
                "Leucine",
                "Lysine",
                "Methionine",
                "Phenylalanine",
                "Proline",
                "Serine",
                "Threonine",
                "Tryptophan",
                "Tyrosine",
                "Valine"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "mismatches": [],
            "true_referents": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "TP": 9,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "mismatches": [],
            "true_referents": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "TP": 9,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "mismatches": [],
            "true_referents": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "TP": 9,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Valine (Val)",
            "Arginine (Arg)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)",
                "Arginine (Arg)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine (Arg)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Valine (Val)"
            ],
            "TP": 10,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic Acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic Acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic Acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic Acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic Acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic Acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 20,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Histidine (His)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Threonine (Thr)",
            "Valine (Val)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Phenylalanine (Phe)",
            "Tryptophan (Trp)",
            "Methionine (Met)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Glutamine (Gln)",
            "Asparagine (Asn)",
            "Glutamic acid (Glu)",
            "Aspartic acid (Asp)",
            "Serine (Ser)",
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Proline (Pro)",
            "Hydroxyproline (Hyp)",
            "Glycylglycine (Gly-Gly)",
            "Carnosine (\u03b2-Ala-His)",
            "Anserine (\u03b2-Ala-His-Arg)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Histidine (His)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Threonine (Thr)",
                "Valine (Val)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Phenylalanine (Phe)",
                "Tryptophan (Trp)",
                "Methionine (Met)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Glutamine (Gln)",
                "Asparagine (Asn)",
                "Glutamic acid (Glu)",
                "Aspartic acid (Asp)",
                "Serine (Ser)",
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Proline (Pro)",
                "Hydroxyproline (Hyp)",
                "Glycylglycine (Gly-Gly)",
                "Carnosine (\u03b2-Ala-His)",
                "Anserine (\u03b2-Ala-His-Arg)"
            ],
            "mismatches": [],
            "true_referents": [
                "Alanine (Ala)",
                "Anserine (\u03b2-Ala-His-Arg)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Carnosine (\u03b2-Ala-His)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Glycylglycine (Gly-Gly)",
                "Histidine (His)",
                "Hydroxyproline (Hyp)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            "Phenylalanine (Phe)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Threonine (Thr)",
            "Valine (Val)",
            "Tryptophan (Trp)",
            "Arginine (Arg)",
            "Tyrosine (Tyr)",
            "Cysteine (Cys)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Phenylalanine (Phe)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Threonine (Thr)",
                "Valine (Val)",
                "Tryptophan (Trp)",
                "Arginine (Arg)",
                "Tyrosine (Tyr)",
                "Cysteine (Cys)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine (Arg)",
                "Cysteine (Cys)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)"
            ],
            "TP": 12,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "essential amino acid",
        "domain": "chemistry",
        "response": [
            {
                "Referent": "Alanine",
                "Canonical Name": "Alanine"
            },
            {
                "Referent": "Arginine",
                "Canonical Name": "Arginine"
            },
            {
                "Referent": "Asparagine",
                "Canonical Name": "Asparagine"
            },
            {
                "Referent": "Cysteine",
                "Canonical Name": "Cysteine"
            },
            {
                "Referent": "Glutamine",
                "Canonical Name": "Glutamine"
            },
            {
                "Referent": "Glycine",
                "Canonical Name": "Glycine"
            },
            {
                "Referent": "Histidine",
                "Canonical Name": "Histidine"
            },
            {
                "Referent": "Isoleucine",
                "Canonical Name": "Isoleucine"
            },
            {
                "Referent": "Leucine",
                "Canonical Name": "Leucine"
            },
            {
                "Referent": "Methionine",
                "Canonical Name": "Methionine"
            },
            {
                "Referent": "Phenylalanine",
                "Canonical Name": "Phenylalanine"
            },
            {
                "Referent": "Proline",
                "Canonical Name": "Proline"
            },
            {
                "Referent": "Serine",
                "Canonical Name": "Serine"
            },
            {
                "Referent": "Threonine",
                "Canonical Name": "Threonine"
            },
            {
                "Referent": "Tryptophan",
                "Canonical Name": "Tryptophan"
            },
            {
                "Referent": "Tyrosine",
                "Canonical Name": "Tyrosine"
            },
            {
                "Referent": "Valine",
                "Canonical Name": "Valine"
            }
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine",
                "Arginine",
                "Asparagine",
                "Cysteine",
                "Glutamine",
                "Glycine",
                "Histidine",
                "Isoleucine",
                "Leucine",
                "Methionine",
                "Phenylalanine",
                "Proline",
                "Serine",
                "Threonine",
                "Tryptophan",
                "Tyrosine",
                "Valine"
            ],
            "mismatches": [],
            "true_referents": [
                "{\"Referent\": \"Alanine\", \"Canonical Name\": \"Alanine\"}",
                "{\"Referent\": \"Arginine\", \"Canonical Name\": \"Arginine\"}",
                "{\"Referent\": \"Asparagine\", \"Canonical Name\": \"Asparagine\"}",
                "{\"Referent\": \"Cysteine\", \"Canonical Name\": \"Cysteine\"}",
                "{\"Referent\": \"Glutamine\", \"Canonical Name\": \"Glutamine\"}",
                "{\"Referent\": \"Glycine\", \"Canonical Name\": \"Glycine\"}",
                "{\"Referent\": \"Histidine\", \"Canonical Name\": \"Histidine\"}",
                "{\"Referent\": \"Isoleucine\", \"Canonical Name\": \"Isoleucine\"}",
                "{\"Referent\": \"Leucine\", \"Canonical Name\": \"Leucine\"}",
                "{\"Referent\": \"Methionine\", \"Canonical Name\": \"Methionine\"}",
                "{\"Referent\": \"Phenylalanine\", \"Canonical Name\": \"Phenylalanine\"}",
                "{\"Referent\": \"Proline\", \"Canonical Name\": \"Proline\"}",
                "{\"Referent\": \"Serine\", \"Canonical Name\": \"Serine\"}",
                "{\"Referent\": \"Threonine\", \"Canonical Name\": \"Threonine\"}",
                "{\"Referent\": \"Tryptophan\", \"Canonical Name\": \"Tryptophan\"}",
                "{\"Referent\": \"Tyrosine\", \"Canonical Name\": \"Tyrosine\"}",
                "{\"Referent\": \"Valine\", \"Canonical Name\": \"Valine\"}"
            ],
            "TP": 17,
            "FP": 0,
            "FN": 0
        }
    }
]