[
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "qwen-v2.5-14b-instruct",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "glycine (Gly)",
            "alanine (Ala)",
            "valine (Val)",
            "leucine (Leu)",
            "isoleucine (Ile)",
            "proline (Pro)",
            "phenylalanine (Phe)",
            "tryptophan (Trp)",
            "tyrosine (Tyr)",
            "methionine (Met)",
            "threonine (Thr)",
            "serine (Ser)",
            "cysteine (Cys)",
            "lysine (Lys)",
            "arginine (Arg)",
            "histidine (His)",
            "asparagine (Asn)",
            "glutamine (Gln)",
            "aspartic acid (Asp)",
            "glutamic acid (Glu)",
            "ornithine",
            "citrulline",
            "homocysteine",
            "homoserine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "glycine (Gly)",
                "alanine (Ala)",
                "valine (Val)",
                "leucine (Leu)",
                "isoleucine (Ile)",
                "proline (Pro)",
                "phenylalanine (Phe)",
                "tryptophan (Trp)",
                "tyrosine (Tyr)",
                "methionine (Met)",
                "threonine (Thr)",
                "serine (Ser)",
                "cysteine (Cys)",
                "lysine (Lys)",
                "arginine (Arg)",
                "histidine (His)",
                "asparagine (Asn)",
                "glutamine (Gln)",
                "aspartic acid (Asp)",
                "glutamic acid (Glu)",
                "ornithine",
                "citrulline",
                "homocysteine",
                "homoserine"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "homoserine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "phi-v4",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Histidine (His)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Carnosine",
            "Anserine",
            "Homocarnosine",
            "Prolinol carboxylic acid",
            "N-Acetylglutamic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Histidine (His)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Anserine",
                "Homocarnosine"
            ],
            "mismatches": [
                "Cysteine (Cys)",
                "Carnosine",
                "Prolinol carboxylic acid",
                "N-Acetylglutamic acid"
            ],
            "true_referents": [
                "3-propylidene-delta1-pyrroline-5-carboxylic acid",
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-phenylalanine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "N-acetyl-L-glutamic acid",
                "N-acylglutamic acid",
                "N-acylserine",
                "N-benzyloxycarbonyl-L-prolyl-L-prolinal",
                "alanine",
                "anserine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocarnosine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "phenylalanine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "mistral-small-instruct-24B",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Citrulline",
            "Ornithine",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Proline (Pro)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Phenylalanine (Phe)",
            "Cysteic acid",
            "Homocysteine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Arginine (Arg)",
                "Citrulline",
                "Ornithine",
                "Cysteine (Cys)",
                "Methionine (Met)",
                "Proline (Pro)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Phenylalanine (Phe)",
                "Cysteic acid",
                "Histidine (His)",
                "Tyrosine (Tyr)"
            ],
            "mismatches": [
                "Lysine (Lys)",
                "Homocysteine",
                "Tryptophan (Trp)"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 21,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gemma-3",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Aspartic Acid (Asp)",
            "Glutamic Acid (Glu)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Proline (Pro)",
            "Ornithine (Orn)",
            "Citrulline (Cit)",
            "Homocysteine (Hcy)",
            "Homoserine (Hse)",
            "Sarcosine (Sar)",
            "Beta-Alanine (\u03b2-Ala)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine",
                "Alanine",
                "Valine",
                "Leucine",
                "Isoleucine",
                "Serine",
                "Threonine",
                "Cysteine",
                "Methionine",
                "Phenylalanine",
                "Tyrosine",
                "Tryptophan",
                "Aspartic Acid",
                "Glutamic Acid",
                "Lysine",
                "Arginine",
                "Histidine",
                "Proline",
                "Ornithine",
                "Citrulline",
                "Homocysteine",
                "Homoserine",
                "Sarcosine",
                "Beta-Alanine"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "aspartic acid",
                "beta-alanine",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glycine",
                "histidine",
                "homocysteine",
                "homoserine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "sarcosine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Proline (Pro)",
            "Ornithine",
            "Citrulline",
            "Homocysteine",
            "Taurine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Cysteine (Cys)",
                "Methionine (Met)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Histidine (His)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Proline (Pro)",
                "Ornithine",
                "Citrulline",
                "Homocysteine"
            ],
            "mismatches": [
                "Taurine"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "tauropine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4o-mini",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Aminoacetic acid (Glycine)",
            "Aminobutyric acid (GABA)",
            "Aminocaproic acid",
            "Aminoadipic acid",
            "Aminosalicylic acid",
            "2-Aminobenzoic acid (Anthranilic acid)",
            "3-Aminobenzoic acid (p-Aminobenzoic acid)",
            "4-Aminobenzoic acid (p-Aminobenzoic acid)",
            "Lysine",
            "Arginine",
            "Citrulline",
            "Ornithine",
            "Asparagine",
            "Glutamine",
            "2-Amino-3-methylbutanoic acid (Leucine)",
            "2-Amino-4-methylpentanoic acid (Valine)",
            "Aminohexanoic acid",
            "Aminophenylacetic acid",
            "Aminomethylbenzoic acid",
            "Aminobenzenesulfonic acid (Sulfanilic acid)",
            "Amino-2-hydroxybutyric acid",
            "Amino-3-hydroxybutyric acid",
            "Aminosuccinic acid (Aspartic acid)",
            "Aminothiobutyric acid",
            "Aminotriacetic acid (EDTA)",
            "Aminopropionic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Aminoadipic acid",
                "Lysine",
                "Arginine",
                "Citrulline",
                "Ornithine",
                "Asparagine",
                "Glutamine",
                "3-Aminobenzoic acid",
                "4-Aminobenzoic acid"
            ],
            "mismatches": [
                "Aminoacetic acid (Glycine)",
                "Aminobutyric acid (GABA)",
                "Aminocaproic acid",
                "Aminosalicylic acid",
                "2-Aminobenzoic acid (Anthranilic acid)",
                "2-Amino-3-methylbutanoic acid (Leucine)",
                "2-Amino-4-methylpentanoic acid (Valine)",
                "Aminohexanoic acid",
                "Aminophenylacetic acid",
                "Aminomethylbenzoic acid",
                "Aminobenzenesulfonic acid (Sulfanilic acid)",
                "Amino-2-hydroxybutyric acid",
                "Amino-3-hydroxybutyric acid",
                "Aminosuccinic acid (Aspartic acid)",
                "Aminothiobutyric acid",
                "Aminotriacetic acid (EDTA)",
                "Aminopropionic acid"
            ],
            "true_referents": [
                "(2s)-2-Amino-4-sulfinobutanoic acid",
                "(3R)-3-amino-4-hydroxybutanoic acid",
                "2-Amino-4-methylbenzoic acid",
                "2-amino-2-hydroxybutanoic acid",
                "2-amino-2-methylbutanoic acid",
                "2-amino-3-hydroxybutanoic acid",
                "2-aminoadipic acid",
                "2-aminohexanoic acid",
                "3-Amino-5-methylsulfanylpentanoic acid",
                "3-Aminocaproic acid",
                "3-aminobenzoic acid",
                "4-aminobenzoic acid",
                "4-aminosalicylic acid",
                "4-methylthio-2-oxobutanoic acid",
                "5-aminosalicyluric acid",
                "6-aminohexanoic acid",
                "L-alpha-aminobutyric acid",
                "L-arginine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamine",
                "L-ornithine",
                "L-valine",
                "N-acetyl-5-aminosalicylic acid",
                "N-acetylphenylalanine",
                "N-purin-6-oyl-epsilon-aminocaproic acid",
                "alpha-aminobutyric acid",
                "aminobenzoic acid",
                "anthranilic acid",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "gamma-amino-beta-hydroxybutyric acid",
                "glutamine",
                "glycine",
                "lysine",
                "ornithine"
            ],
            "TP": 9,
            "FP": 17,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-4-32k",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Aminoacetic Acid (Glycine)",
            "2-Aminopropanoic Acid (Alanine)",
            "3-Aminopropanoic Acid (Serine)",
            "2-Amino-3-methylbutanoic Acid (Isoleucine)",
            "2-Amino-3-phenylpropanoic Acid (Phenylalanine)",
            "2-Amino-3-(indol-3-yl)propanoic Acid (Tryptophan)",
            "2-Amino-3-(4-hydroxyphenyl)propanoic Acid (Tyrosine)",
            "2-Amino-4-methylpentanoic Acid (Leucine)",
            "2-Amino-3-(1H-imidazol-5-yl)propanoic Acid (Histidine)",
            "2-Amino-3-(3-methyl-2-oxoimidazolidin-1-yl)propanoic Acid (Threonine)",
            "2-Amino-3-(carbamoylamino)propanoic Acid (Asparagine)",
            "2-Amino-4-(carbamoylamino)butanoic Acid (Aspartic Acid)",
            "2-Amino-3-(3-carboxy-3-oxopropyl)propanoic Acid (Glutamic Acid)",
            "2-Amino-3-(1-carboxy-2-oxopropyl)propanoic Acid (Glutamine)",
            "2-Amino-3-(4-hydroxy-3-methoxyphenyl)propanoic Acid (Methionine)",
            "2-Amino-3-(3-methyl-2-oxopentan-3-yl)propanoic Acid (Valine)",
            "2-Amino-3-(3-methyl-2-oxobutyl)propanoic Acid (Arginine)",
            "2-Amino-3-(1-amino-2-hydroxy-3-oxopropyl)propanoic Acid (Lysine)",
            "2-Amino-3-(3-methyl-2-oxobutyl)propanoic Acid (Proline)",
            "2-Amino-3-(3-hydroxy-2-methylpropanoyl)propanoic Acid (Cysteine)",
            "2-Amino-3-(1-amino-3-oxopropyl)propanoic Acid (Ornithine)",
            "2-Amino-3-(1-amino-2-hydroxy-3-oxobutyl)propanoic Acid (Citrulline)",
            "2-Amino-3-(1-amino-3-oxopropyl)propanoic Acid (GABA)",
            "2-Amino-3-(1-amino-2-hydroxy-3-oxopropyl)propanoic Acid (Taurine)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "asparagine",
                "glycine"
            ],
            "mismatches": [
                "2-Aminopropanoic Acid (Alanine)",
                "3-Aminopropanoic Acid (Serine)",
                "2-Amino-3-methylbutanoic Acid (Isoleucine)",
                "2-Amino-3-phenylpropanoic Acid (Phenylalanine)",
                "2-Amino-3-(indol-3-yl)propanoic Acid (Tryptophan)",
                "2-Amino-3-(4-hydroxyphenyl)propanoic Acid (Tyrosine)",
                "2-Amino-4-methylpentanoic Acid (Leucine)",
                "2-Amino-3-(1H-imidazol-5-yl)propanoic Acid (Histidine)",
                "2-Amino-3-(3-methyl-2-oxoimidazolidin-1-yl)propanoic Acid (Threonine)",
                "2-Amino-4-(carbamoylamino)butanoic Acid (Aspartic Acid)",
                "2-Amino-3-(3-carboxy-3-oxopropyl)propanoic Acid (Glutamic Acid)",
                "2-Amino-3-(1-carboxy-2-oxopropyl)propanoic Acid (Glutamine)",
                "2-Amino-3-(4-hydroxy-3-methoxyphenyl)propanoic Acid (Methionine)",
                "2-Amino-3-(3-methyl-2-oxopentan-3-yl)propanoic Acid (Valine)",
                "2-Amino-3-(3-methyl-2-oxobutyl)propanoic Acid (Arginine)",
                "2-Amino-3-(1-amino-2-hydroxy-3-oxopropyl)propanoic Acid (Lysine)",
                "2-Amino-3-(3-methyl-2-oxobutyl)propanoic Acid (Proline)",
                "2-Amino-3-(3-hydroxy-2-methylpropanoyl)propanoic Acid (Cysteine)",
                "2-Amino-3-(1-amino-3-oxopropyl)propanoic Acid (Ornithine)",
                "2-Amino-3-(1-amino-2-hydroxy-3-oxobutyl)propanoic Acid (Citrulline)",
                "2-Amino-3-(1-amino-3-oxopropyl)propanoic Acid (GABA)",
                "2-Amino-3-(1-amino-2-hydroxy-3-oxopropyl)propanoic Acid (Taurine)"
            ],
            "true_referents": [
                "(2S)-2-Amino-8-hydroxyoctanoic acid",
                "(2S)-2-amino-3-[4-hydroxy-3-(3-methylbut-2-enyl)phenyl]propanoic acid",
                "(3R,5R)-5-amino-3-methyl-D-proline",
                "(3S)-3-Amino-4-(1H-indol-3-yl)butanoic acid",
                "(3S)-3-hydroxy-L-lysine",
                "(3S)-3-hydroxy-L-ornithine",
                "(5S)-5-amino-3-oxohexanoic acid",
                "(R)-2-amino-4-oxopentanoic acid",
                "(R)-3-amino-3-phenylpropanoic acid",
                "(S)-3-amino-3-phenylpropanoic acid",
                "(S)-N-(4,5-Dihydro-1-methyl-4-oxo-1H-imidazol-2-yl)alanine",
                "2-(3-benzyl-2-oxoimidazolidin-1-yl)-N-propylacetamide",
                "2-Amino-4-[(2-hydroxy-1-oxopropyl)amino]butanoic acid",
                "2-[3-carboxy-3-(dimethylamino)propyl]-L-histidine",
                "2-amino-2-methylbutanoic acid",
                "2-amino-3-(2-amino-4-hydroxyphenyl)propanoic acid",
                "2-amino-3-(2-oxo-2,3-dihydro-1H-indol-3-yl)propanoic acid",
                "2-amino-3-methylpentanoic acid",
                "2-amino-3-oxobutanoic acid",
                "2-aminooctanoic acid",
                "2-aminopentanoic acid",
                "2-imino-3-methylene-5-L-(carboxy-L-threoninyl)pyrrolidine",
                "3'-L-asparaginyl-AMP",
                "3-Amino-4-(1H-indol-3-yl)butanoic Acid",
                "3-amino-3-(4-hydroxyphenyl)propanoic acid",
                "3-amino-3-phenylpropanoic acid",
                "4-Amino-2-methylenebutanoic acid",
                "L-N-(3-Carboxypropyl)glutamine",
                "L-alpha-aminobutyric acid",
                "L-citrulline",
                "N(delta)-hydroxy-N(omega)-methyl-L-citrulline zwitterion",
                "N-Acetyl-S-(1-hydroxymethyl-2-propenyl)-cysteine",
                "N-acetyl-S-(3-hydroxypropyl-1-methyl)-L-cysteine",
                "N-carbamoyl-L-aspartic acid",
                "N2-(3-Carboxy-2-hydroxy-1-oxopropyl)arginine",
                "S-(3-Oxo-3-carboxy-n-propyl)cysteine",
                "alpha-N-(3-hydroxyoctadecanoyl)-L-ornithine",
                "asparagine",
                "glycine"
            ],
            "TP": 2,
            "FP": 22,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "gpt-35-turbo-16k",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Aminoacetic acid (Glycine)",
            "Lysine",
            "Aspartic acid",
            "Glutamic acid",
            "Asparagine",
            "Glutamine",
            "Alanine",
            "Valine",
            "Leucine",
            "Isoleucine",
            "Serine",
            "Threonine",
            "Cysteine",
            "Methionine",
            "Phenylalanine",
            "Tyrosine",
            "Tryptophan",
            "Histidine",
            "Arginine",
            "Proline",
            "Ornithine",
            "Citrulline",
            "Homocysteine",
            "Homoserine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Lysine",
                "Aspartic acid",
                "Glutamic acid",
                "Asparagine",
                "Glutamine",
                "Alanine",
                "Valine",
                "Leucine",
                "Isoleucine",
                "Serine",
                "Threonine",
                "Cysteine",
                "Methionine",
                "Phenylalanine",
                "Tyrosine",
                "Tryptophan",
                "Histidine",
                "Arginine",
                "Proline",
                "Ornithine",
                "Citrulline",
                "Homocysteine",
                "Homoserine"
            ],
            "mismatches": [
                "Aminoacetic acid (Glycine)"
            ],
            "true_referents": [
                "L-alanine",
                "L-arginine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "Valine-d8",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "homoserine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 1,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "o1-mini",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Alanine (Ala)",
            "Arginine (Arg)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Cysteine (Cys)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Glycine (Gly)",
            "Histidine (His)",
            "Isoleucine (Ile)",
            "Leucine (Leu)",
            "Lysine (Lys)",
            "Methionine (Met)",
            "Phenylalanine (Phe)",
            "Proline (Pro)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Tryptophan (Trp)",
            "Tyrosine (Tyr)",
            "Valine (Val)",
            "Selenocysteine (Sec)",
            "Pyrrolysine (Pyl)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Alanine (Ala)",
                "Arginine (Arg)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Cysteine (Cys)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Glycine (Gly)",
                "Histidine (His)",
                "Isoleucine (Ile)",
                "Leucine (Leu)",
                "Lysine (Lys)",
                "Methionine (Met)",
                "Phenylalanine (Phe)",
                "Proline (Pro)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Tryptophan (Trp)",
                "Tyrosine (Tyr)",
                "Valine (Val)",
                "Selenocysteine (Sec)",
                "Pyrrolysine (Pyl)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-phenylalanine",
                "L-proline",
                "L-selenocysteine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "phenylalanine",
                "proline",
                "pyrrolysine",
                "selenocysteine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 22,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-5-sonnet-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Serine (Ser)",
            "Cysteine (Cys)",
            "Threonine (Thr)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Methionine (Met)",
            "Proline (Pro)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Histidine (His)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Ornithine",
            "Beta-alanine",
            "Gamma-aminobutyric acid (GABA)",
            "Taurine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Methionine (Met)",
                "Proline (Pro)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Histidine (His)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Ornithine",
                "Beta-alanine",
                "Gamma-aminobutyric acid (GABA)"
            ],
            "mismatches": [
                "Cysteine (Cys)",
                "Taurine"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "alpha-aminobutyric acid",
                "arginine",
                "asparagine",
                "aspartic acid",
                "beta-alanine",
                "beta-alanine betaine",
                "beta-alanopine",
                "cysteine",
                "gamma-aminobutyric acid",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "tauropine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-opus-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Proline (Pro)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "\u03b3-Aminobutyric acid (GABA)",
            "\u03b4-Aminolevulinic acid (ALA)",
            "Ornithine",
            "Citrulline"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Proline (Pro)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Cysteine (Cys)",
                "Methionine (Met)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Histidine (His)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Ornithine",
                "Citrulline"
            ],
            "mismatches": [
                "\u03b3-Aminobutyric acid (GABA)",
                "\u03b4-Aminolevulinic acid (ALA)"
            ],
            "true_referents": [
                "5-aminolevulinic acid",
                "5-aminolevulinic acid hexyl ester",
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "alpha-aminobutyric acid",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "gamma-aminobutyric acid",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "methyl 5-aminolevulinate",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 22,
            "FP": 2,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-sonnet-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Proline (Pro)",
            "Tryptophan (Trp)",
            "Phenylalanine (Phe)",
            "Methionine (Met)",
            "Cysteine (Cys)",
            "Tyrosine (Tyr)",
            "Histidine (His)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Aminobutyric acid",
            "Aminocaproic acid",
            "Aminovaleric acid",
            "Aminoisobutyric acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Proline (Pro)",
                "Tryptophan (Trp)",
                "Phenylalanine (Phe)",
                "Methionine (Met)",
                "Cysteine (Cys)",
                "Tyrosine (Tyr)",
                "Histidine (His)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Serine (Ser)",
                "Threonine (Thr)"
            ],
            "mismatches": [
                "Aminobutyric acid",
                "Aminocaproic acid",
                "Aminovaleric acid",
                "Aminoisobutyric acid"
            ],
            "true_referents": [
                "2-aminoacrylic acid",
                "2-aminoisobutyric acid",
                "3-Aminocaproic acid",
                "3-aminoisobutyric acid",
                "Arginine glutamate",
                "L-alanine",
                "L-alpha-aminobutyric acid",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "N-purin-6-oyl-epsilon-aminocaproic acid",
                "alanine",
                "alpha-amino acid",
                "alpha-aminobutyric acid",
                "arginine",
                "asparagine",
                "aspartic acid",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 20,
            "FP": 4,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "anthropic.claude-3-haiku-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Cysteine (Cys)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Proline (Pro)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Methionine (Met)",
            "Ornithine (Orn)",
            "Citrulline (Cit)",
            "Homocysteine (Hcy)",
            "Homoserine (Hse)"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Cysteine (Cys)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Proline (Pro)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Histidine (His)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Methionine (Met)",
                "Ornithine (Orn)",
                "Citrulline (Cit)",
                "Homocysteine (Hcy)",
                "Homoserine (Hse)"
            ],
            "mismatches": [],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-ornithine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "homocysteine",
                "homoserine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "ornithine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 24,
            "FP": 0,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-8b-instruct-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Asparagine (Asn)",
            "Glutamine (Gln)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Lysine (Lys)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Cysteine (Cys)",
            "Methionine (Met)",
            "Proline (Pro)",
            "Glutathione",
            "Creatine",
            "Carnosine",
            "Anserine",
            "Orotidine monophosphate",
            "N-Acetylglycine"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Asparagine (Asn)",
                "Glutamine (Gln)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Lysine (Lys)",
                "Arginine (Arg)",
                "Histidine (His)",
                "Cysteine (Cys)",
                "Methionine (Met)",
                "Proline (Pro)",
                "Glutathione",
                "Creatine",
                "Anserine"
            ],
            "mismatches": [
                "Carnosine",
                "Orotidine monophosphate",
                "N-Acetylglycine"
            ],
            "true_referents": [
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-glutamic acid",
                "L-glutamine",
                "L-isoleucine",
                "L-leucine",
                "L-methionine",
                "L-phenylalanine",
                "L-proline",
                "L-serine",
                "L-threonine",
                "L-valine",
                "N-acylserine",
                "alanine",
                "anserine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "creatine",
                "cysteine",
                "glutamic acid",
                "glutamine",
                "glutathione",
                "glycine",
                "histidine",
                "homocarnosine",
                "isoleucine",
                "leucine",
                "lysine",
                "methionine",
                "phenylalanine",
                "proline",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 23,
            "FP": 3,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "meta.llama3-70b-instruct-v1:0",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": [
            "Glycine (Gly)",
            "Alanine (Ala)",
            "Valine (Val)",
            "Leucine (Leu)",
            "Isoleucine (Ile)",
            "Phenylalanine (Phe)",
            "Tyrosine (Tyr)",
            "Tryptophan (Trp)",
            "Serine (Ser)",
            "Threonine (Thr)",
            "Asparagine (Asn)",
            "Aspartic acid (Asp)",
            "Glutamic acid (Glu)",
            "Glutamine (Gln)",
            "Arginine (Arg)",
            "Histidine (His)",
            "Lysine (Lys)",
            "Citrulline",
            "Homocitrulline",
            " Ornithine",
            "alpha-Aminoadipic acid",
            "2-Aminomuconic acid",
            "2-Aminopimelic acid",
            "N-Acetylaspartic acid",
            "N-Acetylglutamic acid"
        ],
        "scorer": "gpt-4o",
        "judgement": {
            "matches": [
                "Glycine (Gly)",
                "Alanine (Ala)",
                "Valine (Val)",
                "Leucine (Leu)",
                "Isoleucine (Ile)",
                "Phenylalanine (Phe)",
                "Tyrosine (Tyr)",
                "Tryptophan (Trp)",
                "Serine (Ser)",
                "Threonine (Thr)",
                "Asparagine (Asn)",
                "Aspartic acid (Asp)",
                "Glutamic acid (Glu)",
                "Glutamine (Gln)",
                "Arginine (Arg)",
                "Histidine (His)",
                "Lysine (Lys)",
                "Citrulline",
                "Ornithine"
            ],
            "mismatches": [
                "Homocitrulline",
                "alpha-Aminoadipic acid",
                "2-Aminomuconic acid",
                "2-Aminopimelic acid",
                "N-Acetylaspartic acid",
                "N-Acetylglutamic acid"
            ],
            "true_referents": [
                "(2E,4Z)-2-aminomuconic acid",
                "2-aminomuconic acid",
                "2-aminopimelic acid",
                "3-aminoadipic acid",
                "Arginine glutamate",
                "L-alanine",
                "L-asparagine",
                "L-aspartic acid",
                "L-citrulline",
                "L-glutamic acid",
                "L-glutamine",
                "L-homocitrulline",
                "L-isoleucine",
                "L-leucine",
                "L-ornithine",
                "L-phenylalanine",
                "L-serine",
                "L-threonine",
                "L-valine",
                "N-acetyl-L-aspartic acid",
                "alanine",
                "arginine",
                "asparagine",
                "aspartic acid",
                "citrulline",
                "glutamic acid",
                "glutamine",
                "glycine",
                "histidine",
                "isoleucine",
                "leucine",
                "lysine",
                "ornithine",
                "phenylalanine",
                "serine",
                "threonine",
                "tryptophan",
                "tyrosine",
                "valine"
            ],
            "TP": 19,
            "FP": 6,
            "FN": 0
        }
    },
    {
        "test": "limited-list-referents-from-selection-criteria",
        "responder": "amazon.titan-text-express-v1",
        "concept": "amino acid",
        "domain": "chemistry",
        "response": "Sorry - this model is unable to respond to this request.",
        "scorer": "gpt-4o",
        "judgement": {
            "TP": 0,
            "FP": 0
        }
    }
]