[{"key": "35232142", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4882833960702494, "ground_truth": 0}, {"key": "35232142", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5851011688070976, "ground_truth": 0}, {"key": "35232142", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.501953112230448, "ground_truth": 0}, {"key": "35232142", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051964221994, "ground_truth": 0}, {"key": "35232142", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268347778313186, "ground_truth": 0}, {"key": "40143035", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6619228614321888, "ground_truth": 0}, {"key": "40143035", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6132365760624339, "ground_truth": 0}, {"key": "40143035", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8577681048431857, "ground_truth": 0}, {"key": "40143035", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786410589237, "ground_truth": 0}, {"key": "40143035", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671317567157, "ground_truth": 0}, {"key": "35951548", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07640768034374251, "ground_truth": 0}, {"key": "35951548", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26588048160116345, "ground_truth": 0}, {"key": "35951548", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1530421503742101, "ground_truth": 0}, {"key": "35951548", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.0863234712938483, "ground_truth": 0}, {"key": "35951548", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441029352613371, "ground_truth": 0}, {"key": "36266422", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31573597888025184, "ground_truth": 0}, {"key": "36266422", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33458946840476, "ground_truth": 0}, {"key": "36266422", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38491216055424116, "ground_truth": 0}, {"key": "36266422", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808479269678, "ground_truth": 0}, {"key": "36266422", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26133093502084387, "ground_truth": 0}, {"key": "38826984", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3738758186900707, "ground_truth": 0}, {"key": "38826984", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.284576023600916, "ground_truth": 0}, {"key": "38826984", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6460136768962959, "ground_truth": 0}, {"key": "38826984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.472683472898067, "ground_truth": 0}, {"key": "38826984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883686919384, "ground_truth": 0}, {"key": "34540833", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4073334110121783, "ground_truth": 0}, {"key": "34540833", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44939263417411274, "ground_truth": 0}, {"key": "34540833", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864512019825944, "ground_truth": 0}, {"key": "34540833", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988557947039, "ground_truth": 0}, {"key": "34540833", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25832597838977966, "ground_truth": 0}, {"key": "20836172", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4016877854896062, "ground_truth": 0}, {"key": "20836172", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117166086052224, "ground_truth": 0}, {"key": "20836172", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4359015188383829, "ground_truth": 0}, {"key": "20836172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033678313656, "ground_truth": 0}, {"key": "20836172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783949730015, "ground_truth": 0}, {"key": "35932467", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46295860079126794, "ground_truth": 0}, {"key": "35932467", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31069436578976317, "ground_truth": 0}, {"key": "35932467", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47073662968608676, "ground_truth": 0}, {"key": "35932467", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488595596113, "ground_truth": 0}, {"key": "35932467", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523172901299, "ground_truth": 0}, {"key": "40758845", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.567936594054859, "ground_truth": 0}, {"key": "40758845", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30735801617154024, "ground_truth": 0}, {"key": "40758845", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093626627072, "ground_truth": 0}, {"key": "40758845", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505172678464, "ground_truth": 0}, {"key": "40758845", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074555611809467, "ground_truth": 0}, {"key": "30358490", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6842640168030676, "ground_truth": 0}, {"key": "30358490", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3720487488250958, "ground_truth": 0}, {"key": "30358490", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6388352276052414, "ground_truth": 0}, {"key": "30358490", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976088971229213, "ground_truth": 0}, {"key": "30358490", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943903566229, "ground_truth": 0}, {"key": "34615665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7201715103768018, "ground_truth": 0}, {"key": "34615665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.786622824939558, "ground_truth": 0}, {"key": "34615665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8267117857234516, "ground_truth": 0}, {"key": "34615665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359866557772, "ground_truth": 0}, {"key": "34615665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434850943743, "ground_truth": 0}, {"key": "35890902", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995482040368, "ground_truth": 0}, {"key": "35890902", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117166224036772, "ground_truth": 0}, {"key": "35890902", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5097643575634945, "ground_truth": 0}, {"key": "35890902", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995921440057, "ground_truth": 0}, {"key": "35890902", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758103596964, "ground_truth": 0}, {"key": "37922330", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7759445435039714, "ground_truth": 0}, {"key": "37922330", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4649015538176484, "ground_truth": 0}, {"key": "37922330", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7892336915768411, "ground_truth": 0}, {"key": "37922330", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159552807453, "ground_truth": 0}, {"key": "37922330", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647871647499, "ground_truth": 0}, {"key": "30844962", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44167299373856694, "ground_truth": 0}, {"key": "30844962", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3923368469849281, "ground_truth": 0}, {"key": "30844962", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.177810866591421, "ground_truth": 0}, {"key": "30844962", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804688036981887, "ground_truth": 0}, {"key": "30844962", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293916787179394, "ground_truth": 0}, {"key": "36217333", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32939171446328686, "ground_truth": 0}, {"key": "36217333", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39047582376841483, "ground_truth": 0}, {"key": "36217333", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3886180410104813, "ground_truth": 0}, {"key": "36217333", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756752487716925, "ground_truth": 0}, {"key": "36217333", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051667343433, "ground_truth": 0}, {"key": "30816523", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3293917477774365, "ground_truth": 0}, {"key": "30816523", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33633105052865164, "ground_truth": 0}, {"key": "30816523", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4882833937633189, "ground_truth": 0}, {"key": "30816523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296918279319307, "ground_truth": 0}, {"key": "30816523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360042219592094, "ground_truth": 0}, {"key": "38900884", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8344068768485048, "ground_truth": 0}, {"key": "38900884", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.562176502960349, "ground_truth": 0}, {"key": "38900884", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7690802215311209, "ground_truth": 0}, {"key": "38900884", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.712232189540726, "ground_truth": 0}, {"key": "38900884", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.77864931120601, "ground_truth": 0}, {"key": "13890581", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5926665848169695, "ground_truth": 0}, {"key": "13890581", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15203224713443983, "ground_truth": 0}, {"key": "13890581", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42250459943185203, "ground_truth": 0}, {"key": "13890581", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631815221605, "ground_truth": 0}, {"key": "13890581", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852882855176254, "ground_truth": 0}, {"key": "40194700", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6442251076230586, "ground_truth": 0}, {"key": "40194700", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7943849532319096, "ground_truth": 0}, {"key": "40194700", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6909762992464019, "ground_truth": 0}, {"key": "40194700", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206784311209, "ground_truth": 0}, {"key": "40194700", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148413288527, "ground_truth": 0}, {"key": "37903647", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07751765844586819, "ground_truth": 0}, {"key": "37903647", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15817434379128636, "ground_truth": 0}, {"key": "37903647", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1311732243126002, "ground_truth": 0}, {"key": "37903647", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.06705628365054218, "ground_truth": 0}, {"key": "37903647", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1159607191731954, "ground_truth": 0}, {"key": "13291223", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23510836662995094, "ground_truth": 0}, {"key": "13291223", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3073580186567427, "ground_truth": 0}, {"key": "13291223", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.324235421818759, "ground_truth": 0}, {"key": "13291223", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436406814759, "ground_truth": 0}, {"key": "13291223", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512973402281826, "ground_truth": 0}, {"key": "36052570", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21076631189815836, "ground_truth": 0}, {"key": "36052570", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5019530898026967, "ground_truth": 0}, {"key": "36052570", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40922082257295944, "ground_truth": 0}, {"key": "36052570", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912139033796244, "ground_truth": 0}, {"key": "36052570", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405544852432233, "ground_truth": 0}, {"key": "34944735", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28616925752272493, "ground_truth": 0}, {"key": "34944735", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4551985888414865, "ground_truth": 0}, {"key": "34944735", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5851011442280163, "ground_truth": 0}, {"key": "34944735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.738669057504894, "ground_truth": 0}, {"key": "34944735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765080093593, "ground_truth": 0}, {"key": "32159602", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3007455891770545, "ground_truth": 0}, {"key": "32159602", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3056973145886061, "ground_truth": 0}, {"key": "32159602", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24508502252143047, "ground_truth": 0}, {"key": "32159602", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386100547353146, "ground_truth": 0}, {"key": "32159602", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370635786555233, "ground_truth": 0}, {"key": "34988915", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38861803113940585, "ground_truth": 0}, {"key": "34988915", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23231013519703517, "ground_truth": 0}, {"key": "34988915", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30569730500702486, "ground_truth": 0}, {"key": "34988915", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641454295875, "ground_truth": 0}, {"key": "34988915", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238404124979413, "ground_truth": 0}, {"key": "37889203", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819645956095, "ground_truth": 0}, {"key": "37889203", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8688267866053639, "ground_truth": 0}, {"key": "37889203", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8019358089863085, "ground_truth": 0}, {"key": "37889203", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575650631086, "ground_truth": 0}, {"key": "37889203", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317174544414, "ground_truth": 0}, {"key": "33609927", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601153766555553, "ground_truth": 0}, {"key": "33609927", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23792989051601218, "ground_truth": 0}, {"key": "33609927", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1561048881544773, "ground_truth": 0}, {"key": "33609927", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.270480203680656, "ground_truth": 0}, {"key": "33609927", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3647775402700572, "ground_truth": 0}, {"key": "33578778", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48633153156882514, "ground_truth": 0}, {"key": "33578778", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.359364167346555, "ground_truth": 0}, {"key": "33578778", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32939171893132035, "ground_truth": 0}, {"key": "33578778", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059960012263337, "ground_truth": 0}, {"key": "33578778", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906452868287, "ground_truth": 0}, {"key": "36888270", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7008947991479848, "ground_truth": 0}, {"key": "36888270", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4668455998579149, "ground_truth": 0}, {"key": "36888270", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6334102642266393, "ground_truth": 0}, {"key": "36888270", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437746752644, "ground_truth": 0}, {"key": "36888270", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419753831434, "ground_truth": 0}, {"key": "36846007", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.925229947910607, "ground_truth": 0}, {"key": "36846007", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8397339872745198, "ground_truth": 0}, {"key": "36846007", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8705972639720398, "ground_truth": 0}, {"key": "36846007", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357682525865, "ground_truth": 0}, {"key": "36846007", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9278877926701776, "ground_truth": 0}, {"key": "31723471", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5097644056409801, "ground_truth": 0}, {"key": "31723471", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5717666096013896, "ground_truth": 0}, {"key": "31723471", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4532618511425256, "ground_truth": 0}, {"key": "31723471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.687630000220625, "ground_truth": 0}, {"key": "31723471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269643099887, "ground_truth": 0}, {"key": "15921828", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49414089641660564, "ground_truth": 0}, {"key": "15921828", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3259495174640213, "ground_truth": 0}, {"key": "15921828", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30074556425761384, "ground_truth": 0}, {"key": "15921828", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35936411345604924, "ground_truth": 0}, {"key": "15921828", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064506878043, "ground_truth": 0}, {"key": "39109408", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06512754818385341, "ground_truth": 0}, {"key": "39109408", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10017220820526886, "ground_truth": 0}, {"key": "39109408", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18126321104557006, "ground_truth": 0}, {"key": "39109408", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149887327722, "ground_truth": 0}, {"key": "39109408", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10087861728144659, "ground_truth": 0}, {"key": "20936833", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1159607118979452, "ground_truth": 0}, {"key": "20936833", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.06754668960788765, "ground_truth": 0}, {"key": "20936833", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.0953494632134608, "ground_truth": 0}, {"key": "20936833", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.06804041791037514, "ground_truth": 0}, {"key": "20936833", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08756383295503745, "ground_truth": 0}, {"key": "36832879", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242353703620367, "ground_truth": 0}, {"key": "36832879", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49804687328555347, "ground_truth": 0}, {"key": "36832879", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39047585609654356, "ground_truth": 0}, {"key": "36832879", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487918261448, "ground_truth": 0}, {"key": "36832879", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055767631791993, "ground_truth": 0}, {"key": "14958201", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4148988415619033, "ground_truth": 0}, {"key": "14958201", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47073656950056897, "ground_truth": 0}, {"key": "14958201", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35577488292834086, "ground_truth": 0}, {"key": "14958201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632162717168154, "ground_truth": 0}, {"key": "14958201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206337800997957, "ground_truth": 0}, {"key": "34352262", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.04958902736081325, "ground_truth": 0}, {"key": "34352262", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11279540172774477, "ground_truth": 0}, {"key": "34352262", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09009299272149084, "ground_truth": 0}, {"key": "34352262", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08882029174922537, "ground_truth": 0}, {"key": "34352262", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.0821066241862719, "ground_truth": 0}, {"key": "39805395", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25386099811199947, "ground_truth": 0}, {"key": "39805395", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17781088205444076, "ground_truth": 0}, {"key": "39805395", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2829881261791239, "ground_truth": 0}, {"key": "39805395", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905129193479, "ground_truth": 0}, {"key": "39805395", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213848968649, "ground_truth": 0}, {"key": "34303109", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1490353037880726, "ground_truth": 0}, {"key": "34303109", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13477591890895357, "ground_truth": 0}, {"key": "34303109", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13028542082925765, "ground_truth": 0}, {"key": "34303109", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002709366192, "ground_truth": 0}, {"key": "34303109", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669058997579867, "ground_truth": 0}, {"key": "39939090", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6636689763756216, "ground_truth": 0}, {"key": "39939090", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2845759919736916, "ground_truth": 0}, {"key": "39939090", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42250465135503285, "ground_truth": 0}, {"key": "39939090", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384269604852, "ground_truth": 0}, {"key": "39939090", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105530194425, "ground_truth": 0}, {"key": "29347771", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.640635866313716, "ground_truth": 0}, {"key": "29347771", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938237055499, "ground_truth": 0}, {"key": "29347771", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6460137149374641, "ground_truth": 0}, {"key": "29347771", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819757372959, "ground_truth": 0}, {"key": "29347771", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299964820364, "ground_truth": 0}, {"key": "36783415", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22541662483032168, "ground_truth": 0}, {"key": "36783415", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17667161207283316, "ground_truth": 0}, {"key": "36783415", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12940271701910191, "ground_truth": 0}, {"key": "36783415", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069438976507513, "ground_truth": 0}, {"key": "36783415", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.218669366768771, "ground_truth": 0}, {"key": "37935687", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3433417324530007, "ground_truth": 0}, {"key": "37935687", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43590151630375673, "ground_truth": 0}, {"key": "37935687", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4668456099355448, "ground_truth": 0}, {"key": "37935687", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937836947531756, "ground_truth": 0}, {"key": "37935687", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675186738205, "ground_truth": 0}, {"key": "40260829", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6206216290274694, "ground_truth": 0}, {"key": "40260829", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.519521336421701, "ground_truth": 0}, {"key": "40260829", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5097643724114794, "ground_truth": 0}, {"key": "40260829", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544874836182987, "ground_truth": 0}, {"key": "40260829", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704681630881, "ground_truth": 0}, {"key": "36478199", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.647798224598032, "ground_truth": 0}, {"key": "36478199", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5195213312822418, "ground_truth": 0}, {"key": "36478199", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5039061824554572, "ground_truth": 0}, {"key": "36478199", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513265046304664, "ground_truth": 0}, {"key": "36478199", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531103413872, "ground_truth": 0}, {"key": "34541803", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4726834679285257, "ground_truth": 0}, {"key": "34541803", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19193277552415738, "ground_truth": 0}, {"key": "34541803", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6113819891969954, "ground_truth": 0}, {"key": "34541803", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1120159561125936, "ground_truth": 0}, {"key": "34541803", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11201595520556437, "ground_truth": 0}, {"key": "35360841", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7310585827878092, "ground_truth": 0}, {"key": "35360841", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7008948120683826, "ground_truth": 0}, {"key": "35360841", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49218812288934866, "ground_truth": 0}, {"key": "35360841", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388353130117507, "ground_truth": 0}, {"key": "35360841", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121668197975, "ground_truth": 0}, {"key": "35550407", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4980468937508455, "ground_truth": 0}, {"key": "35550407", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39420095606645583, "ground_truth": 0}, {"key": "35550407", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4843800749794059, "ground_truth": 0}, {"key": "35550407", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262938511354, "ground_truth": 0}, {"key": "35550407", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647315782491, "ground_truth": 0}, {"key": "37561590", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6943026601348153, "ground_truth": 0}, {"key": "37561590", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5234203625078101, "ground_truth": 0}, {"key": "37561590", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8955226824464524, "ground_truth": 0}, {"key": "37561590", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982340071952, "ground_truth": 0}, {"key": "37561590", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802546194587, "ground_truth": 0}, {"key": "39328843", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8354835381100969, "ground_truth": 0}, {"key": "39328843", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8587185723073811, "ground_truth": 0}, {"key": "39328843", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8887587896512347, "ground_truth": 0}, {"key": "39328843", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.874077236559965, "ground_truth": 0}, {"key": "39328843", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178973081955, "ground_truth": 0}, {"key": "35389665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9039745111962257, "ground_truth": 0}, {"key": "35389665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8705972664277253, "ground_truth": 0}, {"key": "35389665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9489172641079628, "ground_truth": 0}, {"key": "35389665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.942081914402821, "ground_truth": 0}, {"key": "35389665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9394706053286577, "ground_truth": 0}, {"key": "33080187", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10302442601208216, "ground_truth": 0}, {"key": "33080187", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.08449275109948436, "ground_truth": 0}, {"key": "33080187", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07751765464206498, "ground_truth": 0}, {"key": "33080187", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.06187598401648724, "ground_truth": 0}, {"key": "33080187", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.05749327352328194, "ground_truth": 0}, {"key": "38636995", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2351083921488054, "ground_truth": 0}, {"key": "38636995", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30569734723337116, "ground_truth": 0}, {"key": "38636995", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28140560569599915, "ground_truth": 0}, {"key": "38636995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569735015666893, "ground_truth": 0}, {"key": "38636995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108600270896, "ground_truth": 0}, {"key": "18536236", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5583269719546111, "ground_truth": 0}, {"key": "18536236", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6279512227314107, "ground_truth": 0}, {"key": "18536236", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "18536236", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073527456474, "ground_truth": 0}, {"key": "18536236", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352713854403, "ground_truth": 0}, {"key": "36289151", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.147064528885372, "ground_truth": 0}, {"key": "36289151", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061698014226, "ground_truth": 0}, {"key": "36289151", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25832597174888244, "ground_truth": 0}, {"key": "36289151", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882833763954215, "ground_truth": 0}, {"key": "36289151", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3647775462720865, "ground_truth": 0}, {"key": "23017045", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3812195857358667, "ground_truth": 0}, {"key": "23017045", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5698526369714441, "ground_truth": 0}, {"key": "23017045", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6076631693629204, "ground_truth": 0}, {"key": "23017045", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.583203369504352, "ground_truth": 0}, {"key": "23017045", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531256749648, "ground_truth": 0}, {"key": "36418082", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5717665975486264, "ground_truth": 0}, {"key": "36418082", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5888891273241526, "ground_truth": 0}, {"key": "36418082", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.697608911914202, "ground_truth": 0}, {"key": "36418082", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004154296849, "ground_truth": 0}, {"key": "36418082", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102512028343, "ground_truth": 0}, {"key": "34396551", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33111971750530533, "ground_truth": 0}, {"key": "34396551", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4186968929100951, "ground_truth": 0}, {"key": "34396551", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26588045411330546, "ground_truth": 0}, {"key": "34396551", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474603152660311, "ground_truth": 0}, {"key": "34396551", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633104777904704, "ground_truth": 0}, {"key": "39720944", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711698831139, "ground_truth": 0}, {"key": "39720944", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6654105585322732, "ground_truth": 0}, {"key": "39720944", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.675764578817017, "ground_truth": 0}, {"key": "39720944", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512401399552, "ground_truth": 0}, {"key": "39720944", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365587300584, "ground_truth": 0}, {"key": "35884842", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14903527780827996, "ground_truth": 0}, {"key": "35884842", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2538609839444346, "ground_truth": 0}, {"key": "35884842", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18713267598794972, "ground_truth": 0}, {"key": "35884842", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689404877755485, "ground_truth": 0}, {"key": "35884842", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509649387459, "ground_truth": 0}, {"key": "35403375", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1581743519891611, "ground_truth": 0}, {"key": "35403375", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1550784674891175, "ground_truth": 0}, {"key": "35403375", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11279538974090371, "ground_truth": 0}, {"key": "35403375", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562174729245, "ground_truth": 0}, {"key": "35403375", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740124371964, "ground_truth": 0}, {"key": "26341324", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8322366491292174, "ground_truth": 0}, {"key": "26341324", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7648916181369521, "ground_truth": 0}, {"key": "26341324", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7892336892319175, "ground_truth": 0}, {"key": "26341324", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950901130553, "ground_truth": 0}, {"key": "26341324", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645940425913, "ground_truth": 0}, {"key": "19212345", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117166030349528, "ground_truth": 0}, {"key": "19212345", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794004332275141, "ground_truth": 0}, {"key": "19212345", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6187803918712581, "ground_truth": 0}, {"key": "19212345", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468510553694, "ground_truth": 0}, {"key": "19212345", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365655684442, "ground_truth": 0}, {"key": "30548367", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4921881427993071, "ground_truth": 0}, {"key": "30548367", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6842640301770717, "ground_truth": 0}, {"key": "30548367", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.715423988484102, "ground_truth": 0}, {"key": "30548367", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358233315583, "ground_truth": 0}, {"key": "30548367", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737238219152, "ground_truth": 0}, {"key": "37919402", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.760650654417809, "ground_truth": 0}, {"key": "37919402", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026539467917, "ground_truth": 0}, {"key": "37919402", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717666125906116, "ground_truth": 0}, {"key": "37919402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324801752754, "ground_truth": 0}, {"key": "37919402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.783988464511167, "ground_truth": 0}, {"key": "39995133", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.835483532069894, "ground_truth": 0}, {"key": "39995133", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8887587951573226, "ground_truth": 0}, {"key": "39995133", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7386690959967155, "ground_truth": 0}, {"key": "39995133", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825912014307, "ground_truth": 0}, {"key": "39995133", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476672388309, "ground_truth": 0}, {"key": "40249088", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "40249088", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026956784022, "ground_truth": 0}, {"key": "40249088", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3380771101490131, "ground_truth": 0}, {"key": "40249088", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891365127416, "ground_truth": 0}, {"key": "40249088", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.754914996463337, "ground_truth": 0}, {"key": "40254388", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40922080140876443, "ground_truth": 0}, {"key": "40254388", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33285232247715557, "ground_truth": 0}, {"key": "40254388", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4397473473279116, "ground_truth": 0}, {"key": "40254388", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203425515309, "ground_truth": 0}, {"key": "40254388", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207902682025, "ground_truth": 0}, {"key": "31995230", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6460136767557672, "ground_truth": 0}, {"key": "31995230", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6057990095742585, "ground_truth": 0}, {"key": "31995230", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8056321905807604, "ground_truth": 0}, {"key": "31995230", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284004967615, "ground_truth": 0}, {"key": "31995230", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513668560634, "ground_truth": 0}, {"key": "38632129", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6076631594709737, "ground_truth": 0}, {"key": "38632129", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49804689075694714, "ground_truth": 0}, {"key": "38632129", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5698526752525257, "ground_truth": 0}, {"key": "38632129", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707366020737605, "ground_truth": 0}, {"key": "38632129", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316857812336, "ground_truth": 0}, {"key": "35720795", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331544078068281, "ground_truth": 0}, {"key": "35720795", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.616935837808878, "ground_truth": 0}, {"key": "35720795", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "35720795", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601360268558, "ground_truth": 0}, {"key": "35720795", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473492963133, "ground_truth": 0}, {"key": "23906759", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24944723468129856, "ground_truth": 0}, {"key": "23906759", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6859494621804748, "ground_truth": 0}, {"key": "23906759", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6076631759052318, "ground_truth": 0}, {"key": "23906759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311711527146, "ground_truth": 0}, {"key": "23906759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704834360167, "ground_truth": 0}, {"key": "19410108", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45132651260409545, "ground_truth": 0}, {"key": "19410108", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4551986182371055, "ground_truth": 0}, {"key": "19410108", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26133094981121174, "ground_truth": 0}, {"key": "19410108", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195555933664, "ground_truth": 0}, {"key": "19410108", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544875551450765, "ground_truth": 0}, {"key": "30745137", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.294214951870483, "ground_truth": 0}, {"key": "30745137", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4687906474163052, "ground_truth": 0}, {"key": "30745137", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2479874237581508, "ground_truth": 0}, {"key": "30745137", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26894143761696926, "ground_truth": 0}, {"key": "30745137", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202454719167424, "ground_truth": 0}, {"key": "26553115", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30902370766336007, "ground_truth": 0}, {"key": "26553115", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.332852331859079, "ground_truth": 0}, {"key": "26553115", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25982564951516346, "ground_truth": 0}, {"key": "26553115", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359781643777, "ground_truth": 0}, {"key": "26553115", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818894725359994, "ground_truth": 0}, {"key": "37872311", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8365545609422624, "ground_truth": 0}, {"key": "37872311", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6548947205367824, "ground_truth": 0}, {"key": "37872311", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9246876968643833, "ground_truth": 0}, {"key": "37872311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943591678801, "ground_truth": 0}, {"key": "37872311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445534346116, "ground_truth": 0}, {"key": "35553131", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7122321689845477, "ground_truth": 0}, {"key": "35553131", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8705972859735136, "ground_truth": 0}, {"key": "35553131", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8596637505209744, "ground_truth": 0}, {"key": "35553131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763079379629, "ground_truth": 0}, {"key": "35553131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760334578325, "ground_truth": 0}, {"key": "39038936", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49218815876648797, "ground_truth": 0}, {"key": "39038936", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37022536380820736, "ground_truth": 0}, {"key": "39038936", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33458945887533775, "ground_truth": 0}, {"key": "39038936", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792281511114, "ground_truth": 0}, {"key": "39038936", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300355289913754, "ground_truth": 0}, {"key": "38735486", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9844563531301089, "ground_truth": 0}, {"key": "38735486", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9481545344362227, "ground_truth": 0}, {"key": "38735486", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9681411432099031, "ground_truth": 0}, {"key": "38735486", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087970250822, "ground_truth": 0}, {"key": "38735486", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179872990183, "ground_truth": 0}, {"key": "17087845", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2553436453110467, "ground_truth": 0}, {"key": "17087845", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37937839193108125, "ground_truth": 0}, {"key": "17087845", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3040416714232261, "ground_truth": 0}, {"key": "17087845", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398629202043785, "ground_truth": 0}, {"key": "17087845", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193278356875051, "ground_truth": 0}, {"key": "37443011", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5467381358045074, "ground_truth": 0}, {"key": "37443011", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026644334926, "ground_truth": 0}, {"key": "37443011", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.511716602750749, "ground_truth": 0}, {"key": "37443011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.718594375540974, "ground_truth": 0}, {"key": "37443011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.548673504202631, "ground_truth": 0}, {"key": "36855749", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5964331411470184, "ground_truth": 0}, {"key": "36855749", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6352224503448812, "ground_truth": 0}, {"key": "36855749", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6132365689258347, "ground_truth": 0}, {"key": "36855749", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082588313811, "ground_truth": 0}, {"key": "36855749", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419730859915, "ground_truth": 0}, {"key": "35613141", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5907791793002939, "ground_truth": 0}, {"key": "35613141", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6279512006236891, "ground_truth": 0}, {"key": "35613141", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37204878183548645, "ground_truth": 0}, {"key": "35613141", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519858671903846, "ground_truth": 0}, {"key": "35613141", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220177668945063, "ground_truth": 0}, {"key": "39088847", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5078118668237559, "ground_truth": 0}, {"key": "39088847", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36477756698136327, "ground_truth": 0}, {"key": "39088847", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39606815489820607, "ground_truth": 0}, {"key": "39088847", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.352201784782752, "ground_truth": 0}, {"key": "39088847", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687308581279297, "ground_truth": 0}, {"key": "33197277", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32423540077470214, "ground_truth": 0}, {"key": "33197277", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7371581585272685, "ground_truth": 0}, {"key": "33197277", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6388352463659527, "ground_truth": 0}, {"key": "33197277", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943850361173, "ground_truth": 0}, {"key": "33197277", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964257479986, "ground_truth": 0}, {"key": "33815489", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35936413173223697, "ground_truth": 0}, {"key": "33815489", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "33815489", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5428632874243972, "ground_truth": 0}, {"key": "33815489", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269924490637, "ground_truth": 0}, {"key": "33815489", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526405663742, "ground_truth": 0}, {"key": "35862754", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6601723688541846, "ground_truth": 0}, {"key": "35862754", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6169358203854287, "ground_truth": 0}, {"key": "35862754", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584174965991768, "ground_truth": 0}, {"key": "35862754", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324619381536, "ground_truth": 0}, {"key": "35862754", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512582171971, "ground_truth": 0}, {"key": "36080615", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18952109840451667, "ground_truth": 0}, {"key": "36080615", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3191213989813281, "ground_truth": 0}, {"key": "36080615", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21866938205066705, "ground_truth": 0}, {"key": "36080615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.270480218707246, "ground_truth": 0}, {"key": "36080615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2479874168963398, "ground_truth": 0}, {"key": "22822742", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318268861292, "ground_truth": 0}, {"key": "22822742", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.737158152285254, "ground_truth": 0}, {"key": "22822742", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7759445289755296, "ground_truth": 0}, {"key": "22822742", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666482428007, "ground_truth": 0}, {"key": "22822742", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702826447829, "ground_truth": 0}, {"key": "39747536", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36658972464908607, "ground_truth": 0}, {"key": "39747536", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2893716951873684, "ground_truth": 0}, {"key": "39747536", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26894141963120183, "ground_truth": 0}, {"key": "39747536", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539863278540106, "ground_truth": 0}, {"key": "39747536", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421496704328703, "ground_truth": 0}, {"key": "34218396", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819877271959, "ground_truth": 0}, {"key": "34218396", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.679178699414535, "ground_truth": 0}, {"key": "34218396", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6531268960742116, "ground_truth": 0}, {"key": "34218396", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414088922448157, "ground_truth": 0}, {"key": "34218396", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.759225427312073, "ground_truth": 0}, {"key": "39150388", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35398630283907356, "ground_truth": 0}, {"key": "39150388", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5078118355474663, "ground_truth": 0}, {"key": "39150388", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42632158481656746, "ground_truth": 0}, {"key": "39150388", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593640991156983, "ground_truth": 0}, {"key": "39150388", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011428222662, "ground_truth": 0}, {"key": "28765782", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.314050540675329, "ground_truth": 0}, {"key": "28765782", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4035668665950683, "ground_truth": 0}, {"key": "28765782", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3684056988718581, "ground_truth": 0}, {"key": "28765782", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455810829084, "ground_truth": 0}, {"key": "28765782", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33807710962194343, "ground_truth": 0}, {"key": "35828022", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28616922691041796, "ground_truth": 0}, {"key": "35828022", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6636689627888296, "ground_truth": 0}, {"key": "35828022", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7416739913745548, "ground_truth": 0}, {"key": "35828022", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.54092386276841, "ground_truth": 0}, {"key": "35828022", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526476052574, "ground_truth": 0}, {"key": "27717735", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684785683839, "ground_truth": 0}, {"key": "27717735", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43206339571830277, "ground_truth": 0}, {"key": "27717735", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40733342741942513, "ground_truth": 0}, {"key": "27717735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011453782167, "ground_truth": 0}, {"key": "27717735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684942450663, "ground_truth": 0}, {"key": "37977826", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5370413453019385, "ground_truth": 0}, {"key": "37977826", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32252600853012475, "ground_truth": 0}, {"key": "37977826", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6774740199676372, "ground_truth": 0}, {"key": "37977826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782351704728034, "ground_truth": 0}, {"key": "37977826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665837512499, "ground_truth": 0}, {"key": "31768588", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7401743805385164, "ground_truth": 0}, {"key": "31768588", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7676898511648358, "ground_truth": 0}, {"key": "31768588", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8210441234360786, "ground_truth": 0}, {"key": "31768588", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238621956567, "ground_truth": 0}, {"key": "31768588", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789037138144, "ground_truth": 0}, {"key": "37183351", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3702253794263179, "ground_truth": 0}, {"key": "37183351", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31573598745547415, "ground_truth": 0}, {"key": "37183351", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864514084302295, "ground_truth": 0}, {"key": "37183351", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38491214032868887, "ground_truth": 0}, {"key": "37183351", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922083519113933, "ground_truth": 0}, {"key": "39622090", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292633933137632, "ground_truth": 0}, {"key": "39622090", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36477757524554716, "ground_truth": 0}, {"key": "39622090", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397125890218, "ground_truth": 0}, {"key": "39622090", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.394200984797465, "ground_truth": 0}, {"key": "39622090", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34334174783264404, "ground_truth": 0}, {"key": "39272756", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6334102566324122, "ground_truth": 0}, {"key": "39272756", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4205995792136617, "ground_truth": 0}, {"key": "39272756", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5583269803329836, "ground_truth": 0}, {"key": "39272756", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941409016886072, "ground_truth": 0}, {"key": "39272756", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984343646418, "ground_truth": 0}, {"key": "32138822", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49218816132396886, "ground_truth": 0}, {"key": "32138822", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6388352921773696, "ground_truth": 0}, {"key": "32138822", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7248702787844123, "ground_truth": 0}, {"key": "32138822", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026701035219, "ground_truth": 0}, {"key": "32138822", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673215424235, "ground_truth": 0}, {"key": "31070114", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0803574704785474, "ground_truth": 0}, {"key": "31070114", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16026603845173068, "ground_truth": 0}, {"key": "31070114", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.05834583808788193, "ground_truth": 0}, {"key": "31070114", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.06853749192678402, "ground_truth": 0}, {"key": "31070114", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106119714204793, "ground_truth": 0}, {"key": "39652762", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.535098416417928, "ground_truth": 0}, {"key": "39652762", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7606506568492408, "ground_truth": 0}, {"key": "39652762", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7577943602090091, "ground_truth": 0}, {"key": "39652762", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093644438225, "ground_truth": 0}, {"key": "39652762", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819604799952, "ground_truth": 0}, {"key": "33258866", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28298811804585766, "ground_truth": 0}, {"key": "33258866", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3451052790398889, "ground_truth": 0}, {"key": "33258866", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.255343678253437, "ground_truth": 0}, {"key": "33258866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982563129949593, "ground_truth": 0}, {"key": "33258866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37022539060048293, "ground_truth": 0}, {"key": "36962388", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2323101475694698, "ground_truth": 0}, {"key": "36962388", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13028542448323413, "ground_truth": 0}, {"key": "36962388", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36296919205261874, "ground_truth": 0}, {"key": "36962388", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753245873257977, "ground_truth": 0}, {"key": "36962388", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074558564860304, "ground_truth": 0}, {"key": "32282272", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33807712162887227, "ground_truth": 0}, {"key": "32282272", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17553808567246149, "ground_truth": 0}, {"key": "32282272", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561504933919172, "ground_truth": 0}, {"key": "32282272", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666733067537, "ground_truth": 0}, {"key": "32282272", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081655930332, "ground_truth": 0}, {"key": "36093072", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.819893311998664, "ground_truth": 0}, {"key": "36093072", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3486451462975124, "ground_truth": 0}, {"key": "36093072", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6636689451590865, "ground_truth": 0}, {"key": "36093072", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.700894791974097, "ground_truth": 0}, {"key": "36093072", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185406060185, "ground_truth": 0}, {"key": "38879972", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6279512277655895, "ground_truth": 0}, {"key": "38879972", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5486734937472838, "ground_truth": 0}, {"key": "38879972", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6442250989966362, "ground_truth": 0}, {"key": "38879972", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047082253442, "ground_truth": 0}, {"key": "38879972", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468729212023, "ground_truth": 0}, {"key": "32106473", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8175744732510303, "ground_truth": 0}, {"key": "32106473", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6187804330383548, "ground_truth": 0}, {"key": "32106473", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8529354852015236, "ground_truth": 0}, {"key": "32106473", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424516069719, "ground_truth": 0}, {"key": "32106473", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441183521603, "ground_truth": 0}, {"key": "40415815", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28457601024606805, "ground_truth": 0}, {"key": "40415815", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20561503344530407, "ground_truth": 0}, {"key": "40415815", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4225046416893376, "ground_truth": 0}, {"key": "40415815", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306417309654334, "ground_truth": 0}, {"key": "40415815", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34334171352255904, "ground_truth": 0}, {"key": "34581918", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21866937504870906, "ground_truth": 0}, {"key": "34581918", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2782567953686786, "ground_truth": 0}, {"key": "34581918", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3702254038991092, "ground_truth": 0}, {"key": "34581918", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.44360042715272485, "ground_truth": 0}, {"key": "34581918", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756752548782667, "ground_truth": 0}, {"key": "33004157", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7233094602561775, "ground_truth": 0}, {"key": "33004157", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7476159582926587, "ground_truth": 0}, {"key": "33004157", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8289388025897747, "ground_truth": 0}, {"key": "33004157", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159592134448, "ground_truth": 0}, {"key": "33004157", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085957868937, "ground_truth": 0}, {"key": "30334943", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7401743702020982, "ground_truth": 0}, {"key": "30334943", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7248702854155122, "ground_truth": 0}, {"key": "30334943", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.661922901340144, "ground_truth": 0}, {"key": "30334943", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615842986348, "ground_truth": 0}, {"key": "30334943", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047090540878, "ground_truth": 0}, {"key": "33280503", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1623800299778733, "ground_truth": 0}, {"key": "33280503", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11596071273406323, "ground_truth": 0}, {"key": "33280503", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.061875986881449435, "ground_truth": 0}, {"key": "33280503", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16344544430315622, "ground_truth": 0}, {"key": "33280503", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678364543191212, "ground_truth": 0}, {"key": "25726782", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5888891282498804, "ground_truth": 0}, {"key": "25726782", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5602526318886324, "ground_truth": 0}, {"key": "25726782", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.74908718386709, "ground_truth": 0}, {"key": "25726782", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352689791535, "ground_truth": 0}, {"key": "25726782", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876300016805509, "ground_truth": 0}, {"key": "35479854", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4843800887258009, "ground_truth": 0}, {"key": "35479854", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38676345645692833, "ground_truth": 0}, {"key": "35479854", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5370413630735632, "ground_truth": 0}, {"key": "35479854", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633866806129, "ground_truth": 0}, {"key": "35479854", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004179344629, "ground_truth": 0}, {"key": "32716226", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6076631634538383, "ground_truth": 0}, {"key": "32716226", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476755208944, "ground_truth": 0}, {"key": "32716226", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24220562078850386, "ground_truth": 0}, {"key": "32716226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631838221125, "ground_truth": 0}, {"key": "32716226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004138884074, "ground_truth": 0}, {"key": "37047554", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2523840392888007, "ground_truth": 0}, {"key": "37047554", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.228156498040596, "ground_truth": 0}, {"key": "37047554", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2107662880347095, "ground_truth": 0}, {"key": "37047554", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2240554589414661, "ground_truth": 0}, {"key": "37047554", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541661204967703, "ground_truth": 0}, {"key": "36565290", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9099070061525117, "ground_truth": 0}, {"key": "36565290", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8386797517647244, "ground_truth": 0}, {"key": "36565290", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8558511454150846, "ground_truth": 0}, {"key": "36565290", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274149283583, "ground_truth": 0}, {"key": "36565290", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.805632197785244, "ground_truth": 0}, {"key": "27758640", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6636689261506276, "ground_truth": 0}, {"key": "27758640", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5409238584991053, "ground_truth": 0}, {"key": "27758640", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7154239816126922, "ground_truth": 0}, {"key": "27758640", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303200053974, "ground_truth": 0}, {"key": "27758640", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762759503745, "ground_truth": 0}, {"key": "28897118", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4359015273125485, "ground_truth": 0}, {"key": "28897118", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22678362720499637, "ground_truth": 0}, {"key": "28897118", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5117166278639563, "ground_truth": 0}, {"key": "28897118", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633105805692903, "ground_truth": 0}, {"key": "28897118", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046372275247, "ground_truth": 0}, {"key": "38452661", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8749346170196074, "ground_truth": 0}, {"key": "38452661", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8449215269540689, "ground_truth": 0}, {"key": "38452661", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.720171493479765, "ground_truth": 0}, {"key": "38452661", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254010347464, "ground_truth": 0}, {"key": "38452661", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282987147979, "ground_truth": 0}, {"key": "38033492", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4726834847011023, "ground_truth": 0}, {"key": "38033492", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3451052862428962, "ground_truth": 0}, {"key": "38033492", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2845760177868068, "ground_truth": 0}, {"key": "38033492", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926399765087, "ground_truth": 0}, {"key": "38033492", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711703100131, "ground_truth": 0}, {"key": "35949555", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7341195098163342, "ground_truth": 0}, {"key": "35949555", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6757646262284189, "ground_truth": 0}, {"key": "35949555", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.740174352310832, "ground_truth": 0}, {"key": "35949555", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916037435005, "ground_truth": 0}, {"key": "35949555", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.753466650428933, "ground_truth": 0}, {"key": "15263826", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16667539160243905, "ground_truth": 0}, {"key": "15263826", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2227001501791507, "ground_truth": 0}, {"key": "15263826", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20181321956436463, "ground_truth": 0}, {"key": "15263826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954780542264, "ground_truth": 0}, {"key": "15263826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.324235390595095, "ground_truth": 0}, {"key": "37313866", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8080672223536248, "ground_truth": 0}, {"key": "37313866", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6039318181210911, "ground_truth": 0}, {"key": "37313866", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397061682681, "ground_truth": 0}, {"key": "37313866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758258768987, "ground_truth": 0}, {"key": "37313866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.63883530394162, "ground_truth": 0}, {"key": "13911157", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7892337006962092, "ground_truth": 0}, {"key": "13911157", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.658417519831853, "ground_truth": 0}, {"key": "13911157", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8799743704948169, "ground_truth": 0}, {"key": "13911157", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354752422749, "ground_truth": 0}, {"key": "13911157", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281493704615, "ground_truth": 0}, {"key": "39594894", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5774953932912837, "ground_truth": 0}, {"key": "39594894", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5175708698757603, "ground_truth": 0}, {"key": "39594894", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45713671086725494, "ground_truth": 0}, {"key": "39594894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331473848922, "ground_truth": 0}, {"key": "39594894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878266783175, "ground_truth": 0}, {"key": "34096170", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3106943956093233, "ground_truth": 0}, {"key": "34096170", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4941409044055035, "ground_truth": 0}, {"key": "34096170", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3738758028793613, "ground_truth": 0}, {"key": "34096170", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111972738177664, "ground_truth": 0}, {"key": "34096170", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082130208786824, "ground_truth": 0}, {"key": "37891952", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9299510381728123, "ground_truth": 0}, {"key": "37891952", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8848377689762301, "ground_truth": 0}, {"key": "37891952", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9039745128133068, "ground_truth": 0}, {"key": "37891952", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9394706126898346, "ground_truth": 0}, {"key": "37891952", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218417129944, "ground_truth": 0}, {"key": "40186158", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34158251865037054, "ground_truth": 0}, {"key": "40186158", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20181322350727302, "ground_truth": 0}, {"key": "40186158", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20307461422993034, "ground_truth": 0}, {"key": "40186158", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469142373512945, "ground_truth": 0}, {"key": "40186158", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781087363598524, "ground_truth": 0}, {"key": "37049719", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6242935198943788, "ground_truth": 0}, {"key": "37049719", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331419910572, "ground_truth": 0}, {"key": "37049719", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6095241656135231, "ground_truth": 0}, {"key": "37049719", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013850544915, "ground_truth": 0}, {"key": "37049719", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802412660226, "ground_truth": 0}, {"key": "34610504", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27048022484340384, "ground_truth": 0}, {"key": "34610504", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24653335229435291, "ground_truth": 0}, {"key": "34610504", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24508503930014655, "ground_truth": 0}, {"key": "34610504", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416867193868, "ground_truth": 0}, {"key": "34610504", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310567827719, "ground_truth": 0}, {"key": "37595429", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5964331266774368, "ground_truth": 0}, {"key": "37595429", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6531269287558715, "ground_truth": 0}, {"key": "37595429", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4339814543185646, "ground_truth": 0}, {"key": "37595429", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869690207950017, "ground_truth": 0}, {"key": "37595429", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882833985546866, "ground_truth": 0}, {"key": "29772670", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35042141876769684, "ground_truth": 0}, {"key": "29772670", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44167301102992046, "ground_truth": 0}, {"key": "29772670", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.594551254854211, "ground_truth": 0}, {"key": "29772670", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748966465152, "ground_truth": 0}, {"key": "29772670", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681761549928, "ground_truth": 0}, {"key": "36369872", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.767689850900475, "ground_truth": 0}, {"key": "36369872", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800951583925, "ground_truth": 0}, {"key": "36369872", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5869964449016122, "ground_truth": 0}, {"key": "36369872", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483777177807, "ground_truth": 0}, {"key": "36369872", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300675701005, "ground_truth": 0}, {"key": "34527433", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010666049729532, "ground_truth": 0}, {"key": "34527433", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13846179232901534, "ground_truth": 0}, {"key": "34527433", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1581743642039187, "ground_truth": 0}, {"key": "34527433", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077459938921178, "ground_truth": 0}, {"key": "34527433", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08694165853722546, "ground_truth": 0}, {"key": "31111734", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8164063684460531, "ground_truth": 0}, {"key": "31111734", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5389832349592922, "ground_truth": 0}, {"key": "31111734", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7461390081821542, "ground_truth": 0}, {"key": "31111734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136955480769, "ground_truth": 0}, {"key": "31111734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789200142597, "ground_truth": 0}, {"key": "40303872", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3904758267581698, "ground_truth": 0}, {"key": "40303872", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49218814744298045, "ground_truth": 0}, {"key": "40303872", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30902373406247435, "ground_truth": 0}, {"key": "40303872", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850226825716, "ground_truth": 0}, {"key": "40303872", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737455067993, "ground_truth": 0}, {"key": "33653553", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17441029115401802, "ground_truth": 0}, {"key": "33653553", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42632160266150987, "ground_truth": 0}, {"key": "33653553", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21733751704634727, "ground_truth": 0}, {"key": "33653553", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231012140842608, "ground_truth": 0}, {"key": "33653553", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072402756569845, "ground_truth": 0}, {"key": "34404510", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5467381600557115, "ground_truth": 0}, {"key": "34404510", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37022538206349914, "ground_truth": 0}, {"key": "34404510", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5214711538703223, "ground_truth": 0}, {"key": "34404510", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.525368849440467, "ground_truth": 0}, {"key": "34404510", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122322009596418, "ground_truth": 0}, {"key": "35568692", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13386748260159104, "ground_truth": 0}, {"key": "35568692", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10970577926820815, "ground_truth": 0}, {"key": "35568692", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12506538848223345, "ground_truth": 0}, {"key": "35568692", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07921032782499036, "ground_truth": 0}, {"key": "35568692", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09670578653833467, "ground_truth": 0}, {"key": "39151664", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11357959130257046, "ground_truth": 0}, {"key": "39151664", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.368405695110393, "ground_truth": 0}, {"key": "39151664", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27048023292319834, "ground_truth": 0}, {"key": "39151664", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197424652365, "ground_truth": 0}, {"key": "39151664", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687307939985573, "ground_truth": 0}, {"key": "37493670", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9019206839060283, "ground_truth": 0}, {"key": "37493670", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9702399059489109, "ground_truth": 0}, {"key": "37493670", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9073122312295026, "ground_truth": 0}, {"key": "37493670", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070032802892, "ground_truth": 0}, {"key": "37493670", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.948154535948668, "ground_truth": 0}, {"key": "21935983", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19314739395169309, "ground_truth": 0}, {"key": "21935983", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24220561001481294, "ground_truth": 0}, {"key": "21935983", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27048023599973603, "ground_truth": 0}, {"key": "21935983", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25534366114324936, "ground_truth": 0}, {"key": "21935983", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1744102878268029, "ground_truth": 0}, {"key": "38174214", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49804688163165917, "ground_truth": 0}, {"key": "38174214", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6584175002158371, "ground_truth": 0}, {"key": "38174214", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5506073600457964, "ground_truth": 0}, {"key": "38174214", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832225800939, "ground_truth": 0}, {"key": "38174214", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263215827517884, "ground_truth": 0}, {"key": "40319923", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995617937767, "ground_truth": 0}, {"key": "40319923", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7577943825347367, "ground_truth": 0}, {"key": "40319923", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7106282852662935, "ground_truth": 0}, {"key": "40319923", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786082669956, "ground_truth": 0}, {"key": "40319923", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804621369469, "ground_truth": 0}, {"key": "36478264", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48438007957857626, "ground_truth": 0}, {"key": "36478264", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5544704654579904, "ground_truth": 0}, {"key": "36478264", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7592254107309517, "ground_truth": 0}, {"key": "36478264", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397047512194, "ground_truth": 0}, {"key": "36478264", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420095586436205, "ground_truth": 0}, {"key": "11935769", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5583269965227573, "ground_truth": 0}, {"key": "11935769", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "11935769", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.494140893228839, "ground_truth": 0}, {"key": "11935769", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "11935769", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291088135251, "ground_truth": 0}, {"key": "33373410", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1120159446351803, "ground_truth": 0}, {"key": "33373410", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12852514742105112, "ground_truth": 0}, {"key": "33373410", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18476750447867973, "ground_truth": 0}, {"key": "33373410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10894503651213144, "ground_truth": 0}, {"key": "33373410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895757216737, "ground_truth": 0}, {"key": "11130680", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.492188154763413, "ground_truth": 0}, {"key": "11130680", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38306418581748947, "ground_truth": 0}, {"key": "11130680", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09807933140325445, "ground_truth": 0}, {"key": "11130680", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16344544722371665, "ground_truth": 0}, {"key": "11130680", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974732320209564, "ground_truth": 0}, {"key": "34868650", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27202455386696306, "ground_truth": 0}, {"key": "34868650", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40733341206646523, "ground_truth": 0}, {"key": "34868650", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186969144605033, "ground_truth": 0}, {"key": "34868650", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633105317806494, "ground_truth": 0}, {"key": "34868650", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.531209396555767, "ground_truth": 0}, {"key": "33960561", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5983121770127054, "ground_truth": 0}, {"key": "33960561", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185436416906, "ground_truth": 0}, {"key": "33960561", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.689305622198997, "ground_truth": 0}, {"key": "33960561", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804220909924, "ground_truth": 0}, {"key": "33960561", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207920668603, "ground_truth": 0}, {"key": "22504858", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4339814630344097, "ground_truth": 0}, {"key": "22504858", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6688802828242283, "ground_truth": 0}, {"key": "22504858", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5136684562104984, "ground_truth": 0}, {"key": "22504858", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708643177086, "ground_truth": 0}, {"key": "22504858", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035676694375, "ground_truth": 0}, {"key": "32283530", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6791786891537172, "ground_truth": 0}, {"key": "32283530", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4921881333488405, "ground_truth": 0}, {"key": "32283530", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6297745833542586, "ground_truth": 0}, {"key": "32283530", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784083780864, "ground_truth": 0}, {"key": "32283530", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014067287225, "ground_truth": 0}, {"key": "38377099", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.697608938871637, "ground_truth": 0}, {"key": "38377099", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3433417438084416, "ground_truth": 0}, {"key": "38377099", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5331544124689722, "ground_truth": 0}, {"key": "38377099", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056079451972, "ground_truth": 0}, {"key": "38377099", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794003926711301, "ground_truth": 0}, {"key": "36105123", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7201715000269227, "ground_truth": 0}, {"key": "36105123", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8164063821442928, "ground_truth": 0}, {"key": "36105123", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8418256459551521, "ground_truth": 0}, {"key": "36105123", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441206873776, "ground_truth": 0}, {"key": "36105123", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802491653046, "ground_truth": 0}, {"key": "33527826", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6261241656183969, "ground_truth": 0}, {"key": "33527826", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31912140309518816, "ground_truth": 0}, {"key": "33527826", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5736784225166576, "ground_truth": 0}, {"key": "33527826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684527829235, "ground_truth": 0}, {"key": "33527826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199209176302, "ground_truth": 0}, {"key": "32349891", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5428632882344431, "ground_truth": 0}, {"key": "32349891", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7592253722769947, "ground_truth": 0}, {"key": "32349891", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7248702853236629, "ground_truth": 0}, {"key": "32349891", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723885433246, "ground_truth": 0}, {"key": "32349891", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102615970078, "ground_truth": 0}, {"key": "34281974", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4571367171191478, "ground_truth": 0}, {"key": "34281974", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5832033691740945, "ground_truth": 0}, {"key": "34281974", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.638835257092457, "ground_truth": 0}, {"key": "34281974", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093665844203, "ground_truth": 0}, {"key": "34281974", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907611800029474, "ground_truth": 0}, {"key": "29387866", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11436853765994073, "ground_truth": 0}, {"key": "29387866", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20689404388530425, "ground_truth": 0}, {"key": "29387866", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18359363686866959, "ground_truth": 0}, {"key": "29387866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386747826697046, "ground_truth": 0}, {"key": "29387866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713684922250906, "ground_truth": 0}, {"key": "35731925", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9507778874429188, "ground_truth": 0}, {"key": "35731925", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9671630417869984, "ground_truth": 0}, {"key": "35731925", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9678992935907984, "ground_truth": 0}, {"key": "35731925", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414733153809, "ground_truth": 0}, {"key": "35731925", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9621075712818408, "ground_truth": 0}, {"key": "38829733", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6057990486391396, "ground_truth": 0}, {"key": "38829733", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984304513453, "ground_truth": 0}, {"key": "38829733", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47657965730354296, "ground_truth": 0}, {"key": "38829733", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165215825849, "ground_truth": 0}, {"key": "38829733", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793784012608011, "ground_truth": 0}, {"key": "24624736", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.785308575332702, "ground_truth": 0}, {"key": "24624736", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7279754596421105, "ground_truth": 0}, {"key": "24624736", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45519859433985843, "ground_truth": 0}, {"key": "24624736", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.540923832184093, "ground_truth": 0}, {"key": "24624736", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953965615546, "ground_truth": 0}, {"key": "36928562", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621765030426947, "ground_truth": 0}, {"key": "36928562", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7122321814261737, "ground_truth": 0}, {"key": "36928562", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.779992878678256, "ground_truth": 0}, {"key": "36928562", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619288947771, "ground_truth": 0}, {"key": "36928562", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308035679804, "ground_truth": 0}, {"key": "34941119", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5983121740699162, "ground_truth": 0}, {"key": "34941119", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16667540903319228, "ground_truth": 0}, {"key": "34941119", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093403638749, "ground_truth": 0}, {"key": "34941119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38491212782307405, "ground_truth": 0}, {"key": "34941119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3398276361489076, "ground_truth": 0}, {"key": "30206231", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2043418992564155, "ground_truth": 0}, {"key": "30206231", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3867634561913414, "ground_truth": 0}, {"key": "30206231", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.049958520957547776, "ground_truth": 0}, {"key": "30206231", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296919927319554, "ground_truth": 0}, {"key": "30206231", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2200070958951881, "ground_truth": 0}, {"key": "35584972", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451470626162, "ground_truth": 0}, {"key": "35584972", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4882833818796607, "ground_truth": 0}, {"key": "35584972", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4111108881714108, "ground_truth": 0}, {"key": "35584972", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.329391701734363, "ground_truth": 0}, {"key": "35584972", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441200046011984, "ground_truth": 0}, {"key": "39277709", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7839884777310875, "ground_truth": 0}, {"key": "39277709", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5525397110275989, "ground_truth": 0}, {"key": "39277709", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5869964228088188, "ground_truth": 0}, {"key": "39277709", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526483403854, "ground_truth": 0}, {"key": "39277709", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947429592498, "ground_truth": 0}, {"key": "36123657", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8104789245753209, "ground_truth": 0}, {"key": "36123657", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8459424489770841, "ground_truth": 0}, {"key": "36123657", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6548947335180224, "ground_truth": 0}, {"key": "36123657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210596713446, "ground_truth": 0}, {"key": "36123657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759702116136, "ground_truth": 0}, {"key": "33363938", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.507811864314561, "ground_truth": 0}, {"key": "33363938", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.0821066242098929, "ground_truth": 0}, {"key": "33363938", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397055869358, "ground_truth": 0}, {"key": "33363938", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354871071417, "ground_truth": 0}, {"key": "33363938", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311746510154, "ground_truth": 0}, {"key": "37349129", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331544277465233, "ground_truth": 0}, {"key": "37349129", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38121953826193467, "ground_truth": 0}, {"key": "37349129", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6206216010822407, "ground_truth": 0}, {"key": "37349129", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984766518907, "ground_truth": 0}, {"key": "37349129", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531478515278, "ground_truth": 0}, {"key": "37160199", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12336560826658055, "ground_truth": 0}, {"key": "37160199", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20307462111599162, "ground_truth": 0}, {"key": "37160199", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11047114592143362, "ground_truth": 0}, {"key": "37160199", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203284678572123, "ground_truth": 0}, {"key": "37160199", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08035747227258566, "ground_truth": 0}, {"key": "35891053", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.416796636873208, "ground_truth": 0}, {"key": "35891053", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7416740033743208, "ground_truth": 0}, {"key": "35891053", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6169358389869968, "ground_truth": 0}, {"key": "35891053", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819670817693, "ground_truth": 0}, {"key": "35891053", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315943041337498, "ground_truth": 0}, {"key": "40694542", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5832033894735302, "ground_truth": 0}, {"key": "40694542", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4824290940230022, "ground_truth": 0}, {"key": "40694542", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5563995870196184, "ground_truth": 0}, {"key": "40694542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878872332867, "ground_truth": 0}, {"key": "40694542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333776996294, "ground_truth": 0}, {"key": "24645770", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19806416347153727, "ground_truth": 0}, {"key": "24645770", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2798284882223639, "ground_truth": 0}, {"key": "24645770", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3276683093075325, "ground_truth": 0}, {"key": "24645770", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367217526567, "ground_truth": 0}, {"key": "24645770", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33807712204652196, "ground_truth": 0}, {"key": "37974587", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7826624782440308, "ground_truth": 0}, {"key": "37974587", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8840392792221241, "ground_truth": 0}, {"key": "37974587", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8289388022317367, "ground_truth": 0}, {"key": "37974587", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737854208033, "ground_truth": 0}, {"key": "37974587", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210684943271, "ground_truth": 0}, {"key": "40354149", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.831143044922968, "ground_truth": 0}, {"key": "40354149", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48828337895274815, "ground_truth": 0}, {"key": "40354149", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7310585888090158, "ground_truth": 0}, {"key": "40354149", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365722224353, "ground_truth": 0}, {"key": "40354149", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321749444281, "ground_truth": 0}, {"key": "35519470", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20307463775414866, "ground_truth": 0}, {"key": "35519470", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5583269931555541, "ground_truth": 0}, {"key": "35519470", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2200070963585996, "ground_truth": 0}, {"key": "35519470", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559311311602215, "ground_truth": 0}, {"key": "35519470", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632159721130086, "ground_truth": 0}, {"key": "36185624", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6187804276855065, "ground_truth": 0}, {"key": "36185624", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6909762909678168, "ground_truth": 0}, {"key": "36185624", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7248702538689954, "ground_truth": 0}, {"key": "36185624", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122185618723, "ground_truth": 0}, {"key": "36185624", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884586884217, "ground_truth": 0}, {"key": "39306113", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23651624991067532, "ground_truth": 0}, {"key": "39306113", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4359015219637301, "ground_truth": 0}, {"key": "39306113", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44167298567126373, "ground_truth": 0}, {"key": "39306113", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647396470792, "ground_truth": 0}, {"key": "39306113", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982759910890326, "ground_truth": 0}, {"key": "19347718", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6959583162125131, "ground_truth": 0}, {"key": "19347718", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40544873290529476, "ground_truth": 0}, {"key": "19347718", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3090237333868077, "ground_truth": 0}, {"key": "19347718", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823340343172533, "ground_truth": 0}, {"key": "19347718", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333998920444, "ground_truth": 0}, {"key": "21870064", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2643583545459421, "ground_truth": 0}, {"key": "21870064", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22000710541016213, "ground_truth": 0}, {"key": "21870064", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2643583581663624, "ground_truth": 0}, {"key": "21870064", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2267836451624704, "ground_truth": 0}, {"key": "21870064", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825679678554194, "ground_truth": 0}, {"key": "37675776", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42059959013556036, "ground_truth": 0}, {"key": "37675776", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.637030774320742, "ground_truth": 0}, {"key": "37675776", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7505527669397359, "ground_truth": 0}, {"key": "37675776", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548752660896, "ground_truth": 0}, {"key": "37675776", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159496515838, "ground_truth": 0}, {"key": "38107017", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37022541223606265, "ground_truth": 0}, {"key": "38107017", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5370413962307157, "ground_truth": 0}, {"key": "38107017", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44939264030873366, "ground_truth": 0}, {"key": "38107017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270015919300223, "ground_truth": 0}, {"key": "38107017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009596963058, "ground_truth": 0}, {"key": "40046472", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.482429120256865, "ground_truth": 0}, {"key": "40046472", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7732163650498878, "ground_truth": 0}, {"key": "40046472", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5234203834627118, "ground_truth": 0}, {"key": "40046472", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.816406393746954, "ground_truth": 0}, {"key": "40046472", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.422504639872854, "ground_truth": 0}, {"key": "32157820", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17217186138464005, "ground_truth": 0}, {"key": "32157820", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3793783581892038, "ground_truth": 0}, {"key": "32157820", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4263215805931127, "ground_truth": 0}, {"key": "32157820", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111974692553375, "ground_truth": 0}, {"key": "32157820", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421497769463273, "ground_truth": 0}, {"key": "41004037", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21866937580878992, "ground_truth": 0}, {"key": "41004037", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38306417070225446, "ground_truth": 0}, {"key": "41004037", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19193276716905613, "ground_truth": 0}, {"key": "41004037", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2018132332089231, "ground_truth": 0}, {"key": "41004037", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300356685147166, "ground_truth": 0}, {"key": "21387993", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23792989204773754, "ground_truth": 0}, {"key": "21387993", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7853085708354659, "ground_truth": 0}, {"key": "21387993", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39981164436084815, "ground_truth": 0}, {"key": "21387993", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.521471160812984, "ground_truth": 0}, {"key": "21387993", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746355732585, "ground_truth": 0}, {"key": "34665539", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601152778500746, "ground_truth": 0}, {"key": "34665539", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1441488757511185, "ground_truth": 0}, {"key": "34665539", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34665539", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570645802882113, "ground_truth": 0}, {"key": "34665539", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629692293740575, "ground_truth": 0}, {"key": "37872111", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11124119955476906, "ground_truth": 0}, {"key": "37872111", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16238002918558278, "ground_truth": 0}, {"key": "37872111", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231012708267063, "ground_truth": 0}, {"key": "37872111", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.0736962760527343, "ground_truth": 0}, {"key": "37872111", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10594827890796496, "ground_truth": 0}, {"key": "36629542", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4980468872834244, "ground_truth": 0}, {"key": "36629542", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41679665969263324, "ground_truth": 0}, {"key": "36629542", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49804687780273393, "ground_truth": 0}, {"key": "36629542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061776381305, "ground_truth": 0}, {"key": "36629542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4649015930060426, "ground_truth": 0}, {"key": "36487527", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358312593649, "ground_truth": 0}, {"key": "36487527", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6619228853883901, "ground_truth": 0}, {"key": "36487527", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6842640367696915, "ground_truth": 0}, {"key": "36487527", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300752780436, "ground_truth": 0}, {"key": "36487527", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445475655442, "ground_truth": 0}, {"key": "37344756", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5755879998336073, "ground_truth": 0}, {"key": "37344756", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8210441008788392, "ground_truth": 0}, {"key": "37344756", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8344068911525143, "ground_truth": 0}, {"key": "37344756", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832103443642, "ground_truth": 0}, {"key": "37344756", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619264529054, "ground_truth": 0}, {"key": "38707722", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.199307991541826, "ground_truth": 0}, {"key": "38707722", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27357439817107443, "ground_truth": 0}, {"key": "38707722", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12506538532000935, "ground_truth": 0}, {"key": "38707722", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306416246563746, "ground_truth": 0}, {"key": "38707722", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435832991315156, "ground_truth": 0}, {"key": "37093419", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.258325980783395, "ground_truth": 0}, {"key": "37093419", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1460872480691406, "ground_truth": 0}, {"key": "37093419", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09670579448809134, "ground_truth": 0}, {"key": "37093419", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653333279867085, "ground_truth": 0}, {"key": "37093419", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594719206537275, "ground_truth": 0}, {"key": "35547391", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4941408863557501, "ground_truth": 0}, {"key": "35547391", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061693026662, "ground_truth": 0}, {"key": "35547391", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32594951222200585, "ground_truth": 0}, {"key": "35547391", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.329391711718941, "ground_truth": 0}, {"key": "35547391", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676346237579096, "ground_truth": 0}, {"key": "37173168", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44746027610899153, "ground_truth": 0}, {"key": "37173168", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4205995814703253, "ground_truth": 0}, {"key": "37173168", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5983121757076059, "ground_truth": 0}, {"key": "37173168", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352914193735, "ground_truth": 0}, {"key": "37173168", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941409093013902, "ground_truth": 0}, {"key": "30725298", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292633850811375, "ground_truth": 0}, {"key": "30725298", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4902356266906749, "ground_truth": 0}, {"key": "30725298", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6352224717207008, "ground_truth": 0}, {"key": "30725298", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666603459926, "ground_truth": 0}, {"key": "30725298", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992543956939276, "ground_truth": 0}, {"key": "33830573", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7690802409708679, "ground_truth": 0}, {"key": "33830573", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6388352693010828, "ground_truth": 0}, {"key": "33830573", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6926420012079954, "ground_truth": 0}, {"key": "33830573", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804392933001, "ground_truth": 0}, {"key": "33830573", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563375367301, "ground_truth": 0}, {"key": "33415474", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08449276142903477, "ground_truth": 0}, {"key": "33415474", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10158944124086133, "ground_truth": 0}, {"key": "33415474", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12336562142099455, "ground_truth": 0}, {"key": "33415474", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1135795993230755, "ground_truth": 0}, {"key": "33415474", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222319431647, "ground_truth": 0}, {"key": "37383994", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6992544072193365, "ground_truth": 0}, {"key": "37383994", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6959583273612149, "ground_truth": 0}, {"key": "37383994", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7606506669349208, "ground_truth": 0}, {"key": "37383994", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680180920475, "ground_truth": 0}, {"key": "37383994", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228393661537, "ground_truth": 0}, {"key": "38576819", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3363310599264807, "ground_truth": 0}, {"key": "38576819", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3942009716492214, "ground_truth": 0}, {"key": "38576819", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27825680131614267, "ground_truth": 0}, {"key": "38576819", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473492990185, "ground_truth": 0}, {"key": "38576819", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641653900256, "ground_truth": 0}, {"key": "34500226", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292634000219292, "ground_truth": 0}, {"key": "34500226", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185330314367, "ground_truth": 0}, {"key": "34500226", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093908827865, "ground_truth": 0}, {"key": "34500226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.63159430615443, "ground_truth": 0}, {"key": "34500226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764990390135, "ground_truth": 0}, {"key": "39856394", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7534666417113581, "ground_truth": 0}, {"key": "39856394", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49609380089899713, "ground_truth": 0}, {"key": "39856394", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7813306173266845, "ground_truth": 0}, {"key": "39856394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690844325126, "ground_truth": 0}, {"key": "39856394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056027361537, "ground_truth": 0}, {"key": "35499522", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.067546691874639, "ground_truth": 0}, {"key": "35499522", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13939637022213125, "ground_truth": 0}, {"key": "35499522", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12002563274955658, "ground_truth": 0}, {"key": "35499522", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.05877655986756067, "ground_truth": 0}, {"key": "35499522", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.04672496825750731, "ground_truth": 0}, {"key": "30157766", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7662936474380501, "ground_truth": 0}, {"key": "30157766", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7138307434134987, "ground_truth": 0}, {"key": "30157766", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8354835351371618, "ground_truth": 0}, {"key": "30157766", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.705785025759124, "ground_truth": 0}, {"key": "30157766", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163485602186, "ground_truth": 0}, {"key": "40472346", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31912138477383367, "ground_truth": 0}, {"key": "40472346", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49804688179521006, "ground_truth": 0}, {"key": "40472346", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7041601221183453, "ground_truth": 0}, {"key": "40472346", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.607663183496742, "ground_truth": 0}, {"key": "40472346", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365595016555, "ground_truth": 0}, {"key": "35305635", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6150878409392884, "ground_truth": 0}, {"key": "35305635", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7620701113480731, "ground_truth": 0}, {"key": "35305635", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8568123025760064, "ground_truth": 0}, {"key": "35305635", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787003795215, "ground_truth": 0}, {"key": "35305635", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767874145257, "ground_truth": 0}, {"key": "32495926", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318162341718, "ground_truth": 0}, {"key": "32495926", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43206337325501964, "ground_truth": 0}, {"key": "32495926", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7041601359581321, "ground_truth": 0}, {"key": "32495926", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078119037235089, "ground_truth": 0}, {"key": "32495926", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118785915911, "ground_truth": 0}, {"key": "37353801", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117166220940648, "ground_truth": 0}, {"key": "37353801", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29910518080245235, "ground_truth": 0}, {"key": "37353801", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3433417262383406, "ground_truth": 0}, {"key": "37353801", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758299025897, "ground_truth": 0}, {"key": "37353801", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457600256884147, "ground_truth": 0}, {"key": "30159904", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6020616089954146, "ground_truth": 0}, {"key": "30159904", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3702253902149796, "ground_truth": 0}, {"key": "30159904", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5640984676693473, "ground_truth": 0}, {"key": "30159904", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321925711532, "ground_truth": 0}, {"key": "30159904", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.627951208676671, "ground_truth": 0}, {"key": "33698679", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3363310570835154, "ground_truth": 0}, {"key": "33698679", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5832033558556572, "ground_truth": 0}, {"key": "33698679", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1623800467119786, "ground_truth": 0}, {"key": "33698679", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41489885529630743, "ground_truth": 0}, {"key": "33698679", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784177658235, "ground_truth": 0}, {"key": "40530172", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6584174851575353, "ground_truth": 0}, {"key": "40530172", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.521471161448125, "ground_truth": 0}, {"key": "40530172", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7520125632309348, "ground_truth": 0}, {"key": "40530172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.654894727934045, "ground_truth": 0}, {"key": "40530172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297745986582902, "ground_truth": 0}, {"key": "40652941", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8019358130219706, "ground_truth": 0}, {"key": "40652941", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6187804000077025, "ground_truth": 0}, {"key": "40652941", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7634837833384734, "ground_truth": 0}, {"key": "40652941", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690605562335, "ground_truth": 0}, {"key": "40652941", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526117874788, "ground_truth": 0}, {"key": "40122246", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2465333423709832, "ground_truth": 0}, {"key": "40122246", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15921741819556062, "ground_truth": 0}, {"key": "40122246", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19314737794763864, "ground_truth": 0}, {"key": "40122246", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11920293342545199, "ground_truth": 0}, {"key": "40122246", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405544632646096, "ground_truth": 0}, {"key": "40032656", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8278281458033917, "ground_truth": 0}, {"key": "40032656", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6132365518280984, "ground_truth": 0}, {"key": "40032656", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6566582742790371, "ground_truth": 0}, {"key": "40032656", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936529562666, "ground_truth": 0}, {"key": "40032656", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849399356098, "ground_truth": 0}, {"key": "38913680", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41679661224468134, "ground_truth": 0}, {"key": "38913680", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23792989397724273, "ground_truth": 0}, {"key": "38913680", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487128360947, "ground_truth": 0}, {"key": "38913680", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268347863975363, "ground_truth": 0}, {"key": "38913680", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035579715264, "ground_truth": 0}, {"key": "17608039", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19072401295750713, "ground_truth": 0}, {"key": "17608039", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10594828742834526, "ground_truth": 0}, {"key": "17608039", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1470645220679614, "ground_truth": 0}, {"key": "17608039", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206878991691339, "ground_truth": 0}, {"key": "17608039", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314737448165434, "ground_truth": 0}, {"key": "40434901", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7563575506196208, "ground_truth": 0}, {"key": "40434901", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7563575770267659, "ground_truth": 0}, {"key": "40434901", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6406358414006218, "ground_truth": 0}, {"key": "40434901", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441107784582, "ground_truth": 0}, {"key": "40434901", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094757276921, "ground_truth": 0}, {"key": "37680058", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2798285005034601, "ground_truth": 0}, {"key": "37680058", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16885695966233255, "ground_truth": 0}, {"key": "37680058", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3415824870568398, "ground_truth": 0}, {"key": "37680058", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181320499320582, "ground_truth": 0}, {"key": "37680058", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952109084496802, "ground_truth": 0}, {"key": "37291821", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995752110427, "ground_truth": 0}, {"key": "37291821", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3007455839375115, "ground_truth": 0}, {"key": "37291821", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26588048551763466, "ground_truth": 0}, {"key": "37291821", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023560159033136, "ground_truth": 0}, {"key": "37291821", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643761754499, "ground_truth": 0}, {"key": "41002743", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29421496254708096, "ground_truth": 0}, {"key": "41002743", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938434814182, "ground_truth": 0}, {"key": "41002743", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3575675294722542, "ground_truth": 0}, {"key": "41002743", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771309045746, "ground_truth": 0}, {"key": "41002743", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059958637428, "ground_truth": 0}, {"key": "36322869", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6531268976100572, "ground_truth": 0}, {"key": "36322869", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442251108642343, "ground_truth": 0}, {"key": "36322869", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6859494734264797, "ground_truth": 0}, {"key": "36322869", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684550795338, "ground_truth": 0}, {"key": "36322869", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.505859142674947, "ground_truth": 0}, {"key": "39459717", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995595838528, "ground_truth": 0}, {"key": "39459717", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5583269845454548, "ground_truth": 0}, {"key": "39459717", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6057990420170615, "ground_truth": 0}, {"key": "39459717", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723796319876, "ground_truth": 0}, {"key": "39459717", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512047421868, "ground_truth": 0}, {"key": "36503727", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405054495205614, "ground_truth": 0}, {"key": "36503727", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46879060877264633, "ground_truth": 0}, {"key": "36503727", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2720245642495057, "ground_truth": 0}, {"key": "36503727", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941409023979941, "ground_truth": 0}, {"key": "36503727", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645990658049, "ground_truth": 0}, {"key": "35682367", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292633947325326, "ground_truth": 0}, {"key": "35682367", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880164873377, "ground_truth": 0}, {"key": "35682367", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38121957679415663, "ground_truth": 0}, {"key": "35682367", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591084657911, "ground_truth": 0}, {"key": "35682367", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984280250893, "ground_truth": 0}, {"key": "36472353", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25238402616341077, "ground_truth": 0}, {"key": "36472353", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23934933321346533, "ground_truth": 0}, {"key": "36472353", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24508500424057228, "ground_truth": 0}, {"key": "36472353", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181322553291575, "ground_truth": 0}, {"key": "36472353", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398630055411257, "ground_truth": 0}, {"key": "37651907", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.552539727238868, "ground_truth": 0}, {"key": "37651907", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29259531202701655, "ground_truth": 0}, {"key": "37651907", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25386099500588105, "ground_truth": 0}, {"key": "37651907", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233679599186067, "ground_truth": 0}, {"key": "37651907", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004180844406, "ground_truth": 0}, {"key": "36255476", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37754066928636265, "ground_truth": 0}, {"key": "36255476", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49023559845901676, "ground_truth": 0}, {"key": "36255476", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5097644001474446, "ground_truth": 0}, {"key": "36255476", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702868478359, "ground_truth": 0}, {"key": "36255476", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381555392569, "ground_truth": 0}, {"key": "37283518", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819886753769, "ground_truth": 0}, {"key": "37283518", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7233094990156624, "ground_truth": 0}, {"key": "37283518", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6808786117150348, "ground_truth": 0}, {"key": "37283518", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615518786516, "ground_truth": 0}, {"key": "37283518", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512673509343, "ground_truth": 0}, {"key": "34906785", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3904758424220413, "ground_truth": 0}, {"key": "34906785", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2583259947032914, "ground_truth": 0}, {"key": "34906785", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3557748826095253, "ground_truth": 0}, {"key": "34906785", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775637140545, "ground_truth": 0}, {"key": "34906785", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206881998909696, "ground_truth": 0}, {"key": "34965328", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6619228873031775, "ground_truth": 0}, {"key": "34965328", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "34965328", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48242910963414354, "ground_truth": 0}, {"key": "34965328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506407981299, "ground_truth": 0}, {"key": "34965328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849479861793, "ground_truth": 0}, {"key": "38788440", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14608724684048335, "ground_truth": 0}, {"key": "38788440", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.120025639658712, "ground_truth": 0}, {"key": "38788440", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1490352987166555, "ground_truth": 0}, {"key": "38788440", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.158174350648526, "ground_truth": 0}, {"key": "38788440", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739039766430281, "ground_truth": 0}, {"key": "35046866", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7106282912068733, "ground_truth": 0}, {"key": "35046866", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49804690497345816, "ground_truth": 0}, {"key": "35046866", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584174893634785, "ground_truth": 0}, {"key": "35046866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191429601428, "ground_truth": 0}, {"key": "35046866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358296285961, "ground_truth": 0}, {"key": "37629558", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44552952860119444, "ground_truth": 0}, {"key": "37629558", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36116471681632895, "ground_truth": 0}, {"key": "37629558", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42059958993329444, "ground_truth": 0}, {"key": "37629558", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2379298756424627, "ground_truth": 0}, {"key": "37629558", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074558247110456, "ground_truth": 0}, {"key": "33859914", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6224593464052557, "ground_truth": 0}, {"key": "33859914", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5583269793824375, "ground_truth": 0}, {"key": "33859914", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6424325001460318, "ground_truth": 0}, {"key": "33859914", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238677990674, "ground_truth": 0}, {"key": "33859914", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593415541925, "ground_truth": 0}, {"key": "39790523", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7185944061648343, "ground_truth": 0}, {"key": "39790523", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4687906118909055, "ground_truth": 0}, {"key": "39790523", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4687906150073685, "ground_truth": 0}, {"key": "39790523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700960918518, "ground_truth": 0}, {"key": "39790523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204877712337997, "ground_truth": 0}, {"key": "33509656", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18594718527813356, "ground_truth": 0}, {"key": "33509656", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2005576814121306, "ground_truth": 0}, {"key": "33509656", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2845759968191118, "ground_truth": 0}, {"key": "33509656", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588049902084704, "ground_truth": 0}, {"key": "33509656", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2436424454013678, "ground_truth": 0}, {"key": "17380923", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.426321600349765, "ground_truth": 0}, {"key": "17380923", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794004272954326, "ground_truth": 0}, {"key": "17380923", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5964331467403479, "ground_truth": 0}, {"key": "17380923", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324791296382, "ground_truth": 0}, {"key": "17380923", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43590150301082853, "ground_truth": 0}, {"key": "36202526", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35577489849951427, "ground_truth": 0}, {"key": "36202526", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46879061280218953, "ground_truth": 0}, {"key": "36202526", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.315735971437645, "ground_truth": 0}, {"key": "36202526", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746183338356, "ground_truth": 0}, {"key": "36202526", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295360543132, "ground_truth": 0}, {"key": "26419232", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4629586041071333, "ground_truth": 0}, {"key": "26419232", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4455295227522545, "ground_truth": 0}, {"key": "26419232", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4824291242374404, "ground_truth": 0}, {"key": "26419232", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490156684042194, "ground_truth": 0}, {"key": "26419232", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982763329021176, "ground_truth": 0}, {"key": "34232398", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318346732044, "ground_truth": 0}, {"key": "34232398", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5907791878620036, "ground_truth": 0}, {"key": "34232398", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6774740225716582, "ground_truth": 0}, {"key": "34232398", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734703644041, "ground_truth": 0}, {"key": "34232398", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434893145221, "ground_truth": 0}, {"key": "33586045", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526492848608, "ground_truth": 0}, {"key": "33586045", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061652321145, "ground_truth": 0}, {"key": "33586045", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953656478988, "ground_truth": 0}, {"key": "33586045", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733340318028627, "ground_truth": 0}, {"key": "33586045", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704561954358, "ground_truth": 0}, {"key": "32281151", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242354233202013, "ground_truth": 0}, {"key": "32281151", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21601154472745648, "ground_truth": 0}, {"key": "32281151", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186969144487583, "ground_truth": 0}, {"key": "32281151", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010664584865888, "ground_truth": 0}, {"key": "32281151", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869691350677035, "ground_truth": 0}, {"key": "37308159", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711373620898, "ground_truth": 0}, {"key": "37308159", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.411110852876465, "ground_truth": 0}, {"key": "37308159", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397196615603, "ground_truth": 0}, {"key": "37308159", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735181620918, "ground_truth": 0}, {"key": "37308159", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.656658294370695, "ground_truth": 0}, {"key": "35694408", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3942009760334496, "ground_truth": 0}, {"key": "35694408", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8255897310975693, "ground_truth": 0}, {"key": "35694408", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33111975076421546, "ground_truth": 0}, {"key": "35694408", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740391670494, "ground_truth": 0}, {"key": "35694408", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165311883328, "ground_truth": 0}, {"key": "39781995", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3007455996365333, "ground_truth": 0}, {"key": "39781995", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2845759850298131, "ground_truth": 0}, {"key": "39781995", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3812195690486253, "ground_truth": 0}, {"key": "39781995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2479874180922765, "ground_truth": 0}, {"key": "39781995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149657936145, "ground_truth": 0}, {"key": "22799372", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.744656331336923, "ground_truth": 0}, {"key": "22799372", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8300437692880479, "ground_truth": 0}, {"key": "22799372", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8757869819739328, "ground_truth": 0}, {"key": "22799372", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625195272359, "ground_truth": 0}, {"key": "22799372", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744792139042, "ground_truth": 0}, {"key": "37428240", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26894145547660203, "ground_truth": 0}, {"key": "37428240", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.501953123655432, "ground_truth": 0}, {"key": "37428240", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46101680006266593, "ground_truth": 0}, {"key": "37428240", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455802647774, "ground_truth": 0}, {"key": "37428240", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519858955827835, "ground_truth": 0}, {"key": "40612657", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7648916015098952, "ground_truth": 0}, {"key": "40612657", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8449215267556183, "ground_truth": 0}, {"key": "40612657", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6548947169660025, "ground_truth": 0}, {"key": "40612657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.737158148938801, "ground_truth": 0}, {"key": "40612657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096122447175, "ground_truth": 0}, {"key": "34404662", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6297745875786018, "ground_truth": 0}, {"key": "34404662", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4073334022021043, "ground_truth": 0}, {"key": "34404662", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7310585760336594, "ground_truth": 0}, {"key": "34404662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137077946636, "ground_truth": 0}, {"key": "34404662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121755198407, "ground_truth": 0}, {"key": "32619704", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29583986127560535, "ground_truth": 0}, {"key": "32619704", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.226783613458517, "ground_truth": 0}, {"key": "32619704", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.381219573367567, "ground_truth": 0}, {"key": "32619704", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910970863363, "ground_truth": 0}, {"key": "32619704", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237110067707, "ground_truth": 0}, {"key": "39014883", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4436004172523959, "ground_truth": 0}, {"key": "39014883", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4785288310449473, "ground_truth": 0}, {"key": "39014883", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31573596579016433, "ground_truth": 0}, {"key": "39014883", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986094173916, "ground_truth": 0}, {"key": "39014883", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111085239522155, "ground_truth": 0}, {"key": "37982812", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1895210890533398, "ground_truth": 0}, {"key": "37982812", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15405755485414066, "ground_truth": 0}, {"key": "37982812", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2925953102342683, "ground_truth": 0}, {"key": "37982812", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1561048932984091, "ground_truth": 0}, {"key": "37982812", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304215538419635, "ground_truth": 0}, {"key": "28123476", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18952109457649258, "ground_truth": 0}, {"key": "28123476", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4073333853643181, "ground_truth": 0}, {"key": "28123476", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5078118397999687, "ground_truth": 0}, {"key": "28123476", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320634106525212, "ground_truth": 0}, {"key": "28123476", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30735799100215105, "ground_truth": 0}, {"key": "39078849", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38676344175350263, "ground_truth": 0}, {"key": "39078849", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3629691998627967, "ground_truth": 0}, {"key": "39078849", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4092207951586954, "ground_truth": 0}, {"key": "39078849", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073334081337786, "ground_truth": 0}, {"key": "39078849", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881265961863, "ground_truth": 0}, {"key": "39414137", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711317393121, "ground_truth": 0}, {"key": "39414137", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331516279662, "ground_truth": 0}, {"key": "39414137", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5467381799546219, "ground_truth": 0}, {"key": "39414137", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688074058324, "ground_truth": 0}, {"key": "39414137", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396974656899, "ground_truth": 0}, {"key": "37371354", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39793841639125843, "ground_truth": 0}, {"key": "37371354", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6001883738132665, "ground_truth": 0}, {"key": "37371354", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31742625296133276, "ground_truth": 0}, {"key": "37371354", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668520527861, "ground_truth": 0}, {"key": "37371354", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937839062280393, "ground_truth": 0}, {"key": "29497179", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526395376783, "ground_truth": 0}, {"key": "29497179", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4513265134605838, "ground_truth": 0}, {"key": "29497179", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525396902344535, "ground_truth": 0}, {"key": "29497179", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634187147128, "ground_truth": 0}, {"key": "29497179", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174925264848, "ground_truth": 0}, {"key": "35908694", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6825737631931803, "ground_truth": 0}, {"key": "35908694", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7106282980638865, "ground_truth": 0}, {"key": "35908694", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8376199604947775, "ground_truth": 0}, {"key": "35908694", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898694762646, "ground_truth": 0}, {"key": "35908694", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253836675817, "ground_truth": 0}, {"key": "37619358", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4513265329346268, "ground_truth": 0}, {"key": "37619358", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6723316804581033, "ground_truth": 0}, {"key": "37619358", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6706082673845339, "ground_truth": 0}, {"key": "37619358", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101677311858696, "ground_truth": 0}, {"key": "37619358", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396963299432, "ground_truth": 0}, {"key": "37293103", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6150878484633987, "ground_truth": 0}, {"key": "37293103", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185462376478, "ground_truth": 0}, {"key": "37293103", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.527316522117523, "ground_truth": 0}, {"key": "37293103", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943158859167, "ground_truth": 0}, {"key": "37293103", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995995083819, "ground_truth": 0}, {"key": "36883729", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28616925326347414, "ground_truth": 0}, {"key": "36883729", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1789558887365543, "ground_truth": 0}, {"key": "36883729", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24364239256929296, "ground_truth": 0}, {"key": "36883729", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2005576867828664, "ground_truth": 0}, {"key": "36883729", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076630459755225, "ground_truth": 0}, {"key": "39209521", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46879064099856943, "ground_truth": 0}, {"key": "39209521", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984188449425, "ground_truth": 0}, {"key": "39209521", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4941408495834771, "ground_truth": 0}, {"key": "39209521", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256018753436, "ground_truth": 0}, {"key": "39209521", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331473963159, "ground_truth": 0}, {"key": "27792571", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5832033575498328, "ground_truth": 0}, {"key": "27792571", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7041601556920912, "ground_truth": 0}, {"key": "27792571", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38491212870065, "ground_truth": 0}, {"key": "27792571", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224214693789, "ground_truth": 0}, {"key": "27792571", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891266254195, "ground_truth": 0}, {"key": "39755647", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6757645871959777, "ground_truth": 0}, {"key": "39755647", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7025300552062891, "ground_truth": 0}, {"key": "39755647", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5370413893430332, "ground_truth": 0}, {"key": "39755647", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030810036734, "ground_truth": 0}, {"key": "39755647", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121772605272, "ground_truth": 0}, {"key": "40800537", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.273574400273715, "ground_truth": 0}, {"key": "40800537", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32766830371938993, "ground_truth": 0}, {"key": "40800537", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32594952152383866, "ground_truth": 0}, {"key": "40800537", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127791955338, "ground_truth": 0}, {"key": "40800537", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408918617272, "ground_truth": 0}, {"key": "14171461", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31236998887265766, "ground_truth": 0}, {"key": "14171461", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688144084301, "ground_truth": 0}, {"key": "14171461", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4016877998509867, "ground_truth": 0}, {"key": "14171461", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455960005144, "ground_truth": 0}, {"key": "14171461", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.430147340545247, "ground_truth": 0}, {"key": "36892440", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32252597657758697, "ground_truth": 0}, {"key": "36892440", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2523840472197008, "ground_truth": 0}, {"key": "36892440", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35398631512409084, "ground_truth": 0}, {"key": "36892440", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1634454611410258, "ground_truth": 0}, {"key": "36892440", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436734346206, "ground_truth": 0}, {"key": "33733410", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32252597789097603, "ground_truth": 0}, {"key": "33733410", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.350421397371011, "ground_truth": 0}, {"key": "33733410", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3522017864283599, "ground_truth": 0}, {"key": "33733410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458942552548665, "ground_truth": 0}, {"key": "33733410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2365162403250335, "ground_truth": 0}, {"key": "38587765", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07864237860735923, "ground_truth": 0}, {"key": "38587765", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09467769451696194, "ground_truth": 0}, {"key": "38587765", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06804042076815707, "ground_truth": 0}, {"key": "38587765", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07211220567947761, "ground_truth": 0}, {"key": "38587765", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09203286282565656, "ground_truth": 0}, {"key": "41065582", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2845759975315909, "ground_truth": 0}, {"key": "41065582", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.577495353345594, "ground_truth": 0}, {"key": "41065582", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3593641575294815, "ground_truth": 0}, {"key": "41065582", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473259476077, "ground_truth": 0}, {"key": "41065582", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586258853321, "ground_truth": 0}, {"key": "34713891", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231011838793542, "ground_truth": 0}, {"key": "34713891", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.0881900371727051, "ground_truth": 0}, {"key": "34713891", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1393963911273216, "ground_truth": 0}, {"key": "34713891", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10669059519252339, "ground_truth": 0}, {"key": "34713891", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15507848530496224, "ground_truth": 0}, {"key": "18913023", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.571766587160599, "ground_truth": 0}, {"key": "18913023", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7025300536748482, "ground_truth": 0}, {"key": "18913023", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6757646042640614, "ground_truth": 0}, {"key": "18913023", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023559498840846, "ground_truth": 0}, {"key": "18913023", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.468790622221462, "ground_truth": 0}, {"key": "36884100", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26740816910265214, "ground_truth": 0}, {"key": "36884100", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3293917095191058, "ground_truth": 0}, {"key": "36884100", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43014738104655875, "ground_truth": 0}, {"key": "36884100", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052889270432, "ground_truth": 0}, {"key": "36884100", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905274412968, "ground_truth": 0}, {"key": "39899913", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32252597561008384, "ground_truth": 0}, {"key": "39899913", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25238404794118063, "ground_truth": 0}, {"key": "39899913", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4359015376816668, "ground_truth": 0}, {"key": "39899913", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307461052516343, "ground_truth": 0}, {"key": "39899913", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36116472282554385, "ground_truth": 0}, {"key": "30725366", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06142403993885182, "ground_truth": 0}, {"key": "30725366", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18126321191803646, "ground_truth": 0}, {"key": "30725366", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.05834585118911213, "ground_truth": 0}, {"key": "30725366", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347851398635, "ground_truth": 0}, {"key": "30725366", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.03846619159188545, "ground_truth": 0}, {"key": "26133523", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405057048855295, "ground_truth": 0}, {"key": "26133523", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3345894612478089, "ground_truth": 0}, {"key": "26133523", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48242911848163184, "ground_truth": 0}, {"key": "26133523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552951935481067, "ground_truth": 0}, {"key": "26133523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519861036721704, "ground_truth": 0}, {"key": "29332665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7185943798750904, "ground_truth": 0}, {"key": "29332665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7201715089206322, "ground_truth": 0}, {"key": "29332665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6279512133986688, "ground_truth": 0}, {"key": "29332665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634099694702, "ground_truth": 0}, {"key": "29332665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.602061578587489, "ground_truth": 0}, {"key": "37400481", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5640985077917748, "ground_truth": 0}, {"key": "37400481", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7918210716431205, "ground_truth": 0}, {"key": "37400481", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.840782603109975, "ground_truth": 0}, {"key": "37400481", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867812897568, "ground_truth": 0}, {"key": "37400481", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354837305331, "ground_truth": 0}, {"key": "38787241", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2877678250933924, "ground_truth": 0}, {"key": "38787241", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6859494272382535, "ground_truth": 0}, {"key": "38787241", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48828340158029515, "ground_truth": 0}, {"key": "38787241", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823338066891825, "ground_truth": 0}, {"key": "38787241", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366064408549, "ground_truth": 0}, {"key": "38225963", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41111090548522694, "ground_truth": 0}, {"key": "38225963", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7371581651568234, "ground_truth": 0}, {"key": "38225963", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6601723605570267, "ground_truth": 0}, {"key": "38225963", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581079578307, "ground_truth": 0}, {"key": "38225963", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238605210737, "ground_truth": 0}, {"key": "26072034", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10894505096590354, "ground_truth": 0}, {"key": "26072034", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1422318891189471, "ground_truth": 0}, {"key": "26072034", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08151974864645942, "ground_truth": 0}, {"key": "26072034", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483938654388, "ground_truth": 0}, {"key": "26072034", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017221497049372, "ground_truth": 0}, {"key": "35690810", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43206341388326913, "ground_truth": 0}, {"key": "35690810", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4590761321683615, "ground_truth": 0}, {"key": "35690810", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6442250956288433, "ground_truth": 0}, {"key": "35690810", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828339281450267, "ground_truth": 0}, {"key": "35690810", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969252580961, "ground_truth": 0}, {"key": "36855665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.920217992007082, "ground_truth": 0}, {"key": "36855665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.903974510041543, "ground_truth": 0}, {"key": "36855665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8732148227019783, "ground_truth": 0}, {"key": "36855665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.872347371180161, "ground_truth": 0}, {"key": "36855665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673021350864, "ground_truth": 0}, {"key": "29757662", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3812195757230795, "ground_truth": 0}, {"key": "29757662", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688143940212, "ground_truth": 0}, {"key": "29757662", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40356687304435296, "ground_truth": 0}, {"key": "29757662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807710824749027, "ground_truth": 0}, {"key": "29757662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922082558975004, "ground_truth": 0}, {"key": "19134339", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4863315162125821, "ground_truth": 0}, {"key": "19134339", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5448013862169335, "ground_truth": 0}, {"key": "19134339", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.312369997774279, "ground_truth": 0}, {"key": "19134339", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233681511151414, "ground_truth": 0}, {"key": "19134339", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814719949355, "ground_truth": 0}, {"key": "35360732", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318206490613, "ground_truth": 0}, {"key": "35360732", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953560843678, "ground_truth": 0}, {"key": "35360732", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7356416541238648, "ground_truth": 0}, {"key": "35360732", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264255817775219, "ground_truth": 0}, {"key": "35360732", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.661922865478991, "ground_truth": 0}, {"key": "37713629", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047585961373577, "ground_truth": 0}, {"key": "37713629", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6076631421596366, "ground_truth": 0}, {"key": "37713629", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.432063382241969, "ground_truth": 0}, {"key": "37713629", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082131320149376, "ground_truth": 0}, {"key": "37713629", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591033932588, "ground_truth": 0}, {"key": "33393394", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5832033544081809, "ground_truth": 0}, {"key": "33393394", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2146914432566468, "ground_truth": 0}, {"key": "33393394", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1623800351111472, "ground_truth": 0}, {"key": "33393394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2365162395855993, "ground_truth": 0}, {"key": "33393394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2450850226869755, "ground_truth": 0}, {"key": "32275837", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6774740243494008, "ground_truth": 0}, {"key": "32275837", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7295197732055579, "ground_truth": 0}, {"key": "32275837", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8816149115645651, "ground_truth": 0}, {"key": "32275837", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011685994567, "ground_truth": 0}, {"key": "32275837", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527439177894, "ground_truth": 0}, {"key": "21458094", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.583203347536607, "ground_truth": 0}, {"key": "21458094", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5019531032328075, "ground_truth": 0}, {"key": "21458094", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6039318358736732, "ground_truth": 0}, {"key": "21458094", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216138965456, "ground_truth": 0}, {"key": "21458094", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174962158607, "ground_truth": 0}, {"key": "40975362", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34687310955665007, "ground_truth": 0}, {"key": "40975362", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938462692382, "ground_truth": 0}, {"key": "40975362", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186968805410508, "ground_truth": 0}, {"key": "40975362", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237000574946283, "ground_truth": 0}, {"key": "40975362", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367504807191, "ground_truth": 0}, {"key": "35234201", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37387583166516114, "ground_truth": 0}, {"key": "35234201", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45907611793443226, "ground_truth": 0}, {"key": "35234201", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27982852079924614, "ground_truth": 0}, {"key": "35234201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988608653051, "ground_truth": 0}, {"key": "35234201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756754358194104, "ground_truth": 0}, {"key": "36037573", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8031737931533051, "ground_truth": 0}, {"key": "36037573", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7759445356347436, "ground_truth": 0}, {"key": "36037573", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.786622831319344, "ground_truth": 0}, {"key": "36037573", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127464259737, "ground_truth": 0}, {"key": "36037573", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240827579362, "ground_truth": 0}, {"key": "30861915", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5253687977932663, "ground_truth": 0}, {"key": "30861915", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6636689492742762, "ground_truth": 0}, {"key": "30861915", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6757645955389632, "ground_truth": 0}, {"key": "30861915", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832016793086, "ground_truth": 0}, {"key": "30861915", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804439837544, "ground_truth": 0}, {"key": "40173012", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0960255021817026, "ground_truth": 0}, {"key": "40173012", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26740816676752444, "ground_truth": 0}, {"key": "40173012", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.158174350008845, "ground_truth": 0}, {"key": "40173012", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043419126231368, "ground_truth": 0}, {"key": "40173012", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206616260325676, "ground_truth": 0}, {"key": "35100330", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4610167960044538, "ground_truth": 0}, {"key": "35100330", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26588047714640506, "ground_truth": 0}, {"key": "35100330", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1766716168187278, "ground_truth": 0}, {"key": "35100330", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048021606576783, "ground_truth": 0}, {"key": "35100330", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220562262848822, "ground_truth": 0}, {"key": "37220221", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7943849614197039, "ground_truth": 0}, {"key": "37220221", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7786493091566642, "ground_truth": 0}, {"key": "37220221", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7772998446831229, "ground_truth": 0}, {"key": "37220221", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754679815866, "ground_truth": 0}, {"key": "37220221", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014022229688, "ground_truth": 0}, {"key": "38815218", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8080672048053139, "ground_truth": 0}, {"key": "38815218", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8164063716578437, "ground_truth": 0}, {"key": "38815218", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7956581099864034, "ground_truth": 0}, {"key": "38815218", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419822063035, "ground_truth": 0}, {"key": "38815218", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951133087548, "ground_truth": 0}, {"key": "39379109", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34510527186604617, "ground_truth": 0}, {"key": "39379109", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19193277438764333, "ground_truth": 0}, {"key": "39379109", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27825681560063614, "ground_truth": 0}, {"key": "39379109", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647290568057, "ground_truth": 0}, {"key": "39379109", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758347659944, "ground_truth": 0}, {"key": "14576125", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07263670724305749, "ground_truth": 0}, {"key": "14576125", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26133093159251064, "ground_truth": 0}, {"key": "14576125", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23651624443261718, "ground_truth": 0}, {"key": "14576125", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.134775913550588, "ground_truth": 0}, {"key": "14576125", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10521053223778495, "ground_truth": 0}, {"key": "40814250", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526276896698, "ground_truth": 0}, {"key": "40814250", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.869714576605658, "ground_truth": 0}, {"key": "40814250", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48047868471005356, "ground_truth": 0}, {"key": "40814250", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512974892145176, "ground_truth": 0}, {"key": "40814250", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468837771696, "ground_truth": 0}, {"key": "36334488", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601153884479063, "ground_truth": 0}, {"key": "36334488", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18713266467730338, "ground_truth": 0}, {"key": "36334488", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15610489779870654, "ground_truth": 0}, {"key": "36334488", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09947022327954202, "ground_truth": 0}, {"key": "36334488", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1338674899422361, "ground_truth": 0}, {"key": "36888322", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40733340992890277, "ground_truth": 0}, {"key": "36888322", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984279798908, "ground_truth": 0}, {"key": "36888322", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3611647321828905, "ground_truth": 0}, {"key": "36888322", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947215158336, "ground_truth": 0}, {"key": "36888322", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586228775669, "ground_truth": 0}, {"key": "37318916", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9314625155144822, "ground_truth": 0}, {"key": "37318916", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5945512573913976, "ground_truth": 0}, {"key": "37318916", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9429286040416743, "ground_truth": 0}, {"key": "37318916", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9623913622011556, "ground_truth": 0}, {"key": "37318916", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286038013311, "ground_truth": 0}, {"key": "39308700", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17553808222120096, "ground_truth": 0}, {"key": "39308700", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39047582655681023, "ground_truth": 0}, {"key": "39308700", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23934934610877012, "ground_truth": 0}, {"key": "39308700", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000709991377257, "ground_truth": 0}, {"key": "39308700", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601152828987208, "ground_truth": 0}, {"key": "31061543", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5078118655944459, "ground_truth": 0}, {"key": "31061543", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7154239911368943, "ground_truth": 0}, {"key": "31061543", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5926666097620071, "ground_truth": 0}, {"key": "31061543", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281589082243, "ground_truth": 0}, {"key": "31061543", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582789255337, "ground_truth": 0}, {"key": "37380894", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7648915942175111, "ground_truth": 0}, {"key": "37380894", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43014733333889893, "ground_truth": 0}, {"key": "37380894", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5907791902743098, "ground_truth": 0}, {"key": "37380894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013880653968, "ground_truth": 0}, {"key": "37380894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494552276275, "ground_truth": 0}, {"key": "38410139", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4455295256272277, "ground_truth": 0}, {"key": "38410139", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4244119768897418, "ground_truth": 0}, {"key": "38410139", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.569852634968695, "ground_truth": 0}, {"key": "38410139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792095074438, "ground_truth": 0}, {"key": "38410139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047867847614195, "ground_truth": 0}, {"key": "35953842", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.50195308578592, "ground_truth": 0}, {"key": "35953842", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5813031003622594, "ground_truth": 0}, {"key": "35953842", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6261241636623233, "ground_truth": 0}, {"key": "35953842", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615921342608, "ground_truth": 0}, {"key": "35953842", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916058741299, "ground_truth": 0}, {"key": "39815663", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2379298848482755, "ground_truth": 0}, {"key": "39815663", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19072400495803335, "ground_truth": 0}, {"key": "39815663", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18952108026313955, "ground_truth": 0}, {"key": "39815663", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077459453494668, "ground_truth": 0}, {"key": "39815663", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132024777179882, "ground_truth": 0}, {"key": "35121432", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8333245860291192, "ground_truth": 0}, {"key": "35121432", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7057850205044643, "ground_truth": 0}, {"key": "35121432", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8056321628706211, "ground_truth": 0}, {"key": "35121432", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672095968536, "ground_truth": 0}, {"key": "35121432", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754229570023, "ground_truth": 0}, {"key": "21712310", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2583259687633589, "ground_truth": 0}, {"key": "21712310", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756751345645527, "ground_truth": 0}, {"key": "21712310", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17895589518702, "ground_truth": 0}, {"key": "21712310", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807713945914963, "ground_truth": 0}, {"key": "21712310", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238003479010613, "ground_truth": 0}, {"key": "37952914", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6020615694255051, "ground_truth": 0}, {"key": "37952914", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.844921512069703, "ground_truth": 0}, {"key": "37952914", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7853085909847397, "ground_truth": 0}, {"key": "37952914", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512581103223, "ground_truth": 0}, {"key": "37952914", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331443213338, "ground_truth": 0}, {"key": "38956779", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20055769185070005, "ground_truth": 0}, {"key": "38956779", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1835936269707846, "ground_truth": 0}, {"key": "38956779", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2814056039892096, "ground_truth": 0}, {"key": "38956779", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944725865282474, "ground_truth": 0}, {"key": "38956779", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506641205248, "ground_truth": 0}, {"key": "36101833", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7279754507774868, "ground_truth": 0}, {"key": "36101833", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38676342637675676, "ground_truth": 0}, {"key": "36101833", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7490872033944835, "ground_truth": 0}, {"key": "36101833", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008947940782858, "ground_truth": 0}, {"key": "36101833", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094733741571, "ground_truth": 0}, {"key": "35544662", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4244120065298791, "ground_truth": 0}, {"key": "35544662", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800964021259, "ground_truth": 0}, {"key": "35544662", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7008947893839813, "ground_truth": 0}, {"key": "35544662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389970318998, "ground_truth": 0}, {"key": "35544662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320634023432524, "ground_truth": 0}, {"key": "39759044", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0987725861785493, "ground_truth": 0}, {"key": "39759044", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2465333579273673, "ground_truth": 0}, {"key": "39759044", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18713267650937057, "ground_truth": 0}, {"key": "39759044", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594719111328487, "ground_truth": 0}, {"key": "39759044", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336561210315616, "ground_truth": 0}, {"key": "39433018", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7745833926579178, "ground_truth": 0}, {"key": "39433018", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7122321987197224, "ground_truth": 0}, {"key": "39433018", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7217432142749933, "ground_truth": 0}, {"key": "39433018", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228341306847, "ground_truth": 0}, {"key": "39433018", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105496900234, "ground_truth": 0}, {"key": "22111959", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3311197323365723, "ground_truth": 0}, {"key": "22111959", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24508499638519107, "ground_truth": 0}, {"key": "22111959", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953519424729962, "ground_truth": 0}, {"key": "22111959", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910751504754, "ground_truth": 0}, {"key": "22111959", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2254166118700611, "ground_truth": 0}, {"key": "38210094", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18832396918121386, "ground_truth": 0}, {"key": "38210094", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19682621464464356, "ground_truth": 0}, {"key": "38210094", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5660185515708989, "ground_truth": 0}, {"key": "38210094", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245326559792, "ground_truth": 0}, {"key": "38210094", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905276408234, "ground_truth": 0}, {"key": "37675935", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4111108955743406, "ground_truth": 0}, {"key": "37675935", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40356683421531836, "ground_truth": 0}, {"key": "37675935", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5273165338751453, "ground_truth": 0}, {"key": "37675935", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609381284840715, "ground_truth": 0}, {"key": "37675935", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.631594291088123, "ground_truth": 0}, {"key": "35732604", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15304215139113087, "ground_truth": 0}, {"key": "35732604", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11357959463815556, "ground_truth": 0}, {"key": "35732604", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231015087880136, "ground_truth": 0}, {"key": "35732604", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08694165994594447, "ground_truth": 0}, {"key": "35732604", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.06903791856535009, "ground_truth": 0}, {"key": "27453212", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4339814890298819, "ground_truth": 0}, {"key": "27453212", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4455295265130765, "ground_truth": 0}, {"key": "27453212", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3575675303231319, "ground_truth": 0}, {"key": "27453212", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881439819176, "ground_truth": 0}, {"key": "27453212", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195602001083, "ground_truth": 0}, {"key": "39910047", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3073580130609543, "ground_truth": 0}, {"key": "39910047", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5273165347274043, "ground_truth": 0}, {"key": "39910047", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2186693565851349, "ground_truth": 0}, {"key": "39910047", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678140577195, "ground_truth": 0}, {"key": "39910047", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508499901662079, "ground_truth": 0}, {"key": "40054265", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14033626214348835, "ground_truth": 0}, {"key": "40054265", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22405542154092112, "ground_truth": 0}, {"key": "40054265", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.261330919510577, "ground_truth": 0}, {"key": "40054265", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000710260018938, "ground_truth": 0}, {"key": "40054265", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337717016136465, "ground_truth": 0}, {"key": "19984615", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25982563313721735, "ground_truth": 0}, {"key": "19984615", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39981164866215224, "ground_truth": 0}, {"key": "19984615", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3702253936792095, "ground_truth": 0}, {"key": "19984615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748898254327, "ground_truth": 0}, {"key": "19984615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18713269018456663, "ground_truth": 0}, {"key": "16490806", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30074556927116286, "ground_truth": 0}, {"key": "16490806", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3960681673976149, "ground_truth": 0}, {"key": "16490806", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3433417018190633, "ground_truth": 0}, {"key": "16490806", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910771030145, "ground_truth": 0}, {"key": "16490806", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046382751335, "ground_truth": 0}, {"key": "36396237", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.905989824798781, "ground_truth": 0}, {"key": "36396237", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8723473825891112, "ground_truth": 0}, {"key": "36396237", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8697145697875068, "ground_truth": 0}, {"key": "36396237", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467629410606, "ground_truth": 0}, {"key": "36396237", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549505384378, "ground_truth": 0}, {"key": "40726444", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7786493112629839, "ground_truth": 0}, {"key": "40726444", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6619228791313743, "ground_truth": 0}, {"key": "40726444", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3007455671327312, "ground_truth": 0}, {"key": "40726444", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746026024623214, "ground_truth": 0}, {"key": "40726444", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520720203122, "ground_truth": 0}, {"key": "37314826", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22135067794218413, "ground_truth": 0}, {"key": "37314826", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.195594086719618, "ground_truth": 0}, {"key": "37314826", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2751297070091415, "ground_truth": 0}, {"key": "37314826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806417730766876, "ground_truth": 0}, {"key": "37314826", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969149171946, "ground_truth": 0}, {"key": "38506971", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6076631731602489, "ground_truth": 0}, {"key": "38506971", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4649015535856114, "ground_truth": 0}, {"key": "38506971", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4301473282341198, "ground_truth": 0}, {"key": "38506971", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531544618819, "ground_truth": 0}, {"key": "38506971", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256299226908, "ground_truth": 0}, {"key": "40699312", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6706082674761574, "ground_truth": 0}, {"key": "40699312", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7704647882135872, "ground_truth": 0}, {"key": "40699312", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.70901916117662, "ground_truth": 0}, {"key": "40699312", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936363300628, "ground_truth": 0}, {"key": "40699312", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336989591825, "ground_truth": 0}, {"key": "34695474", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5370413794120215, "ground_truth": 0}, {"key": "34695474", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5273164919409976, "ground_truth": 0}, {"key": "34695474", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37754065477896503, "ground_truth": 0}, {"key": "34695474", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121606529199, "ground_truth": 0}, {"key": "34695474", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783706970644, "ground_truth": 0}, {"key": "36281498", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4148988539707688, "ground_truth": 0}, {"key": "36281498", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4571366971518798, "ground_truth": 0}, {"key": "36281498", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21076630603119278, "ground_truth": 0}, {"key": "36281498", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035514376995, "ground_truth": 0}, {"key": "36281498", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218815337292704, "ground_truth": 0}, {"key": "39558652", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3023910933789799, "ground_truth": 0}, {"key": "39558652", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117166020267694, "ground_truth": 0}, {"key": "39558652", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5467381653429608, "ground_truth": 0}, {"key": "39558652", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935328692545, "ground_truth": 0}, {"key": "39558652", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.638835284178847, "ground_truth": 0}, {"key": "37330579", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12506537883137345, "ground_truth": 0}, {"key": "37330579", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14223188580186674, "ground_truth": 0}, {"key": "37330579", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11596071126446007, "ground_truth": 0}, {"key": "37330579", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592275255017404, "ground_truth": 0}, {"key": "37330579", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13939637367891314, "ground_truth": 0}, {"key": "40547658", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19314738515925914, "ground_truth": 0}, {"key": "40547658", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331507515135, "ground_truth": 0}, {"key": "40547658", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2974699526445427, "ground_truth": 0}, {"key": "40547658", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834905568989, "ground_truth": 0}, {"key": "40547658", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681659231718, "ground_truth": 0}, {"key": "37119340", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3575675278657476, "ground_truth": 0}, {"key": "37119340", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2613309382295664, "ground_truth": 0}, {"key": "37119340", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17217184258877957, "ground_truth": 0}, {"key": "37119340", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2323101335259598, "ground_truth": 0}, {"key": "37119340", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2120688131763155, "ground_truth": 0}, {"key": "35301627", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4843801048809354, "ground_truth": 0}, {"key": "35301627", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6842639918722184, "ground_truth": 0}, {"key": "35301627", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397178364139, "ground_truth": 0}, {"key": "35301627", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136783852215, "ground_truth": 0}, {"key": "35301627", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898641222161, "ground_truth": 0}, {"key": "34037168", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16559311469361523, "ground_truth": 0}, {"key": "34037168", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3293917241421637, "ground_truth": 0}, {"key": "34037168", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15713686901999757, "ground_truth": 0}, {"key": "34037168", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921741458074412, "ground_truth": 0}, {"key": "34037168", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1710611931113416, "ground_truth": 0}, {"key": "39703862", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7772998637834249, "ground_truth": 0}, {"key": "39703862", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026758997567, "ground_truth": 0}, {"key": "39703862", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5945512831090313, "ground_truth": 0}, {"key": "39703862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175054591556, "ground_truth": 0}, {"key": "39703862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316979487813, "ground_truth": 0}, {"key": "16554814", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13028541227187082, "ground_truth": 0}, {"key": "16554814", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2958398496568923, "ground_truth": 0}, {"key": "16554814", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46684559732284564, "ground_truth": 0}, {"key": "16554814", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1356895440060151, "ground_truth": 0}, {"key": "16554814", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16559311950158218, "ground_truth": 0}, {"key": "32983099", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4532618479212222, "ground_truth": 0}, {"key": "32983099", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756752464978414, "ground_truth": 0}, {"key": "32983099", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4301473498743879, "ground_truth": 0}, {"key": "32983099", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014737944819076, "ground_truth": 0}, {"key": "32983099", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610111415986, "ground_truth": 0}, {"key": "41072994", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36296918559237457, "ground_truth": 0}, {"key": "41072994", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1645164700023198, "ground_truth": 0}, {"key": "41072994", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5621765097699065, "ground_truth": 0}, {"key": "41072994", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195614142291, "ground_truth": 0}, {"key": "41072994", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469140950296417, "ground_truth": 0}, {"key": "38396247", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7041601346755354, "ground_truth": 0}, {"key": "38396247", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6113819436648502, "ground_truth": 0}, {"key": "38396247", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5544704318748884, "ground_truth": 0}, {"key": "38396247", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248703083980342, "ground_truth": 0}, {"key": "38396247", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416499211463, "ground_truth": 0}, {"key": "37507998", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24220559912077955, "ground_truth": 0}, {"key": "37507998", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2494472477681772, "ground_truth": 0}, {"key": "37507998", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35756750116202796, "ground_truth": 0}, {"key": "37507998", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457602602521126, "ground_truth": 0}, {"key": "37507998", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641490584482, "ground_truth": 0}, {"key": "32593929", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2120688056060818, "ground_truth": 0}, {"key": "32593929", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058591119049651, "ground_truth": 0}, {"key": "32593929", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1919327799661316, "ground_truth": 0}, {"key": "32593929", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375292263695, "ground_truth": 0}, {"key": "32593929", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675106911504, "ground_truth": 0}, {"key": "36056449", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.51952130182298, "ground_truth": 0}, {"key": "36056449", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44939263901249965, "ground_truth": 0}, {"key": "36056449", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5602526579898376, "ground_truth": 0}, {"key": "36056449", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992543992837061, "ground_truth": 0}, {"key": "36056449", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629585952592606, "ground_truth": 0}, {"key": "21986185", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.04958902251316358, "ground_truth": 0}, {"key": "21986185", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.06512755252555007, "ground_truth": 0}, {"key": "21986185", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06656919055406875, "ground_truth": 0}, {"key": "21986185", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07477004215674563, "ground_truth": 0}, {"key": "21986185", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.060086652618809785, "ground_truth": 0}, {"key": "40757465", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2538610072767292, "ground_truth": 0}, {"key": "40757465", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4610167955409631, "ground_truth": 0}, {"key": "40757465", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2553436515575266, "ground_truth": 0}, {"key": "40757465", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405054120284237, "ground_truth": 0}, {"key": "40757465", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28298812084292857, "ground_truth": 0}, {"key": "35198313", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3174262534374696, "ground_truth": 0}, {"key": "35198313", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3867634210913263, "ground_truth": 0}, {"key": "35198313", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3345894585473072, "ground_truth": 0}, {"key": "35198313", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658971494173964, "ground_truth": 0}, {"key": "35198313", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262528437514, "ground_truth": 0}, {"key": "30604618", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.540923874527502, "ground_truth": 0}, {"key": "30604618", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5563995671969696, "ground_truth": 0}, {"key": "30604618", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.457136725455452, "ground_truth": 0}, {"key": "30604618", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633920527053, "ground_truth": 0}, {"key": "30604618", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819914978693, "ground_truth": 0}, {"key": "35779006", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6740504845026816, "ground_truth": 0}, {"key": "35779006", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43782349995286884, "ground_truth": 0}, {"key": "35779006", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3276682975413302, "ground_truth": 0}, {"key": "35779006", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935200136436, "ground_truth": 0}, {"key": "35779006", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419981342179, "ground_truth": 0}, {"key": "33858956", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5448013647042613, "ground_truth": 0}, {"key": "33858956", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5698526368601271, "ground_truth": 0}, {"key": "33858956", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5755880255984391, "ground_truth": 0}, {"key": "33858956", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531120090337, "ground_truth": 0}, {"key": "33858956", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046159196804, "ground_truth": 0}, {"key": "38633880", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2958398679072022, "ground_truth": 0}, {"key": "38633880", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3023910542593989, "ground_truth": 0}, {"key": "38633880", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3451052483345035, "ground_truth": 0}, {"key": "38633880", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10374862231517148, "ground_truth": 0}, {"key": "38633880", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709463078194, "ground_truth": 0}, {"key": "36654905", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9362850069092288, "ground_truth": 0}, {"key": "36654905", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9458012700356068, "ground_truth": 0}, {"key": "36654905", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8955226763736698, "ground_truth": 0}, {"key": "36654905", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240790444597, "ground_truth": 0}, {"key": "36654905", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274034086684, "ground_truth": 0}, {"key": "26547482", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24798741322885756, "ground_truth": 0}, {"key": "26547482", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16451646869373518, "ground_truth": 0}, {"key": "26547482", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1993080246824684, "ground_truth": 0}, {"key": "26547482", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910926544744, "ground_truth": 0}, {"key": "26547482", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766715984627285, "ground_truth": 0}, {"key": "36439068", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5389832242059287, "ground_truth": 0}, {"key": "36439068", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6039318294531449, "ground_truth": 0}, {"key": "36439068", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3720488032270478, "ground_truth": 0}, {"key": "36439068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964291478775, "ground_truth": 0}, {"key": "36439068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783947920582, "ground_truth": 0}, {"key": "30501258", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4571367281224984, "ground_truth": 0}, {"key": "30501258", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3942009626256177, "ground_truth": 0}, {"key": "30501258", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5486734979772946, "ground_truth": 0}, {"key": "30501258", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684615701994, "ground_truth": 0}, {"key": "30501258", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966372267248, "ground_truth": 0}, {"key": "37560941", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315942967092908, "ground_truth": 0}, {"key": "37560941", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4571367541811326, "ground_truth": 0}, {"key": "37560941", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5755880240541756, "ground_truth": 0}, {"key": "37560941", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714913590423, "ground_truth": 0}, {"key": "37560941", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4205995897885595, "ground_truth": 0}, {"key": "36801665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5679366192315297, "ground_truth": 0}, {"key": "36801665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5195212942133648, "ground_truth": 0}, {"key": "36801665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6926420001938516, "ground_truth": 0}, {"key": "36801665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504876949833, "ground_truth": 0}, {"key": "36801665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947447261662, "ground_truth": 0}, {"key": "34954610", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19559408936769612, "ground_truth": 0}, {"key": "34954610", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20689405486137555, "ground_truth": 0}, {"key": "34954610", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16132023686988917, "ground_truth": 0}, {"key": "34954610", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910734788866, "ground_truth": 0}, {"key": "34954610", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561504181579648, "ground_truth": 0}, {"key": "37020510", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7866228143162722, "ground_truth": 0}, {"key": "37020510", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8187368056912909, "ground_truth": 0}, {"key": "37020510", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8449215186436955, "ground_truth": 0}, {"key": "37020510", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.817574470440377, "ground_truth": 0}, {"key": "37020510", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601724078138463, "ground_truth": 0}, {"key": "38064637", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601153796686753, "ground_truth": 0}, {"key": "38064637", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3174262809351743, "ground_truth": 0}, {"key": "38064637", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1968262097070687, "ground_truth": 0}, {"key": "38064637", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463119082480926, "ground_truth": 0}, {"key": "38064637", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035661814105, "ground_truth": 0}, {"key": "40886108", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9130583429257373, "ground_truth": 0}, {"key": "40886108", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8848377687967596, "ground_truth": 0}, {"key": "40886108", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9458012726333866, "ground_truth": 0}, {"key": "40886108", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263259214933, "ground_truth": 0}, {"key": "40886108", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178979154763, "ground_truth": 0}, {"key": "38554603", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3040416999703165, "ground_truth": 0}, {"key": "38554603", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44939262407196723, "ground_truth": 0}, {"key": "38554603", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4225046412769372, "ground_truth": 0}, {"key": "38554603", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118465569476, "ground_truth": 0}, {"key": "38554603", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634600053445, "ground_truth": 0}, {"key": "39115586", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41489884319179654, "ground_truth": 0}, {"key": "39115586", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4785288267825569, "ground_truth": 0}, {"key": "39115586", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.373875795985502, "ground_truth": 0}, {"key": "39115586", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41489886536962756, "ground_truth": 0}, {"key": "39115586", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004064218865, "ground_truth": 0}, {"key": "38786314", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35220176215990523, "ground_truth": 0}, {"key": "38786314", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44360044257020687, "ground_truth": 0}, {"key": "38786314", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3757064639424656, "ground_truth": 0}, {"key": "38786314", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679810953156, "ground_truth": 0}, {"key": "38786314", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897180207497, "ground_truth": 0}, {"key": "38721078", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48438006633881414, "ground_truth": 0}, {"key": "38721078", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582534637633, "ground_truth": 0}, {"key": "38721078", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7813306320920411, "ground_truth": 0}, {"key": "38721078", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797802696089, "ground_truth": 0}, {"key": "38721078", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711538790271, "ground_truth": 0}, {"key": "39475467", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5869964584580909, "ground_truth": 0}, {"key": "39475467", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476655843362, "ground_truth": 0}, {"key": "39475467", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397386452426, "ground_truth": 0}, {"key": "39475467", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251021500986, "ground_truth": 0}, {"key": "39475467", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.529263380124783, "ground_truth": 0}, {"key": "35691234", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33111974106208947, "ground_truth": 0}, {"key": "35691234", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3611646939018143, "ground_truth": 0}, {"key": "35691234", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24364245088960354, "ground_truth": 0}, {"key": "35691234", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417618331513, "ground_truth": 0}, {"key": "35691234", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668456117094047, "ground_truth": 0}, {"key": "36871390", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23370637081298307, "ground_truth": 0}, {"key": "36871390", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3979384236446755, "ground_truth": 0}, {"key": "36871390", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5409238733799318, "ground_truth": 0}, {"key": "36871390", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116472135459476, "ground_truth": 0}, {"key": "36871390", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102781913179605, "ground_truth": 0}, {"key": "31730844", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29583985597834983, "ground_truth": 0}, {"key": "31730844", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23934933839868008, "ground_truth": 0}, {"key": "31730844", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23370634214697855, "ground_truth": 0}, {"key": "31730844", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417267372801, "ground_truth": 0}, {"key": "31730844", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2005576816217314, "ground_truth": 0}, {"key": "30810940", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28937170363555276, "ground_truth": 0}, {"key": "30810940", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21076632577215137, "ground_truth": 0}, {"key": "30810940", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33982760869648565, "ground_truth": 0}, {"key": "30810940", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495183815225, "ground_truth": 0}, {"key": "30810940", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291260668786, "ground_truth": 0}, {"key": "39352003", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8766343606292144, "ground_truth": 0}, {"key": "39352003", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8164063766059406, "ground_truth": 0}, {"key": "39352003", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8267117906896672, "ground_truth": 0}, {"key": "39352003", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549529472417, "ground_truth": 0}, {"key": "39352003", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833722658627, "ground_truth": 0}, {"key": "40118123", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39420099502553685, "ground_truth": 0}, {"key": "40118123", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.407333411599672, "ground_truth": 0}, {"key": "40118123", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34687310955970113, "ground_truth": 0}, {"key": "40118123", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708562873214, "ground_truth": 0}, {"key": "40118123", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251043728267, "ground_truth": 0}, {"key": "37114191", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3702253818429931, "ground_truth": 0}, {"key": "37114191", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16776334213223873, "ground_truth": 0}, {"key": "37114191", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37022538797453697, "ground_truth": 0}, {"key": "37114191", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937168867022733, "ground_truth": 0}, {"key": "37114191", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2393493554763718, "ground_truth": 0}, {"key": "39268203", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.550607335775494, "ground_truth": 0}, {"key": "39268203", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5331544058612198, "ground_truth": 0}, {"key": "39268203", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8104789101596519, "ground_truth": 0}, {"key": "39268203", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506563381108, "ground_truth": 0}, {"key": "39268203", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528049250614, "ground_truth": 0}, {"key": "37950968", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2720245450742457, "ground_truth": 0}, {"key": "37950968", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3468730959202458, "ground_truth": 0}, {"key": "37950968", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31236999345977523, "ground_truth": 0}, {"key": "37950968", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276434200005, "ground_truth": 0}, {"key": "37950968", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476750328305044, "ground_truth": 0}, {"key": "34959807", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5097643728878112, "ground_truth": 0}, {"key": "34959807", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37937839821353553, "ground_truth": 0}, {"key": "34959807", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4902355907234193, "ground_truth": 0}, {"key": "34959807", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073659734871326, "ground_truth": 0}, {"key": "34959807", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531366464283, "ground_truth": 0}, {"key": "35631314", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9105453944063068, "ground_truth": 0}, {"key": "35631314", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8311430475820452, "ground_truth": 0}, {"key": "35631314", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9437636513420262, "ground_truth": 0}, {"key": "35631314", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343717690844, "ground_truth": 0}, {"key": "35631314", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218336511714, "ground_truth": 0}, {"key": "38082365", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.670608288039703, "ground_truth": 0}, {"key": "38082365", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.726425607452633, "ground_truth": 0}, {"key": "38082365", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.705785046463463, "ground_truth": 0}, {"key": "38082365", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.841825645440789, "ground_truth": 0}, {"key": "38082365", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159548121155, "ground_truth": 0}, {"key": "37242829", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5813031039615038, "ground_truth": 0}, {"key": "37242829", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3886180326083518, "ground_truth": 0}, {"key": "37242829", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5964331277572459, "ground_truth": 0}, {"key": "37242829", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019530975311272, "ground_truth": 0}, {"key": "37242829", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054487393892877, "ground_truth": 0}, {"key": "38556068", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23934936136134677, "ground_truth": 0}, {"key": "38556068", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2553436888153386, "ground_truth": 0}, {"key": "38556068", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35220176931263686, "ground_truth": 0}, {"key": "38556068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675360730839, "ground_truth": 0}, {"key": "38556068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208096138817, "ground_truth": 0}, {"key": "32969336", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43206336707458837, "ground_truth": 0}, {"key": "32969336", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6495785943356839, "ground_truth": 0}, {"key": "32969336", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.381219559112889, "ground_truth": 0}, {"key": "32969336", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033819016171, "ground_truth": 0}, {"key": "32969336", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647216973141, "ground_truth": 0}, {"key": "36825153", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1744102821550562, "ground_truth": 0}, {"key": "36825153", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1778108700319695, "ground_truth": 0}, {"key": "36825153", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23370638222879664, "ground_truth": 0}, {"key": "36825153", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436779940652704, "ground_truth": 0}, {"key": "36825153", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808772187827, "ground_truth": 0}, {"key": "41050146", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8887587880155812, "ground_truth": 0}, {"key": "41050146", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6688802639877754, "ground_truth": 0}, {"key": "41050146", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7606506286581303, "ground_truth": 0}, {"key": "41050146", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033768260836, "ground_truth": 0}, {"key": "41050146", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743443311265, "ground_truth": 0}, {"key": "27865037", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3398276476979605, "ground_truth": 0}, {"key": "27865037", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14511536568119282, "ground_truth": 0}, {"key": "27865037", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32423541908453274, "ground_truth": 0}, {"key": "27865037", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526499676072, "ground_truth": 0}, {"key": "27865037", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.651354858193201, "ground_truth": 0}, {"key": "39868565", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29259532196714294, "ground_truth": 0}, {"key": "39868565", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26894142454508896, "ground_truth": 0}, {"key": "39868565", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864513890894494, "ground_truth": 0}, {"key": "39868565", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405052702401937, "ground_truth": 0}, {"key": "39868565", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580296614522, "ground_truth": 0}, {"key": "37761968", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4474603034890808, "ground_truth": 0}, {"key": "37761968", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.484380101207534, "ground_truth": 0}, {"key": "37761968", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4474602937447547, "ground_truth": 0}, {"key": "37761968", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32766830890551546, "ground_truth": 0}, {"key": "37761968", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544282829479, "ground_truth": 0}, {"key": "16326139", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010666104448886, "ground_truth": 0}, {"key": "16326139", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2160115279081753, "ground_truth": 0}, {"key": "16326139", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39793842679181735, "ground_truth": 0}, {"key": "16326139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562288677329, "ground_truth": 0}, {"key": "16326139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441028274683953, "ground_truth": 0}, {"key": "36568381", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47852883732132473, "ground_truth": 0}, {"key": "36568381", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37022539575122787, "ground_truth": 0}, {"key": "36568381", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32423541360803354, "ground_truth": 0}, {"key": "36568381", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165943822659, "ground_truth": 0}, {"key": "36568381", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356684448222857, "ground_truth": 0}, {"key": "39855613", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6654105636835692, "ground_truth": 0}, {"key": "39855613", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6926420023103654, "ground_truth": 0}, {"key": "39855613", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8128673114144314, "ground_truth": 0}, {"key": "39855613", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085737157448, "ground_truth": 0}, {"key": "39855613", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943784262048, "ground_truth": 0}, {"key": "29856302", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5097643808260334, "ground_truth": 0}, {"key": "29856302", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6495786214239331, "ground_truth": 0}, {"key": "29856302", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869692957563054, "ground_truth": 0}, {"key": "29856302", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.476579670985365, "ground_truth": 0}, {"key": "29856302", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711533513856, "ground_truth": 0}, {"key": "35641106", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7490872121232439, "ground_truth": 0}, {"key": "35641106", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7505527521371516, "ground_truth": 0}, {"key": "35641106", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8289388078498781, "ground_truth": 0}, {"key": "35641106", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647896285235, "ground_truth": 0}, {"key": "35641106", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867701133855, "ground_truth": 0}, {"key": "39474558", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24077460061047604, "ground_truth": 0}, {"key": "39474558", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3923368267087058, "ground_truth": 0}, {"key": "39474558", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25091280526871906, "ground_truth": 0}, {"key": "39474558", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.468790633766557, "ground_truth": 0}, {"key": "39474558", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052535405668, "ground_truth": 0}, {"key": "34338135", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7233094576981881, "ground_truth": 0}, {"key": "34338135", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7461389769803461, "ground_truth": 0}, {"key": "34338135", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8056321973383156, "ground_truth": 0}, {"key": "34338135", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511441393362, "ground_truth": 0}, {"key": "34338135", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281360469933, "ground_truth": 0}, {"key": "35870330", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6548947406228708, "ground_truth": 0}, {"key": "35870330", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185398524563, "ground_truth": 0}, {"key": "35870330", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8187367701507315, "ground_truth": 0}, {"key": "35870330", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525396953037359, "ground_truth": 0}, {"key": "35870330", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185532492719, "ground_truth": 0}, {"key": "24478245", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4263215968134586, "ground_truth": 0}, {"key": "24478245", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39606818223505785, "ground_truth": 0}, {"key": "24478245", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5039061719414866, "ground_truth": 0}, {"key": "24478245", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.560252680405133, "ground_truth": 0}, {"key": "24478245", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291251462234, "ground_truth": 0}, {"key": "38485946", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.552539728108233, "ground_truth": 0}, {"key": "38485946", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5525396928739941, "ground_truth": 0}, {"key": "38485946", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7371581682448688, "ground_truth": 0}, {"key": "38485946", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984701025793, "ground_truth": 0}, {"key": "38485946", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.571766596154366, "ground_truth": 0}, {"key": "32509613", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3539863021778708, "ground_truth": 0}, {"key": "32509613", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7310585806731459, "ground_truth": 0}, {"key": "32509613", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5136684791809722, "ground_truth": 0}, {"key": "32509613", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784094194479, "ground_truth": 0}, {"key": "32509613", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406909707958, "ground_truth": 0}, {"key": "34078819", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7732163422137979, "ground_truth": 0}, {"key": "34078819", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688150558603, "ground_truth": 0}, {"key": "34078819", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8624675226081915, "ground_truth": 0}, {"key": "34078819", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.562176473102974, "ground_truth": 0}, {"key": "34078819", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063790161845, "ground_truth": 0}, {"key": "39523865", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18126321498560397, "ground_truth": 0}, {"key": "39523865", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4416730096711843, "ground_truth": 0}, {"key": "39523865", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26435836100179505, "ground_truth": 0}, {"key": "39523865", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3486451584026467, "ground_truth": 0}, {"key": "39523865", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881331845995, "ground_truth": 0}, {"key": "33146158", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2658804677770457, "ground_truth": 0}, {"key": "33146158", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39606815399184864, "ground_truth": 0}, {"key": "33146158", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000709735777013, "ground_truth": 0}, {"key": "33146158", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667540911796258, "ground_truth": 0}, {"key": "33146158", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1778108704565337, "ground_truth": 0}, {"key": "32083974", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4205995954174418, "ground_truth": 0}, {"key": "32083974", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800748081989, "ground_truth": 0}, {"key": "32083974", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5234203494002803, "ground_truth": 0}, {"key": "32083974", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404167168333185, "ground_truth": 0}, {"key": "32083974", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828343368302946, "ground_truth": 0}, {"key": "34378482", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.846957831339103, "ground_truth": 0}, {"key": "34378482", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8848377675567052, "ground_truth": 0}, {"key": "34378482", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8210441100239338, "ground_truth": 0}, {"key": "34378482", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506575953923, "ground_truth": 0}, {"key": "34378482", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118662191962, "ground_truth": 0}, {"key": "38080102", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4921881525102322, "ground_truth": 0}, {"key": "38080102", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32423541851943166, "ground_truth": 0}, {"key": "38080102", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3960681751075315, "ground_truth": 0}, {"key": "38080102", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775596187511, "ground_truth": 0}, {"key": "38080102", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180048888961, "ground_truth": 0}, {"key": "40244537", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36658973542060097, "ground_truth": 0}, {"key": "40244537", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.550607355903609, "ground_truth": 0}, {"key": "40244537", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33982761535358513, "ground_truth": 0}, {"key": "40244537", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852884402303203, "ground_truth": 0}, {"key": "40244537", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051957050315, "ground_truth": 0}, {"key": "33497789", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6460137067619591, "ground_truth": 0}, {"key": "33497789", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7592254020346626, "ground_truth": 0}, {"key": "33497789", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6406358483429756, "ground_truth": 0}, {"key": "33497789", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673087321411, "ground_truth": 0}, {"key": "33497789", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191389886924, "ground_truth": 0}, {"key": "28816889", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708828950095, "ground_truth": 0}, {"key": "28816889", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5370413740273241, "ground_truth": 0}, {"key": "28816889", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953620355637, "ground_truth": 0}, {"key": "28816889", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014021445238, "ground_truth": 0}, {"key": "28816889", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640985042836402, "ground_truth": 0}, {"key": "38157127", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653336143899063, "ground_truth": 0}, {"key": "38157127", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2829881257089767, "ground_truth": 0}, {"key": "38157127", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3415824742698645, "ground_truth": 0}, {"key": "38157127", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798741625162835, "ground_truth": 0}, {"key": "38157127", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1561048867315338, "ground_truth": 0}, {"key": "36183569", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2523840369947321, "ground_truth": 0}, {"key": "36183569", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2494472488169015, "ground_truth": 0}, {"key": "36183569", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22541661191811382, "ground_truth": 0}, {"key": "36183569", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592276492098875, "ground_truth": 0}, {"key": "36183569", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132023056702602, "ground_truth": 0}, {"key": "36012016", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6495786351841812, "ground_truth": 0}, {"key": "36012016", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.573678405402184, "ground_truth": 0}, {"key": "36012016", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40922079978153814, "ground_truth": 0}, {"key": "36012016", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047866015409796, "ground_truth": 0}, {"key": "36012016", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206336930778066, "ground_truth": 0}, {"key": "34571973", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358179193732, "ground_truth": 0}, {"key": "34571973", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7956581065451586, "ground_truth": 0}, {"key": "34571973", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6132365570162772, "ground_truth": 0}, {"key": "34571973", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165233713529, "ground_truth": 0}, {"key": "34571973", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947252403011, "ground_truth": 0}, {"key": "38707498", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7138307565791362, "ground_truth": 0}, {"key": "38707498", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8233284041463523, "ground_truth": 0}, {"key": "38707498", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7813306298477949, "ground_truth": 0}, {"key": "38707498", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118924676386, "ground_truth": 0}, {"key": "38707498", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948249903206, "ground_truth": 0}, {"key": "35459082", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.887204596522498, "ground_truth": 0}, {"key": "35459082", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.930962075983707, "ground_truth": 0}, {"key": "35459082", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8311430479979761, "ground_truth": 0}, {"key": "35459082", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343800954033, "ground_truth": 0}, {"key": "35459082", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.902609612703404, "ground_truth": 0}, {"key": "39464041", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7074046844400248, "ground_truth": 0}, {"key": "39464041", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6206216222443462, "ground_truth": 0}, {"key": "39464041", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6791787144427172, "ground_truth": 0}, {"key": "39464041", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241858731291, "ground_truth": 0}, {"key": "39464041", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316982785554, "ground_truth": 0}, {"key": "23782052", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12852513816076314, "ground_truth": 0}, {"key": "23782052", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26740816373254317, "ground_truth": 0}, {"key": "23782052", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23792987182574357, "ground_truth": 0}, {"key": "23782052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713683992770902, "ground_truth": 0}, {"key": "23782052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2186693690616759, "ground_truth": 0}, {"key": "36568455", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5717666240126426, "ground_truth": 0}, {"key": "36568455", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6132365590730579, "ground_truth": 0}, {"key": "36568455", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6909762599070985, "ground_truth": 0}, {"key": "36568455", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897231157396, "ground_truth": 0}, {"key": "36568455", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585587939838, "ground_truth": 0}, {"key": "38469552", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7931059678149841, "ground_truth": 0}, {"key": "38469552", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7154240045591148, "ground_truth": 0}, {"key": "38469552", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.618780444318191, "ground_truth": 0}, {"key": "38469552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.687630002827328, "ground_truth": 0}, {"key": "38469552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118795982534, "ground_truth": 0}, {"key": "35922277", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7866228093764088, "ground_truth": 0}, {"key": "35922277", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.816406383017221, "ground_truth": 0}, {"key": "35922277", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9230391681381115, "ground_truth": 0}, {"key": "35922277", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159491382025, "ground_truth": 0}, {"key": "35922277", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677588602931, "ground_truth": 0}, {"key": "32744293", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47657962838599677, "ground_truth": 0}, {"key": "32744293", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6150878212361307, "ground_truth": 0}, {"key": "32744293", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7170118872144013, "ground_truth": 0}, {"key": "32744293", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35936414959886803, "ground_truth": 0}, {"key": "32744293", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191478082304, "ground_truth": 0}, {"key": "30972362", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7592254000918817, "ground_truth": 0}, {"key": "30972362", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7826624708926331, "ground_truth": 0}, {"key": "30972362", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8947894596473538, "ground_truth": 0}, {"key": "30972362", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256472428252, "ground_truth": 0}, {"key": "30972362", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.866132509222538, "ground_truth": 0}, {"key": "36380943", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7106283025430118, "ground_truth": 0}, {"key": "36380943", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6825737324154401, "ground_truth": 0}, {"key": "36380943", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584174982777472, "ground_truth": 0}, {"key": "36380943", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239949908552, "ground_truth": 0}, {"key": "36380943", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241740889065, "ground_truth": 0}, {"key": "36929355", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621765035680472, "ground_truth": 0}, {"key": "36929355", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3684057050707977, "ground_truth": 0}, {"key": "36929355", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5794004202565913, "ground_truth": 0}, {"key": "36929355", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011351791574, "ground_truth": 0}, {"key": "36929355", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3539863130825513, "ground_truth": 0}, {"key": "39127206", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6460136933722681, "ground_truth": 0}, {"key": "39127206", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3157359867577758, "ground_truth": 0}, {"key": "39127206", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000710437222856, "ground_truth": 0}, {"key": "39127206", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988283140138, "ground_truth": 0}, {"key": "39127206", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629692193131032, "ground_truth": 0}, {"key": "36128318", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37937838021081166, "ground_truth": 0}, {"key": "36128318", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35220177451020296, "ground_truth": 0}, {"key": "36128318", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2081789304762113, "ground_truth": 0}, {"key": "36128318", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2351083948090249, "ground_truth": 0}, {"key": "36128318", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081820536926, "ground_truth": 0}, {"key": "39863480", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6020615708806775, "ground_truth": 0}, {"key": "39863480", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7476159649193874, "ground_truth": 0}, {"key": "39863480", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093527653499, "ground_truth": 0}, {"key": "39863480", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943181914067, "ground_truth": 0}, {"key": "39863480", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.575588020463596, "ground_truth": 0}, {"key": "38634057", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4551986207298794, "ground_truth": 0}, {"key": "38634057", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938250643065, "ground_truth": 0}, {"key": "38634057", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4960938417554974, "ground_truth": 0}, {"key": "38634057", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.327668306260391, "ground_truth": 0}, {"key": "38634057", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417145895694, "ground_truth": 0}, {"key": "33131935", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8068526071550903, "ground_truth": 0}, {"key": "33131935", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6020615772627913, "ground_truth": 0}, {"key": "33131935", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7718435039596646, "ground_truth": 0}, {"key": "33131935", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633915928331753, "ground_truth": 0}, {"key": "33131935", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891410589103, "ground_truth": 0}, {"key": "39021319", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45713670284461777, "ground_truth": 0}, {"key": "39021319", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26894143136443566, "ground_truth": 0}, {"key": "39021319", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864513120169227, "ground_truth": 0}, {"key": "39021319", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679664176363546, "ground_truth": 0}, {"key": "39021319", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.461016760625711, "ground_truth": 0}, {"key": "40644571", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5525397431559677, "ground_truth": 0}, {"key": "40644571", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3056973361889789, "ground_truth": 0}, {"key": "40644571", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3040416745020056, "ground_truth": 0}, {"key": "40644571", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3007455779075276, "ground_truth": 0}, {"key": "40644571", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869963928791542, "ground_truth": 0}, {"key": "14681877", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5486735110306042, "ground_truth": 0}, {"key": "14681877", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5078118551620231, "ground_truth": 0}, {"key": "14681877", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6406358554332459, "ground_truth": 0}, {"key": "14681877", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591302216571, "ground_truth": 0}, {"key": "14681877", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368272817154, "ground_truth": 0}, {"key": "36570890", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7217432032874306, "ground_truth": 0}, {"key": "36570890", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4130036044490349, "ground_truth": 0}, {"key": "36570890", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.60952413801272, "ground_truth": 0}, {"key": "36570890", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167741929715, "ground_truth": 0}, {"key": "36570890", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880122867082, "ground_truth": 0}, {"key": "30452755", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6601723785935075, "ground_truth": 0}, {"key": "30452755", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5409238508660531, "ground_truth": 0}, {"key": "30452755", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4980469007300396, "ground_truth": 0}, {"key": "30452755", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794003836288766, "ground_truth": 0}, {"key": "30452755", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947292619454, "ground_truth": 0}, {"key": "37347053", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30074555012207227, "ground_truth": 0}, {"key": "37347053", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26435837116846833, "ground_truth": 0}, {"key": "37347053", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4493926408725543, "ground_truth": 0}, {"key": "37347053", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631929323861, "ground_truth": 0}, {"key": "37347053", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477756971760766, "ground_truth": 0}, {"key": "38890979", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5640984999705181, "ground_truth": 0}, {"key": "38890979", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37022539249017944, "ground_truth": 0}, {"key": "38890979", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42632161265147994, "ground_truth": 0}, {"key": "38890979", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282334064183956, "ground_truth": 0}, {"key": "38890979", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758267879533, "ground_truth": 0}, {"key": "32974694", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47463118339163546, "ground_truth": 0}, {"key": "32974694", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5467381947548524, "ground_truth": 0}, {"key": "32974694", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46490155411018913, "ground_truth": 0}, {"key": "32974694", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118707862253, "ground_truth": 0}, {"key": "32974694", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359014953711605, "ground_truth": 0}, {"key": "38519940", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30239109622568255, "ground_truth": 0}, {"key": "38519940", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45907614364900545, "ground_truth": 0}, {"key": "38519940", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6495786373632765, "ground_truth": 0}, {"key": "38519940", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984712944446, "ground_truth": 0}, {"key": "38519940", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786387344008, "ground_truth": 0}, {"key": "38870104", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6334102663103385, "ground_truth": 0}, {"key": "38870104", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7325918372707886, "ground_truth": 0}, {"key": "38870104", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7745833870780229, "ground_truth": 0}, {"key": "38870104", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.699254437905062, "ground_truth": 0}, {"key": "38870104", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527336265126, "ground_truth": 0}, {"key": "34283161", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34687306400862195, "ground_truth": 0}, {"key": "34283161", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20181321123632548, "ground_truth": 0}, {"key": "34283161", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3812195368924212, "ground_truth": 0}, {"key": "34283161", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634663066021, "ground_truth": 0}, {"key": "34283161", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185321338809, "ground_truth": 0}, {"key": "31650463", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5428632986688946, "ground_truth": 0}, {"key": "31650463", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7431680114029863, "ground_truth": 0}, {"key": "31650463", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6959583054676163, "ground_truth": 0}, {"key": "31650463", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307838303751, "ground_truth": 0}, {"key": "31650463", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918208744687, "ground_truth": 0}, {"key": "35589432", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6757645917984065, "ground_truth": 0}, {"key": "35589432", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5195213166948064, "ground_truth": 0}, {"key": "35589432", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6876300153206218, "ground_truth": 0}, {"key": "35589432", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743621807808, "ground_truth": 0}, {"key": "35589432", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.603931810209913, "ground_truth": 0}, {"key": "14412752", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41489884384949266, "ground_truth": 0}, {"key": "14412752", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6825737233478723, "ground_truth": 0}, {"key": "14412752", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4707366202286435, "ground_truth": 0}, {"key": "14412752", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089295914183, "ground_truth": 0}, {"key": "14412752", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883556734023, "ground_truth": 0}, {"key": "37271183", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8311430369186282, "ground_truth": 0}, {"key": "37271183", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.798186782048828, "ground_truth": 0}, {"key": "37271183", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8407826038618221, "ground_truth": 0}, {"key": "37271183", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918306133264, "ground_truth": 0}, {"key": "37271183", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377777607558, "ground_truth": 0}, {"key": "35588153", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8766343814720293, "ground_truth": 0}, {"key": "35588153", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7356416227702338, "ground_truth": 0}, {"key": "35588153", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8128673039858313, "ground_truth": 0}, {"key": "35588153", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117803687561, "ground_truth": 0}, {"key": "35588153", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578416725494, "ground_truth": 0}, {"key": "39876692", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6791787117619537, "ground_truth": 0}, {"key": "39876692", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6619228627890258, "ground_truth": 0}, {"key": "39876692", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5156199241046107, "ground_truth": 0}, {"key": "39876692", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640340080803, "ground_truth": 0}, {"key": "39876692", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947224243985, "ground_truth": 0}, {"key": "38992323", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7122321507762512, "ground_truth": 0}, {"key": "38992323", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3522017697507353, "ground_truth": 0}, {"key": "38992323", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397117754974, "ground_truth": 0}, {"key": "38992323", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743598431818, "ground_truth": 0}, {"key": "38992323", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601724181541172, "ground_truth": 0}, {"key": "37556002", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49609383789418515, "ground_truth": 0}, {"key": "37556002", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3942009723349039, "ground_truth": 0}, {"key": "37556002", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46490156459329185, "ground_truth": 0}, {"key": "37556002", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244119952246223, "ground_truth": 0}, {"key": "37556002", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387581350893334, "ground_truth": 0}, {"key": "39875801", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.825589717948539, "ground_truth": 0}, {"key": "39875801", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8140528068450104, "ground_truth": 0}, {"key": "39875801", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8116760338832293, "ground_truth": 0}, {"key": "39875801", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740078608916, "ground_truth": 0}, {"key": "39875801", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835317067891, "ground_truth": 0}, {"key": "39272285", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3504213805702163, "ground_truth": 0}, {"key": "39272285", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19436780992856467, "ground_truth": 0}, {"key": "39272285", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2436424502506139, "ground_truth": 0}, {"key": "39272285", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436715721944, "ground_truth": 0}, {"key": "39272285", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594951950098416, "ground_truth": 0}, {"key": "39629714", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7786493234583097, "ground_truth": 0}, {"key": "39629714", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5832033594396179, "ground_truth": 0}, {"key": "39629714", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4882833894978265, "ground_truth": 0}, {"key": "39629714", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.794384969890916, "ground_truth": 0}, {"key": "39629714", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922080862899907, "ground_truth": 0}, {"key": "34043257", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117165863956977, "ground_truth": 0}, {"key": "34043257", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442251157049007, "ground_truth": 0}, {"key": "34043257", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6706082581706836, "ground_truth": 0}, {"key": "34043257", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.734119512917638, "ground_truth": 0}, {"key": "34043257", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684558950353633, "ground_truth": 0}, {"key": "33995240", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405057651979235, "ground_truth": 0}, {"key": "33995240", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5273165281740647, "ground_truth": 0}, {"key": "33995240", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3259494990564168, "ground_truth": 0}, {"key": "33995240", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140562172536393, "ground_truth": 0}, {"key": "33995240", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477757458753207, "ground_truth": 0}, {"key": "39399948", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7704647889018814, "ground_truth": 0}, {"key": "39399948", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7577943465040138, "ground_truth": 0}, {"key": "39399948", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6039318359507939, "ground_truth": 0}, {"key": "39399948", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253751525486, "ground_truth": 0}, {"key": "39399948", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953523248555, "ground_truth": 0}, {"key": "33185890", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7416740003368991, "ground_truth": 0}, {"key": "33185890", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6020615960177379, "ground_truth": 0}, {"key": "33185890", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.511716606628503, "ground_truth": 0}, {"key": "33185890", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238706135681, "ground_truth": 0}, {"key": "33185890", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414089324403226, "ground_truth": 0}, {"key": "35280425", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7295197787003274, "ground_truth": 0}, {"key": "35280425", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6315942967061913, "ground_truth": 0}, {"key": "35280425", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6132365209952114, "ground_truth": 0}, {"key": "35280425", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175022255957, "ground_truth": 0}, {"key": "35280425", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307628031818, "ground_truth": 0}, {"key": "16365170", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.64243246640116, "ground_truth": 0}, {"key": "16365170", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6584174980215222, "ground_truth": 0}, {"key": "16365170", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5350984237022097, "ground_truth": 0}, {"key": "16365170", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688064202108, "ground_truth": 0}, {"key": "16365170", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149664153069, "ground_truth": 0}, {"key": "24388238", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27048022789138676, "ground_truth": 0}, {"key": "24388238", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4590761226585686, "ground_truth": 0}, {"key": "24388238", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24653334360846038, "ground_truth": 0}, {"key": "24388238", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262637628128, "ground_truth": 0}, {"key": "24388238", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794003920533388, "ground_truth": 0}, {"key": "35024827", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7201714957172677, "ground_truth": 0}, {"key": "35024827", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4092207954487116, "ground_truth": 0}, {"key": "35024827", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4551986075808891, "ground_truth": 0}, {"key": "35024827", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513265172971051, "ground_truth": 0}, {"key": "35024827", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.319121418385476, "ground_truth": 0}, {"key": "38624944", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315943040849609, "ground_truth": 0}, {"key": "38624944", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7918210582330737, "ground_truth": 0}, {"key": "38624944", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6039318164556869, "ground_truth": 0}, {"key": "38624944", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059137418841, "ground_truth": 0}, {"key": "38624944", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317215694089, "ground_truth": 0}, {"key": "34719830", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5755880189631942, "ground_truth": 0}, {"key": "34719830", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442250900403409, "ground_truth": 0}, {"key": "34719830", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.757794359559425, "ground_truth": 0}, {"key": "34719830", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185180748083, "ground_truth": 0}, {"key": "34719830", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463118837665896, "ground_truth": 0}, {"key": "38995225", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28776783972284736, "ground_truth": 0}, {"key": "38995225", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3225259870284837, "ground_truth": 0}, {"key": "38995225", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20307464325278343, "ground_truth": 0}, {"key": "38995225", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076630326412427, "ground_truth": 0}, {"key": "38995225", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934933452824422, "ground_truth": 0}, {"key": "34242311", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5869964342724647, "ground_truth": 0}, {"key": "34242311", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.449392631273559, "ground_truth": 0}, {"key": "34242311", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39981165014122094, "ground_truth": 0}, {"key": "34242311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684056913092252, "ground_truth": 0}, {"key": "34242311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352741245912, "ground_truth": 0}, {"key": "39253748", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6057990504966317, "ground_truth": 0}, {"key": "39253748", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6279512096662173, "ground_truth": 0}, {"key": "39253748", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6187804619392696, "ground_truth": 0}, {"key": "39253748", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185344966072, "ground_truth": 0}, {"key": "39253748", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582566270588, "ground_truth": 0}, {"key": "37131104", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.984215437466498, "ground_truth": 0}, {"key": "37131104", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9967649440994808, "ground_truth": 0}, {"key": "37131104", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9802808711831512, "ground_truth": 0}, {"key": "37131104", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9942697539391869, "ground_truth": 0}, {"key": "37131104", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9837225378323776, "ground_truth": 0}, {"key": "38490554", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6601723879037272, "ground_truth": 0}, {"key": "38490554", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.620621618859806, "ground_truth": 0}, {"key": "38490554", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.677474013060002, "ground_truth": 0}, {"key": "38490554", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936427482536, "ground_truth": 0}, {"key": "38490554", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578315861004, "ground_truth": 0}, {"key": "29009500", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20055767929067256, "ground_truth": 0}, {"key": "29009500", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2379298921762048, "ground_truth": 0}, {"key": "29009500", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5253688488673607, "ground_truth": 0}, {"key": "29009500", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2133771548934221, "ground_truth": 0}, {"key": "29009500", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405054479641886, "ground_truth": 0}, {"key": "36703057", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34687308171881237, "ground_truth": 0}, {"key": "36703057", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331468303831, "ground_truth": 0}, {"key": "36703057", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5851011632667901, "ground_truth": 0}, {"key": "36703057", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.484380072328969, "ground_truth": 0}, {"key": "36703057", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017948760371, "ground_truth": 0}, {"key": "34876987", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5774953710080836, "ground_truth": 0}, {"key": "34876987", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476584966081, "ground_truth": 0}, {"key": "34876987", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7217432107309544, "ground_truth": 0}, {"key": "34876987", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306152951023, "ground_truth": 0}, {"key": "34876987", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526268073419, "ground_truth": 0}, {"key": "36209258", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.622459344243431, "ground_truth": 0}, {"key": "36209258", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7956580836475149, "ground_truth": 0}, {"key": "36209258", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6169358300939638, "ground_truth": 0}, {"key": "36209258", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136965403053, "ground_truth": 0}, {"key": "36209258", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711708263571, "ground_truth": 0}, {"key": "36854437", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4035668545468463, "ground_truth": 0}, {"key": "36854437", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3923368314940746, "ground_truth": 0}, {"key": "36854437", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2043418926935332, "ground_truth": 0}, {"key": "36854437", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237000691519257, "ground_truth": 0}, {"key": "36854437", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357439821433394, "ground_truth": 0}, {"key": "38047723", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6352224433468596, "ground_truth": 0}, {"key": "38047723", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1824255217326751, "ground_truth": 0}, {"key": "38047723", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26740815429010306, "ground_truth": 0}, {"key": "38047723", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699253864264, "ground_truth": 0}, {"key": "38047723", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878157227142, "ground_truth": 0}, {"key": "34287816", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40356686296997357, "ground_truth": 0}, {"key": "34287816", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984623525039, "ground_truth": 0}, {"key": "34287816", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5888891420601352, "ground_truth": 0}, {"key": "34287816", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926312910317, "ground_truth": 0}, {"key": "34287816", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953606323854, "ground_truth": 0}, {"key": "33235855", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8333246040761942, "ground_truth": 0}, {"key": "33235855", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8278281643221129, "ground_truth": 0}, {"key": "33235855", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9412234373975158, "ground_truth": 0}, {"key": "33235855", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099555716747, "ground_truth": 0}, {"key": "33235855", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274015226208, "ground_truth": 0}, {"key": "34381016", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27357438720954325, "ground_truth": 0}, {"key": "34381016", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19682619120041173, "ground_truth": 0}, {"key": "34381016", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5869964288956557, "ground_truth": 0}, {"key": "34381016", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755879880187453, "ground_truth": 0}, {"key": "34381016", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825682144068886, "ground_truth": 0}, {"key": "28064995", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30074558172114546, "ground_truth": 0}, {"key": "28064995", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4941409036923565, "ground_truth": 0}, {"key": "28064995", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38676344609388236, "ground_truth": 0}, {"key": "28064995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946968434679766, "ground_truth": 0}, {"key": "28064995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668456072177288, "ground_truth": 0}, {"key": "37576197", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19314739144665416, "ground_truth": 0}, {"key": "37576197", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30569733541536326, "ground_truth": 0}, {"key": "37576197", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.0973903921166573, "ground_truth": 0}, {"key": "37576197", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215808711766, "ground_truth": 0}, {"key": "37576197", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610488801728933, "ground_truth": 0}, {"key": "34454741", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23651622197084132, "ground_truth": 0}, {"key": "34454741", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3757064671633629, "ground_truth": 0}, {"key": "34454741", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864514427939414, "ground_truth": 0}, {"key": "34454741", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610115247163, "ground_truth": 0}, {"key": "34454741", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3140505369506092, "ground_truth": 0}, {"key": "34766970", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24508502950595973, "ground_truth": 0}, {"key": "34766970", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28616924382241216, "ground_truth": 0}, {"key": "34766970", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10669060558546341, "ground_truth": 0}, {"key": "34766970", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706452065721667, "ground_truth": 0}, {"key": "34766970", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1943678216134004, "ground_truth": 0}, {"key": "35574186", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6388352773393919, "ground_truth": 0}, {"key": "35574186", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.411110836314425, "ground_truth": 0}, {"key": "35574186", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6352224375988207, "ground_truth": 0}, {"key": "35574186", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218812191987904, "ground_truth": 0}, {"key": "35574186", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755879940351218, "ground_truth": 0}, {"key": "35486470", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5467381514467542, "ground_truth": 0}, {"key": "35486470", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28937170553182096, "ground_truth": 0}, {"key": "35486470", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4668455904395075, "ground_truth": 0}, {"key": "35486470", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474602858102219, "ground_truth": 0}, {"key": "35486470", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059959521379703, "ground_truth": 0}, {"key": "40977702", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36658971043040145, "ground_truth": 0}, {"key": "40977702", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33458944676334257, "ground_truth": 0}, {"key": "40977702", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21601153243628085, "ground_truth": 0}, {"key": "40977702", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1732882106233638, "ground_truth": 0}, {"key": "40977702", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242551224595108, "ground_truth": 0}, {"key": "35336618", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5409238379424156, "ground_truth": 0}, {"key": "35336618", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45326185300241284, "ground_truth": 0}, {"key": "35336618", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6150878713664247, "ground_truth": 0}, {"key": "35336618", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832348896133, "ground_truth": 0}, {"key": "35336618", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512776430532, "ground_truth": 0}, {"key": "33024679", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36658970162233373, "ground_truth": 0}, {"key": "33024679", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5389832065847703, "ground_truth": 0}, {"key": "33024679", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6619228678498768, "ground_truth": 0}, {"key": "33024679", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981163835531625, "ground_truth": 0}, {"key": "33024679", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307448259636, "ground_truth": 0}, {"key": "37451334", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315943242360793, "ground_truth": 0}, {"key": "37451334", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3684057129118346, "ground_truth": 0}, {"key": "37451334", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.577495356402357, "ground_truth": 0}, {"key": "37451334", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891225340217, "ground_truth": 0}, {"key": "37451334", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880227936919, "ground_truth": 0}, {"key": "33354824", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23091977363438843, "ground_truth": 0}, {"key": "33354824", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36477754727592193, "ground_truth": 0}, {"key": "33354824", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19193278806178812, "ground_truth": 0}, {"key": "33354824", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675281977593, "ground_truth": 0}, {"key": "33354824", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2613309181989286, "ground_truth": 0}, {"key": "34688538", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2674081628828566, "ground_truth": 0}, {"key": "34688538", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4073333840943891, "ground_truth": 0}, {"key": "34688538", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26740816408043677, "ground_truth": 0}, {"key": "34688538", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538609965478857, "ground_truth": 0}, {"key": "34688538", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262760558096, "ground_truth": 0}, {"key": "33646276", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2043419069839901, "ground_truth": 0}, {"key": "33646276", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5312093572927343, "ground_truth": 0}, {"key": "33646276", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4785288401629823, "ground_truth": 0}, {"key": "33646276", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073579891369194, "ground_truth": 0}, {"key": "33646276", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632158386321334, "ground_truth": 0}, {"key": "40322608", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6757645977190913, "ground_truth": 0}, {"key": "40322608", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.622459299326014, "ground_truth": 0}, {"key": "40322608", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7918210653915434, "ground_truth": 0}, {"key": "40322608", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504644164823, "ground_truth": 0}, {"key": "40322608", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.694302651087093, "ground_truth": 0}, {"key": "39565762", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7866228348673974, "ground_truth": 0}, {"key": "39565762", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8539127432370989, "ground_truth": 0}, {"key": "39565762", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7233094723478002, "ground_truth": 0}, {"key": "39565762", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527922201859, "ground_truth": 0}, {"key": "39565762", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702863838167, "ground_truth": 0}, {"key": "30534259", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.707404716789949, "ground_truth": 0}, {"key": "30534259", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5506073733544927, "ground_truth": 0}, {"key": "30534259", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6224593364556656, "ground_truth": 0}, {"key": "30534259", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306026737037, "ground_truth": 0}, {"key": "30534259", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774739947768302, "ground_truth": 0}, {"key": "39644242", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7718434904188779, "ground_truth": 0}, {"key": "39644242", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7745833899097703, "ground_truth": 0}, {"key": "39644242", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7718434979994623, "ground_truth": 0}, {"key": "39644242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102607998565, "ground_truth": 0}, {"key": "39644242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125692756648, "ground_truth": 0}, {"key": "19853740", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25091276349246405, "ground_truth": 0}, {"key": "19853740", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5292633881371158, "ground_truth": 0}, {"key": "19853740", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6548947208668641, "ground_truth": 0}, {"key": "19853740", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850281511779, "ground_truth": 0}, {"key": "19853740", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828341030055356, "ground_truth": 0}, {"key": "33023078", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42823343095976324, "ground_truth": 0}, {"key": "33023078", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5312093785526365, "ground_truth": 0}, {"key": "33023078", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49218814620337725, "ground_truth": 0}, {"key": "33023078", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512573698243, "ground_truth": 0}, {"key": "33023078", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689307862668, "ground_truth": 0}, {"key": "38329806", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20946969007474678, "ground_truth": 0}, {"key": "38329806", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2081789316419165, "ground_truth": 0}, {"key": "38329806", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2814056126357624, "ground_truth": 0}, {"key": "38329806", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817891167372596, "ground_truth": 0}, {"key": "38329806", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28298811909846117, "ground_truth": 0}, {"key": "38761942", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3629692396317642, "ground_truth": 0}, {"key": "38761942", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21337719065906682, "ground_truth": 0}, {"key": "38761942", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2422056320301231, "ground_truth": 0}, {"key": "38761942", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609385432660125, "ground_truth": 0}, {"key": "38761942", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840364308627, "ground_truth": 0}, {"key": "33773576", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6893056097366433, "ground_truth": 0}, {"key": "33773576", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8080672049863218, "ground_truth": 0}, {"key": "33773576", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47463116984591897, "ground_truth": 0}, {"key": "33773576", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203392149298, "ground_truth": 0}, {"key": "33773576", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473375212414, "ground_truth": 0}, {"key": "37642631", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2782567743886307, "ground_truth": 0}, {"key": "37642631", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.399811660233846, "ground_truth": 0}, {"key": "37642631", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4474602819819132, "ground_truth": 0}, {"key": "37642631", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990882003108, "ground_truth": 0}, {"key": "37642631", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995670332744, "ground_truth": 0}, {"key": "36609836", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.509764378018491, "ground_truth": 0}, {"key": "36609836", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4765796534682991, "ground_truth": 0}, {"key": "36609836", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6242935364322505, "ground_truth": 0}, {"key": "36609836", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982040728197, "ground_truth": 0}, {"key": "36609836", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990725949165, "ground_truth": 0}, {"key": "41035610", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5312093765862476, "ground_truth": 0}, {"key": "41035610", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4707366151968293, "ground_truth": 0}, {"key": "41035610", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054486999973953, "ground_truth": 0}, {"key": "41035610", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047580119708647, "ground_truth": 0}, {"key": "41035610", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404168560864686, "ground_truth": 0}, {"key": "37592684", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2146914052579149, "ground_truth": 0}, {"key": "37592684", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5698526661912967, "ground_truth": 0}, {"key": "37592684", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40922082775051144, "ground_truth": 0}, {"key": "37592684", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291136487992, "ground_truth": 0}, {"key": "37592684", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.552539722934551, "ground_truth": 0}, {"key": "38951040", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5717666355937141, "ground_truth": 0}, {"key": "38951040", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3702254040916652, "ground_truth": 0}, {"key": "38951040", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864514052836104, "ground_truth": 0}, {"key": "38951040", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064737725254, "ground_truth": 0}, {"key": "38951040", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733340368799864, "ground_truth": 0}, {"key": "40774469", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1451153632225089, "ground_truth": 0}, {"key": "40774469", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1338674727102864, "ground_truth": 0}, {"key": "40774469", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16776335395609382, "ground_truth": 0}, {"key": "40774469", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048021388467186, "ground_truth": 0}, {"key": "40774469", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179818150903, "ground_truth": 0}, {"key": "40876288", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5851011589904367, "ground_truth": 0}, {"key": "40876288", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6424324660418543, "ground_truth": 0}, {"key": "40876288", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4843800861895658, "ground_truth": 0}, {"key": "40876288", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29746993835082824, "ground_truth": 0}, {"key": "40876288", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758329764257, "ground_truth": 0}, {"key": "40340131", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3380771281558772, "ground_truth": 0}, {"key": "40340131", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7295197613456271, "ground_truth": 0}, {"key": "40340131", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6976089153807401, "ground_truth": 0}, {"key": "40340131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736783807136981, "ground_truth": 0}, {"key": "40340131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.535098430526089, "ground_truth": 0}, {"key": "30121591", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4359015018702904, "ground_truth": 0}, {"key": "30121591", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44167302574664397, "ground_truth": 0}, {"key": "30121591", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39606816576028553, "ground_truth": 0}, {"key": "30121591", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "30121591", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239109667183306, "ground_truth": 0}, {"key": "35623366", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5945512531463745, "ground_truth": 0}, {"key": "35623366", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3106943635693577, "ground_truth": 0}, {"key": "35623366", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4532618496021634, "ground_truth": 0}, {"key": "35623366", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981163600865377, "ground_truth": 0}, {"key": "35623366", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.605799051359937, "ground_truth": 0}, {"key": "41014093", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5794004095327889, "ground_truth": 0}, {"key": "41014093", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5506073835716253, "ground_truth": 0}, {"key": "41014093", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4824291176661156, "ground_truth": 0}, {"key": "41014093", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494723758957, "ground_truth": 0}, {"key": "41014093", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455911400482, "ground_truth": 0}, {"key": "11387984", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231015670613334, "ground_truth": 0}, {"key": "11387984", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4054487505967816, "ground_truth": 0}, {"key": "11387984", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3225259591025827, "ground_truth": 0}, {"key": "11387984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808859625026, "ground_truth": 0}, {"key": "11387984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27982850084977, "ground_truth": 0}, {"key": "39508312", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46490158859151565, "ground_truth": 0}, {"key": "39508312", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6723316637916499, "ground_truth": 0}, {"key": "39508312", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4707366075350898, "ground_truth": 0}, {"key": "39508312", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308033255411, "ground_truth": 0}, {"key": "39508312", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578599974562, "ground_truth": 0}, {"key": "35815369", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2798285045613879, "ground_truth": 0}, {"key": "35815369", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2925952949897058, "ground_truth": 0}, {"key": "35815369", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4863314890950736, "ground_truth": 0}, {"key": "35815369", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684057121724594, "ground_truth": 0}, {"key": "35815369", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2465333581963113, "ground_truth": 0}, {"key": "35802823", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5409238720487035, "ground_truth": 0}, {"key": "35802823", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800910498627, "ground_truth": 0}, {"key": "35802823", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5926666107314602, "ground_truth": 0}, {"key": "35802823", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.726425607303577, "ground_truth": 0}, {"key": "35802823", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.647798233526865, "ground_truth": 0}, {"key": "38499968", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6893055998534829, "ground_truth": 0}, {"key": "38499968", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442250885884554, "ground_truth": 0}, {"key": "38499968", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49609384061180034, "ground_truth": 0}, {"key": "38499968", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632722691076, "ground_truth": 0}, {"key": "38499968", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204075192396, "ground_truth": 0}, {"key": "36926726", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4610167662916938, "ground_truth": 0}, {"key": "36926726", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48242911277217393, "ground_truth": 0}, {"key": "36926726", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7931059444525983, "ground_truth": 0}, {"key": "36926726", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216146188817, "ground_truth": 0}, {"key": "36926726", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061997504786, "ground_truth": 0}, {"key": "40903712", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3468730858244008, "ground_truth": 0}, {"key": "40903712", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6636689367049201, "ground_truth": 0}, {"key": "40903712", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058591081129278, "ground_truth": 0}, {"key": "40903712", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666003888292, "ground_truth": 0}, {"key": "40903712", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397065265676, "ground_truth": 0}, {"key": "19614862", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37022540610810695, "ground_truth": 0}, {"key": "19614862", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3040417041457964, "ground_truth": 0}, {"key": "19614862", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953399035616, "ground_truth": 0}, {"key": "19614862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4225046413448712, "ground_truth": 0}, {"key": "19614862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4493926648967721, "ground_truth": 0}, {"key": "38861704", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4167966516957862, "ground_truth": 0}, {"key": "38861704", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30239109921391655, "ground_truth": 0}, {"key": "38861704", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3998116602590163, "ground_truth": 0}, {"key": "38861704", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.399811645113656, "ground_truth": 0}, {"key": "38861704", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825680658788665, "ground_truth": 0}, {"key": "34349607", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32423539834297554, "ground_truth": 0}, {"key": "34349607", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5214711959715855, "ground_truth": 0}, {"key": "34349607", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34687308482428536, "ground_truth": 0}, {"key": "34349607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118265321913, "ground_truth": 0}, {"key": "34349607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311828171901, "ground_truth": 0}, {"key": "20773800", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16132023445318175, "ground_truth": 0}, {"key": "20773800", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34158248652579326, "ground_truth": 0}, {"key": "20773800", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16026604922115148, "ground_truth": 0}, {"key": "20773800", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2081789254662128, "ground_truth": 0}, {"key": "20773800", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1602660431076452, "ground_truth": 0}, {"key": "35545608", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5350984399159636, "ground_truth": 0}, {"key": "35545608", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263216127223677, "ground_truth": 0}, {"key": "35545608", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45907611167271345, "ground_truth": 0}, {"key": "35545608", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389727053326, "ground_truth": 0}, {"key": "35545608", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543874860892, "ground_truth": 0}, {"key": "37258984", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25832599982726384, "ground_truth": 0}, {"key": "37258984", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31742624781022255, "ground_truth": 0}, {"key": "37258984", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33633106677605196, "ground_truth": 0}, {"key": "37258984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098085872794677, "ground_truth": 0}, {"key": "37258984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944722602676728, "ground_truth": 0}, {"key": "37274562", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5544704930625863, "ground_truth": 0}, {"key": "37274562", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7154240049873202, "ground_truth": 0}, {"key": "37274562", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7074047131804777, "ground_truth": 0}, {"key": "37274562", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365339954292, "ground_truth": 0}, {"key": "37274562", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056282680659, "ground_truth": 0}, {"key": "40828068", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7879311825145966, "ground_truth": 0}, {"key": "40828068", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45326183832595224, "ground_truth": 0}, {"key": "40828068", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6740504904123743, "ground_truth": 0}, {"key": "40828068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.615087869501268, "ground_truth": 0}, {"key": "40828068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321999860381, "ground_truth": 0}, {"key": "37807180", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3157359615811679, "ground_truth": 0}, {"key": "37807180", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22678361904943517, "ground_truth": 0}, {"key": "37807180", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32594951656154514, "ground_truth": 0}, {"key": "37807180", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069437793341026, "ground_truth": 0}, {"key": "37807180", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633843587078, "ground_truth": 0}, {"key": "40748607", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8221891366315021, "ground_truth": 0}, {"key": "40748607", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9511422221976951, "ground_truth": 0}, {"key": "40748607", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8365545491776467, "ground_truth": 0}, {"key": "40748607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867853149373, "ground_truth": 0}, {"key": "40748607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.800692001045141, "ground_truth": 0}, {"key": "40123819", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9420819168482474, "ground_truth": 0}, {"key": "40123819", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4629586290984504, "ground_truth": 0}, {"key": "40123819", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.805632200020564, "ground_truth": 0}, {"key": "40123819", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9324533111337168, "ground_truth": 0}, {"key": "40123819", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872087654191, "ground_truth": 0}, {"key": "38453867", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010665712320253, "ground_truth": 0}, {"key": "38453867", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2766905486502641, "ground_truth": 0}, {"key": "38453867", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29583986710305593, "ground_truth": 0}, {"key": "38453867", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093951895014, "ground_truth": 0}, {"key": "38453867", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473481721174, "ground_truth": 0}, {"key": "38944856", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5195213275183491, "ground_truth": 0}, {"key": "38944856", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7217432062189555, "ground_truth": 0}, {"key": "38944856", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5621764985834127, "ground_truth": 0}, {"key": "38944856", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416320587986, "ground_truth": 0}, {"key": "38944856", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737092392474, "ground_truth": 0}, {"key": "35778898", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8832359759598043, "ground_truth": 0}, {"key": "35778898", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8006920050239013, "ground_truth": 0}, {"key": "35778898", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7969253608709131, "ground_truth": 0}, {"key": "35778898", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952921666747, "ground_truth": 0}, {"key": "35778898", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772329627324, "ground_truth": 0}, {"key": "32530125", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2925952834769741, "ground_truth": 0}, {"key": "32530125", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.590779206353889, "ground_truth": 0}, {"key": "32530125", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19559409069172282, "ground_truth": 0}, {"key": "32530125", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658972834035936, "ground_truth": 0}, {"key": "32530125", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601153702217687, "ground_truth": 0}, {"key": "35010363", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4397473590050286, "ground_truth": 0}, {"key": "35010363", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3140505541788698, "ground_truth": 0}, {"key": "35010363", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35936411203965474, "ground_truth": 0}, {"key": "35010363", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487417323206, "ground_truth": 0}, {"key": "35010363", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588047756563943, "ground_truth": 0}, {"key": "27514800", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.78133063569311, "ground_truth": 0}, {"key": "27514800", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8080672079019239, "ground_truth": 0}, {"key": "27514800", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.72797543552756, "ground_truth": 0}, {"key": "27514800", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238656604815, "ground_truth": 0}, {"key": "27514800", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527374974225, "ground_truth": 0}, {"key": "25725840", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19314738810175772, "ground_truth": 0}, {"key": "25725840", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09739039579972297, "ground_truth": 0}, {"key": "25725840", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953520914764305, "ground_truth": 0}, {"key": "25725840", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213072501362, "ground_truth": 0}, {"key": "25725840", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337718203686631, "ground_truth": 0}, {"key": "38327225", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25683200664281697, "ground_truth": 0}, {"key": "38327225", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31742629412026796, "ground_truth": 0}, {"key": "38327225", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.174410278422419, "ground_truth": 0}, {"key": "38327225", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2494472367312498, "ground_truth": 0}, {"key": "38327225", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245376168407, "ground_truth": 0}, {"key": "11991724", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5078118588346611, "ground_truth": 0}, {"key": "11991724", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5583269664938845, "ground_truth": 0}, {"key": "11991724", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.455198620845334, "ground_truth": 0}, {"key": "11991724", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745781657949, "ground_truth": 0}, {"key": "11991724", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046383938959, "ground_truth": 0}, {"key": "32217545", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.682573731932558, "ground_truth": 0}, {"key": "32217545", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49609381554086474, "ground_truth": 0}, {"key": "32217545", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7090191476114721, "ground_truth": 0}, {"key": "32217545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891008378976, "ground_truth": 0}, {"key": "32217545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358491992307, "ground_truth": 0}, {"key": "12731847", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3757064791332108, "ground_truth": 0}, {"key": "12731847", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7577943605605718, "ground_truth": 0}, {"key": "12731847", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43974736308109624, "ground_truth": 0}, {"key": "12731847", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606816146919577, "ground_truth": 0}, {"key": "12731847", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969118868542, "ground_truth": 0}, {"key": "36827234", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405055818432354, "ground_truth": 0}, {"key": "36827234", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026772207563, "ground_truth": 0}, {"key": "36827234", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8489721884001291, "ground_truth": 0}, {"key": "36827234", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762784566124, "ground_truth": 0}, {"key": "36827234", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585806899845, "ground_truth": 0}, {"key": "29111539", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5755879812026153, "ground_truth": 0}, {"key": "29111539", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476696263228, "ground_truth": 0}, {"key": "29111539", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5214711717158558, "ground_truth": 0}, {"key": "29111539", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907613247578716, "ground_truth": 0}, {"key": "29111539", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073611969793, "ground_truth": 0}, {"key": "37763052", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3522018133074819, "ground_truth": 0}, {"key": "37763052", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43398149116372436, "ground_truth": 0}, {"key": "37763052", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36477756864809113, "ground_truth": 0}, {"key": "37763052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591299298224, "ground_truth": 0}, {"key": "37763052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052593447276, "ground_truth": 0}, {"key": "30682335", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29421500143067253, "ground_truth": 0}, {"key": "30682335", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17553805578443066, "ground_truth": 0}, {"key": "30682335", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18594720051288538, "ground_truth": 0}, {"key": "30682335", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367174816713, "ground_truth": 0}, {"key": "30682335", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26740815958418745, "ground_truth": 0}, {"key": "12261276", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13296424300086598, "ground_truth": 0}, {"key": "12261276", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21076630415463232, "ground_truth": 0}, {"key": "12261276", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11757213553256146, "ground_truth": 0}, {"key": "12261276", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405542885275828, "ground_truth": 0}, {"key": "12261276", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541662446333788, "ground_truth": 0}, {"key": "36912979", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36116471526446414, "ground_truth": 0}, {"key": "36912979", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36477753400861307, "ground_truth": 0}, {"key": "36912979", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5117165863175958, "ground_truth": 0}, {"key": "36912979", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966326809025, "ground_truth": 0}, {"key": "36912979", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569734309674734, "ground_truth": 0}, {"key": "30205259", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6601723788884517, "ground_truth": 0}, {"key": "30205259", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6297745905423837, "ground_truth": 0}, {"key": "30205259", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5448013600878889, "ground_truth": 0}, {"key": "30205259", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704731208157, "ground_truth": 0}, {"key": "30205259", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.581303080138598, "ground_truth": 0}, {"key": "39458032", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9066531318525871, "ground_truth": 0}, {"key": "39458032", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8469578277978972, "ground_truth": 0}, {"key": "39458032", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7981867808912334, "ground_truth": 0}, {"key": "39458032", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583190583526, "ground_truth": 0}, {"key": "39458032", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647787088694, "ground_truth": 0}, {"key": "35116452", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12336563117511143, "ground_truth": 0}, {"key": "35116452", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12336561574425829, "ground_truth": 0}, {"key": "35116452", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10087861621037547, "ground_truth": 0}, {"key": "35116452", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1356895386363571, "ground_truth": 0}, {"key": "35116452", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238002986589592, "ground_truth": 0}, {"key": "40107476", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4035668363315127, "ground_truth": 0}, {"key": "40107476", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7154240134097318, "ground_truth": 0}, {"key": "40107476", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39420095986990733, "ground_truth": 0}, {"key": "40107476", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156198897751293, "ground_truth": 0}, {"key": "40107476", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814227782326, "ground_truth": 0}, {"key": "39501049", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8019358430474153, "ground_truth": 0}, {"key": "39501049", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8740772250773599, "ground_truth": 0}, {"key": "39501049", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9184802541807623, "ground_truth": 0}, {"key": "39501049", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274154677392, "ground_truth": 0}, {"key": "39501049", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110434222132, "ground_truth": 0}, {"key": "39642178", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30902371951222746, "ground_truth": 0}, {"key": "39642178", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3504214016894309, "ground_truth": 0}, {"key": "39642178", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3611647403642669, "ground_truth": 0}, {"key": "39642178", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.352201789600751, "ground_truth": 0}, {"key": "39642178", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3225260052170333, "ground_truth": 0}, {"key": "38024796", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12252321571194567, "ground_truth": 0}, {"key": "38024796", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3345894544073967, "ground_truth": 0}, {"key": "38024796", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14414887277658722, "ground_truth": 0}, {"key": "38024796", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047115926380639, "ground_truth": 0}, {"key": "38024796", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1688569530167029, "ground_truth": 0}, {"key": "36652079", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7905303025799317, "ground_truth": 0}, {"key": "36652079", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7813306329241837, "ground_truth": 0}, {"key": "36652079", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7490872151753977, "ground_truth": 0}, {"key": "36652079", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942251388337, "ground_truth": 0}, {"key": "36652079", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125535956781, "ground_truth": 0}, {"key": "32193402", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5544704877158844, "ground_truth": 0}, {"key": "32193402", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18010666182283988, "ground_truth": 0}, {"key": "32193402", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5019531269447877, "ground_truth": 0}, {"key": "32193402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640248998998, "ground_truth": 0}, {"key": "32193402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455948923119, "ground_truth": 0}, {"key": "32589706", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203708973706, "ground_truth": 0}, {"key": "32589706", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6959583266240243, "ground_truth": 0}, {"key": "32589706", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48047868925052584, "ground_truth": 0}, {"key": "32589706", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368392237977, "ground_truth": 0}, {"key": "32589706", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735124120082, "ground_truth": 0}, {"key": "38590589", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4130035533215498, "ground_truth": 0}, {"key": "38590589", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1688569614385489, "ground_truth": 0}, {"key": "38590589", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3398276340215771, "ground_truth": 0}, {"key": "38590589", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800887938465, "ground_truth": 0}, {"key": "38590589", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384227682831, "ground_truth": 0}, {"key": "37045414", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9928231184799847, "ground_truth": 0}, {"key": "37045414", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9778834101081806, "ground_truth": 0}, {"key": "37045414", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9600626867421574, "ground_truth": 0}, {"key": "37045414", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.962673112230283, "ground_truth": 0}, {"key": "37045414", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9910492885844954, "ground_truth": 0}, {"key": "33310095", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7074046879943527, "ground_truth": 0}, {"key": "33310095", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16026604014674503, "ground_truth": 0}, {"key": "33310095", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19436783129390459, "ground_truth": 0}, {"key": "33310095", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802426746936, "ground_truth": 0}, {"key": "33310095", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311746510154, "ground_truth": 0}, {"key": "37934604", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8376199624057544, "ground_truth": 0}, {"key": "37934604", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7431680122979258, "ground_truth": 0}, {"key": "37934604", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7325918397217827, "ground_truth": 0}, {"key": "37934604", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293654152754, "ground_truth": 0}, {"key": "37934604", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314840562881, "ground_truth": 0}, {"key": "39012181", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9814534343264936, "ground_truth": 0}, {"key": "39012181", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9801292822897969, "ground_truth": 0}, {"key": "39012181", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9728307667796775, "ground_truth": 0}, {"key": "39012181", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.956634201915149, "ground_truth": 0}, {"key": "39012181", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9704646632538897, "ground_truth": 0}, {"key": "40221674", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9381240136673159, "ground_truth": 0}, {"key": "40221674", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8539127526763934, "ground_truth": 0}, {"key": "40221674", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9390248186322718, "ground_truth": 0}, {"key": "40221674", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632866021706, "ground_truth": 0}, {"key": "40221674", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9496693649346649, "ground_truth": 0}, {"key": "36884862", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995827567731, "ground_truth": 0}, {"key": "36884862", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5832033432026241, "ground_truth": 0}, {"key": "36884862", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5175708763029946, "ground_truth": 0}, {"key": "36884862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203355686103, "ground_truth": 0}, {"key": "36884862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819621950732, "ground_truth": 0}, {"key": "39054429", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2107662777717385, "ground_truth": 0}, {"key": "39054429", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2422056079572807, "ground_truth": 0}, {"key": "39054429", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2005576581492681, "ground_truth": 0}, {"key": "39054429", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.286169242948037, "ground_truth": 0}, {"key": "39054429", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434189510984357, "ground_truth": 0}, {"key": "36753964", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010666017768356, "ground_truth": 0}, {"key": "36753964", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568319987676612, "ground_truth": 0}, {"key": "36753964", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34510525289269506, "ground_truth": 0}, {"key": "36753964", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15507847693053298, "ground_truth": 0}, {"key": "36753964", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678099420971, "ground_truth": 0}, {"key": "37612459", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20434190023719434, "ground_truth": 0}, {"key": "37612459", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17217184921796386, "ground_truth": 0}, {"key": "37612459", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18242553173090356, "ground_truth": 0}, {"key": "37612459", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077460895657155, "ground_truth": 0}, {"key": "37612459", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314737270620727, "ground_truth": 0}, {"key": "36805789", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5926666068776186, "ground_truth": 0}, {"key": "36805789", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7718434878591609, "ground_truth": 0}, {"key": "36805789", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6688802761206968, "ground_truth": 0}, {"key": "36805789", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121918863205, "ground_truth": 0}, {"key": "36805789", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754409760597, "ground_truth": 0}, {"key": "12757394", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18126319884985742, "ground_truth": 0}, {"key": "12757394", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27982849876125276, "ground_truth": 0}, {"key": "12757394", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2509127949814777, "ground_truth": 0}, {"key": "12757394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2365162361610737, "ground_truth": 0}, {"key": "12757394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.162380036593795, "ground_truth": 0}, {"key": "32192542", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047581684135285, "ground_truth": 0}, {"key": "32192542", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7956580898021397, "ground_truth": 0}, {"key": "32192542", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.531209398266034, "ground_truth": 0}, {"key": "32192542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825676512124164, "ground_truth": 0}, {"key": "32192542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046877671795, "ground_truth": 0}, {"key": "34856060", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16238003793415412, "ground_truth": 0}, {"key": "34856060", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2613309360772165, "ground_truth": 0}, {"key": "34856060", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186969064894426, "ground_truth": 0}, {"key": "34856060", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245579935514, "ground_truth": 0}, {"key": "34856060", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573597471629294, "ground_truth": 0}, {"key": "36083416", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.84286314989351, "ground_truth": 0}, {"key": "36083416", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7416740087356836, "ground_truth": 0}, {"key": "36083416", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7310585711841463, "ground_truth": 0}, {"key": "36083416", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191028676225, "ground_truth": 0}, {"key": "36083416", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578334489196, "ground_truth": 0}, {"key": "33839050", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42632161351936676, "ground_truth": 0}, {"key": "33839050", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23091976589123592, "ground_truth": 0}, {"key": "33839050", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4416729922498263, "ground_truth": 0}, {"key": "33839050", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244120001740367, "ground_truth": 0}, {"key": "33839050", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398144604989436, "ground_truth": 0}, {"key": "18464690", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3979384125294374, "ground_truth": 0}, {"key": "18464690", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43014736393017233, "ground_truth": 0}, {"key": "18464690", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30074558337215307, "ground_truth": 0}, {"key": "18464690", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417489708249, "ground_truth": 0}, {"key": "18464690", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441027136840392, "ground_truth": 0}, {"key": "39212665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29421496363061506, "ground_truth": 0}, {"key": "39212665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37754065806801673, "ground_truth": 0}, {"key": "39212665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20055766419975468, "ground_truth": 0}, {"key": "39212665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616923317577014, "ground_truth": 0}, {"key": "39212665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2281564883860385, "ground_truth": 0}, {"key": "40094011", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6132365477798521, "ground_truth": 0}, {"key": "40094011", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539862863004114, "ground_truth": 0}, {"key": "40094011", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42632157824837863, "ground_truth": 0}, {"key": "40094011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256151144106, "ground_truth": 0}, {"key": "40094011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631524578208, "ground_truth": 0}, {"key": "36036272", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4785288531177667, "ground_truth": 0}, {"key": "36036272", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28140562365405514, "ground_truth": 0}, {"key": "36036272", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3611647403203423, "ground_truth": 0}, {"key": "36036272", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.602061575337192, "ground_truth": 0}, {"key": "36036272", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681486979345, "ground_truth": 0}, {"key": "30681904", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23792990789631333, "ground_truth": 0}, {"key": "30681904", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2018131986123345, "ground_truth": 0}, {"key": "30681904", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32766831088206283, "ground_truth": 0}, {"key": "30681904", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881234180056, "ground_truth": 0}, {"key": "30681904", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2613309151443252, "ground_truth": 0}, {"key": "27834240", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601152708447144, "ground_truth": 0}, {"key": "27834240", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.0940101775531613, "ground_truth": 0}, {"key": "27834240", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13477591718320572, "ground_truth": 0}, {"key": "27834240", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765262656808118, "ground_truth": 0}, {"key": "27834240", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106117970746224, "ground_truth": 0}, {"key": "35025075", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18242553110719628, "ground_truth": 0}, {"key": "35025075", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.633410249614261, "ground_truth": 0}, {"key": "35025075", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337718440005538, "ground_truth": 0}, {"key": "35025075", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487162655874, "ground_truth": 0}, {"key": "35025075", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435836555693737, "ground_truth": 0}, {"key": "33316985", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5409238863604504, "ground_truth": 0}, {"key": "33316985", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.379378386861747, "ground_truth": 0}, {"key": "33316985", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3208213091155275, "ground_truth": 0}, {"key": "33316985", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359693920727, "ground_truth": 0}, {"key": "33316985", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306417397596426, "ground_truth": 0}, {"key": "17037056", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40544874714841656, "ground_truth": 0}, {"key": "17037056", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4610167978084854, "ground_truth": 0}, {"key": "17037056", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5136684674344284, "ground_truth": 0}, {"key": "17037056", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2523840347440863, "ground_truth": 0}, {"key": "17037056", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417254647814, "ground_truth": 0}, {"key": "34050457", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6442251008346925, "ground_truth": 0}, {"key": "34050457", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5175708900912445, "ground_truth": 0}, {"key": "34050457", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7592253992077537, "ground_truth": 0}, {"key": "34050457", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118928630694, "ground_truth": 0}, {"key": "34050457", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943729541402, "ground_truth": 0}, {"key": "34713745", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15921740276134516, "ground_truth": 0}, {"key": "34713745", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20946968170944397, "ground_truth": 0}, {"key": "34713745", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17895589148919175, "ground_truth": 0}, {"key": "34713745", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09807932099611487, "ground_truth": 0}, {"key": "34713745", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1789558874519346, "ground_truth": 0}, {"key": "40856210", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06008665745036525, "ground_truth": 0}, {"key": "40856210", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.0803574737059013, "ground_truth": 0}, {"key": "40856210", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07211220156752803, "ground_truth": 0}, {"key": "40856210", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1001722232067589, "ground_truth": 0}, {"key": "40856210", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08389038498876765, "ground_truth": 0}, {"key": "40848302", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8289388058402162, "ground_truth": 0}, {"key": "40848302", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241516900307, "ground_truth": 0}, {"key": "40848302", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7371581599152176, "ground_truth": 0}, {"key": "40848302", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416461795876, "ground_truth": 0}, {"key": "40848302", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754576462752, "ground_truth": 0}, {"key": "40636168", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4035668722962599, "ground_truth": 0}, {"key": "40636168", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116338759638, "ground_truth": 0}, {"key": "40636168", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24944724534312554, "ground_truth": 0}, {"key": "40636168", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606817458096444, "ground_truth": 0}, {"key": "40636168", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469143398221513, "ground_truth": 0}, {"key": "34423311", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3073580070193855, "ground_truth": 0}, {"key": "34423311", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27048023478243566, "ground_truth": 0}, {"key": "34423311", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320633968842608, "ground_truth": 0}, {"key": "34423311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510524972872747, "ground_truth": 0}, {"key": "34423311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252600017147415, "ground_truth": 0}, {"key": "34833945", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8519527872902767, "ground_truth": 0}, {"key": "34833945", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7264256032807198, "ground_truth": 0}, {"key": "34833945", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8407825784439363, "ground_truth": 0}, {"key": "34833945", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392830550966, "ground_truth": 0}, {"key": "34833945", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344069055545438, "ground_truth": 0}, {"key": "21272328", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24798741456926818, "ground_truth": 0}, {"key": "21272328", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29259528380611305, "ground_truth": 0}, {"key": "21272328", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28298810077797193, "ground_truth": 0}, {"key": "21272328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953520394783242, "ground_truth": 0}, {"key": "21272328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689405070920924, "ground_truth": 0}, {"key": "38648957", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12336561555657459, "ground_truth": 0}, {"key": "38648957", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16559311591317685, "ground_truth": 0}, {"key": "38648957", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1993079929776736, "ground_truth": 0}, {"key": "38648957", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1412814194143865, "ground_truth": 0}, {"key": "38648957", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596071843379424, "ground_truth": 0}, {"key": "24942981", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13206614969656985, "ground_truth": 0}, {"key": "24942981", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14608724213206845, "ground_truth": 0}, {"key": "24942981", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11920293103323289, "ground_truth": 0}, {"key": "24942981", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12852513884679873, "ground_truth": 0}, {"key": "24942981", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11279540398978456, "ground_truth": 0}, {"key": "35882366", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09807931189024467, "ground_truth": 0}, {"key": "35882366", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16559311773493948, "ground_truth": 0}, {"key": "35882366", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09203286394200105, "ground_truth": 0}, {"key": "35882366", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.158174347152242, "ground_truth": 0}, {"key": "35882366", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357958685812956, "ground_truth": 0}, {"key": "40559523", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49414089151864415, "ground_truth": 0}, {"key": "40559523", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880211756685, "ground_truth": 0}, {"key": "40559523", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6352224437033488, "ground_truth": 0}, {"key": "40559523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891028257154, "ground_truth": 0}, {"key": "40559523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634102521607, "ground_truth": 0}, {"key": "24632722", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2909808678848788, "ground_truth": 0}, {"key": "24632722", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43206338669183375, "ground_truth": 0}, {"key": "24632722", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2393493558399992, "ground_truth": 0}, {"key": "24632722", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111086842302963, "ground_truth": 0}, {"key": "24632722", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523289911875, "ground_truth": 0}, {"key": "36002759", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5097644018362821, "ground_truth": 0}, {"key": "36002759", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45326185164413213, "ground_truth": 0}, {"key": "36002759", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6057990640631586, "ground_truth": 0}, {"key": "36002759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675235059979, "ground_truth": 0}, {"key": "36002759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800630352555, "ground_truth": 0}, {"key": "29508534", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6187804483469369, "ground_truth": 0}, {"key": "29508534", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4378235071329378, "ground_truth": 0}, {"key": "29508534", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5117166003886962, "ground_truth": 0}, {"key": "29508534", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786950316799, "ground_truth": 0}, {"key": "29508534", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647197303643, "ground_truth": 0}, {"key": "15631612", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6057990482858154, "ground_truth": 0}, {"key": "15631612", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5019531272126375, "ground_truth": 0}, {"key": "15631612", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7620701210868336, "ground_truth": 0}, {"key": "15631612", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544349224787, "ground_truth": 0}, {"key": "15631612", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740303553215, "ground_truth": 0}, {"key": "40731892", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27048022465815796, "ground_truth": 0}, {"key": "40731892", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23651623150826528, "ground_truth": 0}, {"key": "40731892", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.320821288607735, "ground_truth": 0}, {"key": "40731892", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2107663180885356, "ground_truth": 0}, {"key": "40731892", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245214010724, "ground_truth": 0}, {"key": "35971910", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6132365414462687, "ground_truth": 0}, {"key": "35971910", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.79438493500442, "ground_truth": 0}, {"key": "35971910", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6688802382020713, "ground_truth": 0}, {"key": "35971910", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306244971298, "ground_truth": 0}, {"key": "35971910", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.638835268685553, "ground_truth": 0}, {"key": "34428424", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7154240229635237, "ground_truth": 0}, {"key": "34428424", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.859663754263971, "ground_truth": 0}, {"key": "34428424", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9376689612820656, "ground_truth": 0}, {"key": "34428424", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036253073285, "ground_truth": 0}, {"key": "34428424", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646981899508, "ground_truth": 0}, {"key": "36971005", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5964331546388684, "ground_truth": 0}, {"key": "36971005", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8407825841901754, "ground_truth": 0}, {"key": "36971005", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7356416376640499, "ground_truth": 0}, {"key": "36971005", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389910394137, "ground_truth": 0}, {"key": "36971005", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585642870753, "ground_truth": 0}, {"key": "34649067", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09268777277728939, "ground_truth": 0}, {"key": "34649067", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1384617805940479, "ground_truth": 0}, {"key": "34649067", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1233656175676689, "ground_truth": 0}, {"key": "34649067", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.061424043779229144, "ground_truth": 0}, {"key": "34649067", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08151974843775728, "ground_truth": 0}, {"key": "37355154", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2538610230000179, "ground_truth": 0}, {"key": "37355154", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6706082597689867, "ground_truth": 0}, {"key": "37355154", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1200256261928809, "ground_truth": 0}, {"key": "37355154", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.069541741629163, "ground_truth": 0}, {"key": "37355154", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055766625425206, "ground_truth": 0}, {"key": "38674697", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30902370876794044, "ground_truth": 0}, {"key": "38674697", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2479874362782097, "ground_truth": 0}, {"key": "38674697", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3684057041795904, "ground_truth": 0}, {"key": "38674697", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806418329935138, "ground_truth": 0}, {"key": "38674697", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.265880459513029, "ground_truth": 0}, {"key": "40525767", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9522199373093058, "ground_truth": 0}, {"key": "40525767", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7416740063532351, "ground_truth": 0}, {"key": "40525767", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9697854108317773, "ground_truth": 0}, {"key": "40525767", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358175949657, "ground_truth": 0}, {"key": "40525767", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437869034468, "ground_truth": 0}, {"key": "27165110", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07978200803624158, "ground_truth": 0}, {"key": "27165110", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20946967080782478, "ground_truth": 0}, {"key": "27165110", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07640768100208245, "ground_truth": 0}, {"key": "27165110", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231014279242856, "ground_truth": 0}, {"key": "27165110", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14706451859701464, "ground_truth": 0}, {"key": "35497491", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3793783689884612, "ground_truth": 0}, {"key": "35497491", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568319962129595, "ground_truth": 0}, {"key": "35497491", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47657965979537187, "ground_truth": 0}, {"key": "35497491", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730089476435, "ground_truth": 0}, {"key": "35497491", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352630931339, "ground_truth": 0}, {"key": "40690716", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6825737338310098, "ground_truth": 0}, {"key": "40690716", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6654105739828005, "ground_truth": 0}, {"key": "40690716", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7138307496685119, "ground_truth": 0}, {"key": "40690716", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118922853633, "ground_truth": 0}, {"key": "40690716", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872164728954, "ground_truth": 0}, {"key": "34835193", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8519528051469708, "ground_truth": 0}, {"key": "34835193", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8577681072931884, "ground_truth": 0}, {"key": "34835193", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8278281631362687, "ground_truth": 0}, {"key": "34835193", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606815931433736, "ground_truth": 0}, {"key": "34835193", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056080892853, "ground_truth": 0}, {"key": "39471712", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3276683073130005, "ground_truth": 0}, {"key": "39471712", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2422056445289878, "ground_truth": 0}, {"key": "39471712", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16559310647501935, "ground_truth": 0}, {"key": "39471712", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3007455954612652, "ground_truth": 0}, {"key": "39471712", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823339994340304, "ground_truth": 0}, {"key": "39115192", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8568123074350237, "ground_truth": 0}, {"key": "39115192", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953662147492, "ground_truth": 0}, {"key": "39115192", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8056321967350561, "ground_truth": 0}, {"key": "39115192", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964285676693, "ground_truth": 0}, {"key": "39115192", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563363615989, "ground_truth": 0}, {"key": "23520673", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.230919762662089, "ground_truth": 0}, {"key": "23520673", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539862901107468, "ground_truth": 0}, {"key": "23520673", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953415763647, "ground_truth": 0}, {"key": "23520673", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093572531661, "ground_truth": 0}, {"key": "23520673", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082130019407823, "ground_truth": 0}, {"key": "35764233", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38676343943899033, "ground_truth": 0}, {"key": "35764233", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2814056141059974, "ground_truth": 0}, {"key": "35764233", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26284183237750947, "ground_truth": 0}, {"key": "35764233", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149866469122, "ground_truth": 0}, {"key": "35764233", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.204341908590325, "ground_truth": 0}, {"key": "35228910", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.273574377676167, "ground_truth": 0}, {"key": "35228910", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5945512719505273, "ground_truth": 0}, {"key": "35228910", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3090236917591614, "ground_truth": 0}, {"key": "35228910", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610209174241, "ground_truth": 0}, {"key": "35228910", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344544597504343, "ground_truth": 0}, {"key": "36795599", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7853085631635245, "ground_truth": 0}, {"key": "36795599", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7606506628044495, "ground_truth": 0}, {"key": "36795599", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8577681122000266, "ground_truth": 0}, {"key": "36795599", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.790530307704514, "ground_truth": 0}, {"key": "36795599", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690914057501, "ground_truth": 0}, {"key": "38641949", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7170118774813359, "ground_truth": 0}, {"key": "38641949", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8344068755959865, "ground_truth": 0}, {"key": "38641949", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7879312139787558, "ground_truth": 0}, {"key": "38641949", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.749087216632097, "ground_truth": 0}, {"key": "38641949", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772315138695, "ground_truth": 0}, {"key": "29968443", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6513548668331948, "ground_truth": 0}, {"key": "29968443", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442251083653961, "ground_truth": 0}, {"key": "29968443", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6976089263604316, "ground_truth": 0}, {"key": "29968443", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.685949449599056, "ground_truth": 0}, {"key": "29968443", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964166971391, "ground_truth": 0}, {"key": "21268042", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4148988464799192, "ground_truth": 0}, {"key": "21268042", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.613236545202428, "ground_truth": 0}, {"key": "21268042", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869693008977366, "ground_truth": 0}, {"key": "21268042", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746190884682, "ground_truth": 0}, {"key": "21268042", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880136990361, "ground_truth": 0}, {"key": "26808572", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819859649813, "ground_truth": 0}, {"key": "26808572", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23651624072881952, "ground_truth": 0}, {"key": "26808572", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6388352803193288, "ground_truth": 0}, {"key": "26808572", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073583845233, "ground_truth": 0}, {"key": "26808572", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191222678245, "ground_truth": 0}, {"key": "37829390", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684698822322, "ground_truth": 0}, {"key": "37829390", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953655884194, "ground_truth": 0}, {"key": "37829390", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7341195228394661, "ground_truth": 0}, {"key": "37829390", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118068051213, "ground_truth": 0}, {"key": "37829390", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463119705783574, "ground_truth": 0}, {"key": "35716045", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6132365509870268, "ground_truth": 0}, {"key": "35716045", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.533154395583034, "ground_truth": 0}, {"key": "35716045", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5370413901895155, "ground_truth": 0}, {"key": "35716045", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.538983233023214, "ground_truth": 0}, {"key": "35716045", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.778649316904943, "ground_truth": 0}, {"key": "34367070", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4863315117443419, "ground_truth": 0}, {"key": "34367070", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6688802401125256, "ground_truth": 0}, {"key": "34367070", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6943026779244632, "ground_truth": 0}, {"key": "34367070", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.713830780138152, "ground_truth": 0}, {"key": "34367070", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321648657909, "ground_truth": 0}, {"key": "35239748", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2845759953133452, "ground_truth": 0}, {"key": "35239748", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.373875845156247, "ground_truth": 0}, {"key": "35239748", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2925952827646443, "ground_truth": 0}, {"key": "35239748", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526560191929, "ground_truth": 0}, {"key": "35239748", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834120157879, "ground_truth": 0}, {"key": "40421370", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46490155035379926, "ground_truth": 0}, {"key": "40421370", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14414885369191469, "ground_truth": 0}, {"key": "40421370", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27048022380940573, "ground_truth": 0}, {"key": "40421370", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495175195085, "ground_truth": 0}, {"key": "40421370", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510835837934543, "ground_truth": 0}, {"key": "37288396", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315943187354444, "ground_truth": 0}, {"key": "37288396", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29583986824282565, "ground_truth": 0}, {"key": "37288396", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.631594308527088, "ground_truth": 0}, {"key": "37288396", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.573678393574147, "ground_truth": 0}, {"key": "37288396", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061726264796, "ground_truth": 0}, {"key": "38903688", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7008948147976697, "ground_truth": 0}, {"key": "38903688", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.562176518200119, "ground_truth": 0}, {"key": "38903688", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7217432082891756, "ground_truth": 0}, {"key": "38903688", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217431933007827, "ground_truth": 0}, {"key": "38903688", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318300248971, "ground_truth": 0}, {"key": "28071228", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6548947133794139, "ground_truth": 0}, {"key": "28071228", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7461389908253213, "ground_truth": 0}, {"key": "28071228", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7620701039052005, "ground_truth": 0}, {"key": "28071228", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702848506842, "ground_truth": 0}, {"key": "28071228", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068786732106, "ground_truth": 0}, {"key": "36855834", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22953519608451117, "ground_truth": 0}, {"key": "36855834", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42059960875860064, "ground_truth": 0}, {"key": "36855834", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23510838267725606, "ground_truth": 0}, {"key": "36855834", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580054060403, "ground_truth": 0}, {"key": "36855834", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259977335757, "ground_truth": 0}, {"key": "40548717", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19072402862947221, "ground_truth": 0}, {"key": "40548717", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24798741118889295, "ground_truth": 0}, {"key": "40548717", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1623800185620701, "ground_truth": 0}, {"key": "40548717", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1645164528134759, "ground_truth": 0}, {"key": "40548717", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689405687018672, "ground_truth": 0}, {"key": "37051175", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6774740218942539, "ground_truth": 0}, {"key": "37051175", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.567936596530818, "ground_truth": 0}, {"key": "37051175", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3007455745474428, "ground_truth": 0}, {"key": "37051175", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166217016788, "ground_truth": 0}, {"key": "37051175", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046849554128, "ground_truth": 0}, {"key": "38882119", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6548947255208203, "ground_truth": 0}, {"key": "38882119", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241525266168, "ground_truth": 0}, {"key": "38882119", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7839884768983318, "ground_truth": 0}, {"key": "38882119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744890270176, "ground_truth": 0}, {"key": "38882119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238728746076, "ground_truth": 0}, {"key": "19485402", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46684561168054806, "ground_truth": 0}, {"key": "19485402", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3398276489149583, "ground_truth": 0}, {"key": "19485402", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4746312030662147, "ground_truth": 0}, {"key": "19485402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384009553061, "ground_truth": 0}, {"key": "19485402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108770625468, "ground_truth": 0}, {"key": "36060907", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13477592738881064, "ground_truth": 0}, {"key": "36060907", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21076629353710966, "ground_truth": 0}, {"key": "36060907", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14903529943093552, "ground_truth": 0}, {"key": "36060907", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055767441027114, "ground_truth": 0}, {"key": "36060907", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1302854146407685, "ground_truth": 0}, {"key": "24037309", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35042138208373375, "ground_truth": 0}, {"key": "24037309", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38306418112442664, "ground_truth": 0}, {"key": "24037309", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47268347682134815, "ground_truth": 0}, {"key": "24037309", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284990988655, "ground_truth": 0}, {"key": "24037309", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793838467425735, "ground_truth": 0}, {"key": "35605805", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242353963308558, "ground_truth": 0}, {"key": "35605805", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43590151076061856, "ground_truth": 0}, {"key": "35605805", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5679366140498129, "ground_truth": 0}, {"key": "35605805", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756755787465655, "ground_truth": 0}, {"key": "35605805", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203108183162, "ground_truth": 0}, {"key": "17706248", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22270014223471607, "ground_truth": 0}, {"key": "17706248", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18126319122166298, "ground_truth": 0}, {"key": "17706248", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24798742466747986, "ground_truth": 0}, {"key": "17706248", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2146914240243559, "ground_truth": 0}, {"key": "17706248", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420097216668476, "ground_truth": 0}, {"key": "36883559", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6723316746174526, "ground_truth": 0}, {"key": "36883559", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5544704715600428, "ground_truth": 0}, {"key": "36883559", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32423541094348934, "ground_truth": 0}, {"key": "36883559", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740309977097, "ground_truth": 0}, {"key": "36883559", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352759203737, "ground_truth": 0}, {"key": "32799471", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47657966048097256, "ground_truth": 0}, {"key": "32799471", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4941409046771716, "ground_truth": 0}, {"key": "32799471", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3684057095568117, "ground_truth": 0}, {"key": "32799471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468730898138807, "ground_truth": 0}, {"key": "32799471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531239608802, "ground_truth": 0}, {"key": "34797243", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25091281504524876, "ground_truth": 0}, {"key": "34797243", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5467381476341442, "ground_truth": 0}, {"key": "34797243", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4882833973293643, "ground_truth": 0}, {"key": "34797243", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.312369997426415, "ground_truth": 0}, {"key": "34797243", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573597136407733, "ground_truth": 0}, {"key": "32154876", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33285231477175087, "ground_truth": 0}, {"key": "32154876", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.352201803951195, "ground_truth": 0}, {"key": "32154876", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28937169255016404, "ground_truth": 0}, {"key": "32154876", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660839288680443, "ground_truth": 0}, {"key": "32154876", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815650462617124, "ground_truth": 0}, {"key": "37962274", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2583259803300443, "ground_truth": 0}, {"key": "37962274", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6150878333702811, "ground_truth": 0}, {"key": "37962274", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3522017625178691, "ground_truth": 0}, {"key": "37962274", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910921733616, "ground_truth": 0}, {"key": "37962274", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641875148276, "ground_truth": 0}, {"key": "35574030", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.585101158226629, "ground_truth": 0}, {"key": "35574030", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5448013800417562, "ground_truth": 0}, {"key": "35574030", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6566582628333696, "ground_truth": 0}, {"key": "35574030", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167528506093, "ground_truth": 0}, {"key": "35574030", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746024950042, "ground_truth": 0}, {"key": "39105949", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18594719222722228, "ground_truth": 0}, {"key": "39105949", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3056973174477394, "ground_truth": 0}, {"key": "39105949", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24077458274196833, "ground_truth": 0}, {"key": "39105949", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074556363800764, "ground_truth": 0}, {"key": "39105949", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106119278277365, "ground_truth": 0}, {"key": "41064322", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8469578515728127, "ground_truth": 0}, {"key": "41064322", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.770464800785343, "ground_truth": 0}, {"key": "41064322", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8679338421574182, "ground_truth": 0}, {"key": "41064322", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711766256728, "ground_truth": 0}, {"key": "41064322", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585894896421, "ground_truth": 0}, {"key": "28105101", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6943026672592243, "ground_truth": 0}, {"key": "28105101", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7090191279266723, "ground_truth": 0}, {"key": "28105101", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41111083717484875, "ground_truth": 0}, {"key": "28105101", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786073269443, "ground_truth": 0}, {"key": "28105101", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318370018248, "ground_truth": 0}, {"key": "36036068", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6513548430329084, "ground_truth": 0}, {"key": "36036068", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117166134839558, "ground_truth": 0}, {"key": "36036068", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6688802620700993, "ground_truth": 0}, {"key": "36036068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185362715646, "ground_truth": 0}, {"key": "36036068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.624293535211074, "ground_truth": 0}, {"key": "37991460", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6261241709882678, "ground_truth": 0}, {"key": "37991460", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331585990139, "ground_truth": 0}, {"key": "37991460", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6757645967781348, "ground_truth": 0}, {"key": "37991460", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832192159999, "ground_truth": 0}, {"key": "37991460", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.560252661223637, "ground_truth": 0}, {"key": "38437830", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.552539713917535, "ground_truth": 0}, {"key": "38437830", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3960681979810195, "ground_truth": 0}, {"key": "38437830", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7138307423588122, "ground_truth": 0}, {"key": "38437830", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878338966455, "ground_truth": 0}, {"key": "38437830", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316932031289, "ground_truth": 0}, {"key": "36507138", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3849121570395144, "ground_truth": 0}, {"key": "36507138", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24220563459556232, "ground_truth": 0}, {"key": "36507138", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20307462526242415, "ground_truth": 0}, {"key": "36507138", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982563499890166, "ground_truth": 0}, {"key": "36507138", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360039892750436, "ground_truth": 0}, {"key": "37824866", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203502514608, "ground_truth": 0}, {"key": "37824866", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6187804220109778, "ground_truth": 0}, {"key": "37824866", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.451326531876204, "ground_truth": 0}, {"key": "37824866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544298842791, "ground_truth": 0}, {"key": "37824866", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531218508162, "ground_truth": 0}, {"key": "25088134", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14033626120230144, "ground_truth": 0}, {"key": "25088134", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.397938398516613, "ground_truth": 0}, {"key": "25088134", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31912138072460977, "ground_truth": 0}, {"key": "25088134", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606819303214214, "ground_truth": 0}, {"key": "25088134", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561503585108917, "ground_truth": 0}, {"key": "40172531", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.577495365914894, "ground_truth": 0}, {"key": "40172531", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5175708593225418, "ground_truth": 0}, {"key": "40172531", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.69760892083312, "ground_truth": 0}, {"key": "40172531", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592253877395647, "ground_truth": 0}, {"key": "40172531", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300431145565, "ground_truth": 0}, {"key": "37035874", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28140561650153545, "ground_truth": 0}, {"key": "37035874", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3023910849165958, "ground_truth": 0}, {"key": "37035874", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24508502770064503, "ground_truth": 0}, {"key": "37035874", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202454036638823, "ground_truth": 0}, {"key": "37035874", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2465333511586931, "ground_truth": 0}, {"key": "36404465", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7662936348501199, "ground_truth": 0}, {"key": "36404465", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8998277822645298, "ground_truth": 0}, {"key": "36404465", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7745833859331823, "ground_truth": 0}, {"key": "36404465", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036020554901, "ground_truth": 0}, {"key": "36404465", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585719557706, "ground_truth": 0}, {"key": "39602052", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.734119521645403, "ground_truth": 0}, {"key": "39602052", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7217432152749377, "ground_truth": 0}, {"key": "39602052", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7648916041668503, "ground_truth": 0}, {"key": "39602052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216119942392, "ground_truth": 0}, {"key": "39602052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228757086729, "ground_truth": 0}, {"key": "33792789", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4244119797661528, "ground_truth": 0}, {"key": "33792789", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31573599282575143, "ground_truth": 0}, {"key": "33792789", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28298812029319953, "ground_truth": 0}, {"key": "33792789", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510528510950067, "ground_truth": 0}, {"key": "33792789", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26133091356081367, "ground_truth": 0}, {"key": "32776626", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26588045046480613, "ground_truth": 0}, {"key": "32776626", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43782352363154337, "ground_truth": 0}, {"key": "32776626", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2295352053949162, "ground_truth": 0}, {"key": "32776626", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669052362584834, "ground_truth": 0}, {"key": "32776626", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244120133034446, "ground_truth": 0}, {"key": "37195090", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3684057024911389, "ground_truth": 0}, {"key": "37195090", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38491214611059316, "ground_truth": 0}, {"key": "37195090", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320633981970933, "ground_truth": 0}, {"key": "37195090", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544873118354235, "ground_truth": 0}, {"key": "37195090", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897505944561, "ground_truth": 0}, {"key": "33981824", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.242205622836417, "ground_truth": 0}, {"key": "33981824", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2436424354219665, "ground_truth": 0}, {"key": "33981824", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18594721056942123, "ground_truth": 0}, {"key": "33981824", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132023332577305, "ground_truth": 0}, {"key": "33981824", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29746993210697453, "ground_truth": 0}, {"key": "39569142", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2877678244756455, "ground_truth": 0}, {"key": "39569142", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48242912581203173, "ground_truth": 0}, {"key": "39569142", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4073333923902632, "ground_truth": 0}, {"key": "39569142", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684056832625083, "ground_truth": 0}, {"key": "39569142", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742625393837415, "ground_truth": 0}, {"key": "40268210", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6206215989773739, "ground_truth": 0}, {"key": "40268210", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3886180350120824, "ground_truth": 0}, {"key": "40268210", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4863315207637091, "ground_truth": 0}, {"key": "40268210", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.717011882353179, "ground_truth": 0}, {"key": "40268210", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413669077392, "ground_truth": 0}, {"key": "34925159", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.785308582014961, "ground_truth": 0}, {"key": "34925159", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5097643784766922, "ground_truth": 0}, {"key": "34925159", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7676898437975977, "ground_truth": 0}, {"key": "34925159", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346091544272, "ground_truth": 0}, {"key": "34925159", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281583489984, "ground_truth": 0}, {"key": "36181903", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6774740204267791, "ground_truth": 0}, {"key": "36181903", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6495786304075527, "ground_truth": 0}, {"key": "36181903", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7074046917930207, "ground_truth": 0}, {"key": "36181903", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476762746716, "ground_truth": 0}, {"key": "36181903", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624789813764, "ground_truth": 0}, {"key": "38620559", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7772998500906297, "ground_truth": 0}, {"key": "38620559", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7759445577530648, "ground_truth": 0}, {"key": "38620559", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7592254409915654, "ground_truth": 0}, {"key": "38620559", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743619664516, "ground_truth": 0}, {"key": "38620559", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314698184397, "ground_truth": 0}, {"key": "32719657", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2568320043019003, "ground_truth": 0}, {"key": "32719657", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33633105657082224, "ground_truth": 0}, {"key": "32719657", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20817894500069628, "ground_truth": 0}, {"key": "32719657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588047766068923, "ground_truth": 0}, {"key": "32719657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476751530284982, "ground_truth": 0}, {"key": "37530914", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3923368316315719, "ground_truth": 0}, {"key": "37530914", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44939263353084624, "ground_truth": 0}, {"key": "37530914", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5195212936350122, "ground_truth": 0}, {"key": "37530914", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213629857781, "ground_truth": 0}, {"key": "37530914", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441199810536123, "ground_truth": 0}, {"key": "33306933", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40356685943857834, "ground_truth": 0}, {"key": "33306933", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185326762166, "ground_truth": 0}, {"key": "33306933", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058590700702866, "ground_truth": 0}, {"key": "33306933", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474602701353087, "ground_truth": 0}, {"key": "33306933", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216328936563, "ground_truth": 0}, {"key": "33837212", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32082129277325994, "ground_truth": 0}, {"key": "33837212", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22815651285289107, "ground_truth": 0}, {"key": "33837212", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3380771151845728, "ground_truth": 0}, {"key": "33837212", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552954422770963, "ground_truth": 0}, {"key": "33837212", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405054821454825, "ground_truth": 0}, {"key": "40945179", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45326183887721555, "ground_truth": 0}, {"key": "40945179", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46295858677551266, "ground_truth": 0}, {"key": "40945179", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4668456065709904, "ground_truth": 0}, {"key": "40945179", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761523246308, "ground_truth": 0}, {"key": "40945179", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743510814588, "ground_truth": 0}, {"key": "34152358", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3380771372238381, "ground_truth": 0}, {"key": "34152358", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24508500458283894, "ground_truth": 0}, {"key": "34152358", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3923368310524029, "ground_truth": 0}, {"key": "34152358", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824983485702, "ground_truth": 0}, {"key": "34152358", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387583935217156, "ground_truth": 0}, {"key": "34136541", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203633610275, "ground_truth": 0}, {"key": "34136541", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43782349330669246, "ground_truth": 0}, {"key": "34136541", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38861801583207856, "ground_truth": 0}, {"key": "34136541", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288288737997, "ground_truth": 0}, {"key": "34136541", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746174999563, "ground_truth": 0}, {"key": "37469603", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5640984627677175, "ground_truth": 0}, {"key": "37469603", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185176308608, "ground_truth": 0}, {"key": "37469603", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.724870272535439, "ground_truth": 0}, {"key": "37469603", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216032627655, "ground_truth": 0}, {"key": "37469603", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787177317518, "ground_truth": 0}, {"key": "37353611", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.579400362669273, "ground_truth": 0}, {"key": "37353611", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7745833771421538, "ground_truth": 0}, {"key": "37353611", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7745833760780346, "ground_truth": 0}, {"key": "37353611", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689429732759, "ground_truth": 0}, {"key": "37353611", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743534175249, "ground_truth": 0}, {"key": "37211649", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4282334046946584, "ground_truth": 0}, {"key": "37211649", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331476699023, "ground_truth": 0}, {"key": "37211649", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5794003818529511, "ground_truth": 0}, {"key": "37211649", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015945329908, "ground_truth": 0}, {"key": "37211649", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988391301795, "ground_truth": 0}, {"key": "37320976", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20055768868695176, "ground_truth": 0}, {"key": "37320976", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1993080111953775, "ground_truth": 0}, {"key": "37320976", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4746311681241776, "ground_truth": 0}, {"key": "37320976", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168779367785423, "ground_truth": 0}, {"key": "37320976", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730862304681, "ground_truth": 0}, {"key": "34492412", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7233094787084258, "ground_truth": 0}, {"key": "34492412", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5486734859318794, "ground_truth": 0}, {"key": "34492412", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6370307820371043, "ground_truth": 0}, {"key": "34492412", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804686490756284, "ground_truth": 0}, {"key": "34492412", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321882103638, "ground_truth": 0}, {"key": "36655016", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8459424252375536, "ground_truth": 0}, {"key": "36655016", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8044059156580072, "ground_truth": 0}, {"key": "36655016", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7905303135119326, "ground_truth": 0}, {"key": "36655016", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321845894482, "ground_truth": 0}, {"key": "36655016", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919918954805, "ground_truth": 0}, {"key": "35220773", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43590148869276946, "ground_truth": 0}, {"key": "35220773", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4804786835043312, "ground_truth": 0}, {"key": "35220773", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3904758261149207, "ground_truth": 0}, {"key": "35220773", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093747632741, "ground_truth": 0}, {"key": "35220773", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688256949555, "ground_truth": 0}, {"key": "31569808", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2735743988902527, "ground_truth": 0}, {"key": "31569808", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17441029355961385, "ground_truth": 0}, {"key": "31569808", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.188323985127761, "ground_truth": 0}, {"key": "31569808", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2056150396076585, "ground_truth": 0}, {"key": "31569808", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315402824095, "ground_truth": 0}, {"key": "37696256", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26740816044423604, "ground_truth": 0}, {"key": "37696256", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20689407749237196, "ground_truth": 0}, {"key": "37696256", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561505010881947, "ground_truth": 0}, {"key": "37696256", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930798967168517, "ground_truth": 0}, {"key": "37696256", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839774853856, "ground_truth": 0}, {"key": "36874328", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.353986311108806, "ground_truth": 0}, {"key": "36874328", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241721541449, "ground_truth": 0}, {"key": "36874328", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7461389784026519, "ground_truth": 0}, {"key": "36874328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740425820157, "ground_truth": 0}, {"key": "36874328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689670844235, "ground_truth": 0}, {"key": "24532377", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17106119031392492, "ground_truth": 0}, {"key": "24532377", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11516222621883158, "ground_truth": 0}, {"key": "24532377", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18010667050392598, "ground_truth": 0}, {"key": "24532377", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678141536166, "ground_truth": 0}, {"key": "24532377", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934931401480225, "ground_truth": 0}, {"key": "39560618", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48242912341269795, "ground_truth": 0}, {"key": "39560618", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7074047121655636, "ground_truth": 0}, {"key": "39560618", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5389832154030169, "ground_truth": 0}, {"key": "39560618", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590153689842254, "ground_truth": 0}, {"key": "39560618", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526410233446, "ground_truth": 0}, {"key": "34922693", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2735743894774478, "ground_truth": 0}, {"key": "34922693", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26133092303142735, "ground_truth": 0}, {"key": "34922693", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2538610016597276, "ground_truth": 0}, {"key": "34922693", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310720151566, "ground_truth": 0}, {"key": "34922693", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31237000436838275, "ground_truth": 0}, {"key": "33629577", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12002562842072667, "ground_truth": 0}, {"key": "33629577", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20307462201299215, "ground_truth": 0}, {"key": "33629577", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08570927993872439, "ground_truth": 0}, {"key": "33629577", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804719546949616, "ground_truth": 0}, {"key": "33629577", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1366083940947868, "ground_truth": 0}, {"key": "32284359", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27512971702373407, "ground_truth": 0}, {"key": "32284359", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3757064539421956, "ground_truth": 0}, {"key": "32284359", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4571367304362201, "ground_truth": 0}, {"key": "32284359", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064778089183, "ground_truth": 0}, {"key": "32284359", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059956214808814, "ground_truth": 0}, {"key": "28082962", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11516222827673366, "ground_truth": 0}, {"key": "28082962", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10017220690862152, "ground_truth": 0}, {"key": "28082962", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1200256239292283, "ground_truth": 0}, {"key": "28082962", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08210662601050847, "ground_truth": 0}, {"key": "28082962", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08882029477895888, "ground_truth": 0}, {"key": "24796803", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8670357512479191, "ground_truth": 0}, {"key": "24796803", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7008947900106233, "ground_truth": 0}, {"key": "24796803", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19436780915812119, "ground_truth": 0}, {"key": "24796803", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.658417503944704, "ground_truth": 0}, {"key": "24796803", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228665854652, "ground_truth": 0}, {"key": "35466150", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4436004378590589, "ground_truth": 0}, {"key": "35466150", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45519860142376756, "ground_truth": 0}, {"key": "35466150", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.620621642679765, "ground_truth": 0}, {"key": "35466150", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102878330182, "ground_truth": 0}, {"key": "35466150", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197437385806, "ground_truth": 0}, {"key": "35754289", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8418256522490101, "ground_truth": 0}, {"key": "35754289", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7325918057872126, "ground_truth": 0}, {"key": "35754289", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7279754592092472, "ground_truth": 0}, {"key": "35754289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.812867317409259, "ground_truth": 0}, {"key": "35754289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256070371323, "ground_truth": 0}, {"key": "36678662", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8469578475418065, "ground_truth": 0}, {"key": "36678662", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8824278736802036, "ground_truth": 0}, {"key": "36678662", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.778649299106921, "ground_truth": 0}, {"key": "36678662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942076360692, "ground_truth": 0}, {"key": "36678662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240804566209, "ground_truth": 0}, {"key": "35399671", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7217431751501598, "ground_truth": 0}, {"key": "35399671", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7057850184534109, "ground_truth": 0}, {"key": "35399671", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7310585683704438, "ground_truth": 0}, {"key": "35399671", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461390035438444, "ground_truth": 0}, {"key": "35399671", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388353032035055, "ground_truth": 0}, {"key": "36888180", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6619228551695756, "ground_truth": 0}, {"key": "36888180", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4455295510028864, "ground_truth": 0}, {"key": "36888180", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.542863276409743, "ground_truth": 0}, {"key": "36888180", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.624293542586548, "ground_truth": 0}, {"key": "36888180", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242909086506713, "ground_truth": 0}, {"key": "28061069", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5058590842058973, "ground_truth": 0}, {"key": "28061069", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23231014923867577, "ground_truth": 0}, {"key": "28061069", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3557748931730051, "ground_truth": 0}, {"key": "28061069", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632158901670175, "ground_truth": 0}, {"key": "28061069", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730262895583, "ground_truth": 0}, {"key": "22259982", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17553806501128488, "ground_truth": 0}, {"key": "22259982", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32082129095078704, "ground_truth": 0}, {"key": "22259982", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21469141659561142, "ground_truth": 0}, {"key": "22259982", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776332933343804, "ground_truth": 0}, {"key": "22259982", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1955940932772492, "ground_truth": 0}, {"key": "34026805", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7892336826327201, "ground_truth": 0}, {"key": "34026805", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6893056173754876, "ground_truth": 0}, {"key": "34026805", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7170118794730082, "ground_truth": 0}, {"key": "34026805", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318054914249, "ground_truth": 0}, {"key": "34026805", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764947931251, "ground_truth": 0}, {"key": "36713809", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4746311777401656, "ground_truth": 0}, {"key": "36713809", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38121955435568927, "ground_truth": 0}, {"key": "36713809", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869689116368286, "ground_truth": 0}, {"key": "36713809", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295861600854327, "ground_truth": 0}, {"key": "36713809", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137180381671, "ground_truth": 0}, {"key": "39726411", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2704802267566516, "ground_truth": 0}, {"key": "39726411", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23231014116486054, "ground_truth": 0}, {"key": "39726411", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23091977771201908, "ground_truth": 0}, {"key": "39726411", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882103154944, "ground_truth": 0}, {"key": "39726411", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1470645189886734, "ground_truth": 0}, {"key": "37069841", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7918210752411571, "ground_truth": 0}, {"key": "37069841", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6791786985584913, "ground_truth": 0}, {"key": "37069841", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6943026722095295, "ground_truth": 0}, {"key": "37069841", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424446813696, "ground_truth": 0}, {"key": "37069841", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615381988909739, "ground_truth": 0}, {"key": "38894693", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5370413881762605, "ground_truth": 0}, {"key": "38894693", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5195213471886385, "ground_truth": 0}, {"key": "38894693", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7431679918539965, "ground_truth": 0}, {"key": "38894693", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575495578334, "ground_truth": 0}, {"key": "38894693", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228934384235, "ground_truth": 0}, {"key": "33946032", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7662936469233635, "ground_truth": 0}, {"key": "33946032", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7577943850670021, "ground_truth": 0}, {"key": "33946032", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8670357662898327, "ground_truth": 0}, {"key": "33946032", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367884458797, "ground_truth": 0}, {"key": "33946032", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748642337595, "ground_truth": 0}, {"key": "39035311", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5312093446091972, "ground_truth": 0}, {"key": "39035311", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2861692439592556, "ground_truth": 0}, {"key": "39035311", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4339814667815894, "ground_truth": 0}, {"key": "39035311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823341414357097, "ground_truth": 0}, {"key": "39035311", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594951483309803, "ground_truth": 0}, {"key": "27680038", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2909808782872854, "ground_truth": 0}, {"key": "27680038", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.0803574687895287, "ground_truth": 0}, {"key": "27680038", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15713684870251404, "ground_truth": 0}, {"key": "27680038", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17328819237059667, "ground_truth": 0}, {"key": "27680038", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213785086319, "ground_truth": 0}, {"key": "36901907", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.50781185749443, "ground_truth": 0}, {"key": "36901907", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953673004991, "ground_truth": 0}, {"key": "36901907", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4863315566564802, "ground_truth": 0}, {"key": "36901907", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582711431691, "ground_truth": 0}, {"key": "36901907", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473616824076, "ground_truth": 0}, {"key": "21530542", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.262841847372626, "ground_truth": 0}, {"key": "21530542", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5097644110185426, "ground_truth": 0}, {"key": "21530542", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27825680676840725, "ground_truth": 0}, {"key": "21530542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713670788295185, "ground_truth": 0}, {"key": "21530542", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610138742271, "ground_truth": 0}, {"key": "38192532", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5926666109828623, "ground_truth": 0}, {"key": "38192532", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5312093445605262, "ground_truth": 0}, {"key": "38192532", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4902356308158964, "ground_truth": 0}, {"key": "38192532", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823339896137136, "ground_truth": 0}, {"key": "38192532", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366423804857, "ground_truth": 0}, {"key": "34102400", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16776335881914298, "ground_truth": 0}, {"key": "34102400", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10818895241402274, "ground_truth": 0}, {"key": "34102400", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11757213237141548, "ground_truth": 0}, {"key": "34102400", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223190115666914, "ground_truth": 0}, {"key": "34102400", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1366083851745593, "ground_truth": 0}, {"key": "36133399", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4378234834380859, "ground_truth": 0}, {"key": "36133399", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6706082527205323, "ground_truth": 0}, {"key": "36133399", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39233684903619787, "ground_truth": 0}, {"key": "36133399", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984868554307, "ground_truth": 0}, {"key": "36133399", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423538715199374, "ground_truth": 0}, {"key": "34314544", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6242935379412422, "ground_truth": 0}, {"key": "34314544", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688197953199, "ground_truth": 0}, {"key": "34314544", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4244119985097907, "ground_truth": 0}, {"key": "34314544", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813031208914549, "ground_truth": 0}, {"key": "34314544", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953568363201, "ground_truth": 0}, {"key": "33460074", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526325887022, "ground_truth": 0}, {"key": "33460074", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880297099092, "ground_truth": 0}, {"key": "33460074", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40544874134772074, "ground_truth": 0}, {"key": "33460074", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808865829693, "ground_truth": 0}, {"key": "33460074", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953467082689, "ground_truth": 0}, {"key": "36191495", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4378235010124322, "ground_truth": 0}, {"key": "36191495", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2323101460598998, "ground_truth": 0}, {"key": "36191495", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16885695364623238, "ground_truth": 0}, {"key": "36191495", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076631111502456, "ground_truth": 0}, {"key": "36191495", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577488634243043, "ground_truth": 0}, {"key": "39532668", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6992543960004822, "ground_truth": 0}, {"key": "39532668", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7759445651198804, "ground_truth": 0}, {"key": "39532668", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7371581492820207, "ground_truth": 0}, {"key": "39532668", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476636085398, "ground_truth": 0}, {"key": "39532668", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195095651665, "ground_truth": 0}, {"key": "20328247", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4687906094943615, "ground_truth": 0}, {"key": "20328247", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19559409838571226, "ground_truth": 0}, {"key": "20328247", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5907792212539943, "ground_truth": 0}, {"key": "20328247", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366085461475, "ground_truth": 0}, {"key": "20328247", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416729769347504, "ground_truth": 0}, {"key": "39112675", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40922076653452, "ground_truth": 0}, {"key": "39112675", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3486451311893087, "ground_truth": 0}, {"key": "39112675", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42632159628555627, "ground_truth": 0}, {"key": "39112675", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250465400346043, "ground_truth": 0}, {"key": "39112675", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544872031666296, "ground_truth": 0}, {"key": "31620300", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3073580282734415, "ground_truth": 0}, {"key": "31620300", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3328523254276527, "ground_truth": 0}, {"key": "31620300", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32766830100879696, "ground_truth": 0}, {"key": "31620300", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3793784031056337, "ground_truth": 0}, {"key": "31620300", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420095817642536, "ground_truth": 0}, {"key": "37518509", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1081889498998871, "ground_truth": 0}, {"key": "37518509", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28776781727169637, "ground_truth": 0}, {"key": "37518509", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16344543434159586, "ground_truth": 0}, {"key": "37518509", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436851803295155, "ground_truth": 0}, {"key": "37518509", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245118083003, "ground_truth": 0}, {"key": "35454095", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5370413641920119, "ground_truth": 0}, {"key": "35454095", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8187367899075402, "ground_truth": 0}, {"key": "35454095", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7476159386865047, "ground_truth": 0}, {"key": "35454095", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358800237704, "ground_truth": 0}, {"key": "35454095", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884632614622, "ground_truth": 0}, {"key": "38542788", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5640984861301542, "ground_truth": 0}, {"key": "38542788", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5583269696819781, "ground_truth": 0}, {"key": "38542788", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8244619225886389, "ground_truth": 0}, {"key": "38542788", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646975189508, "ground_truth": 0}, {"key": "38542788", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321831352264, "ground_truth": 0}, {"key": "23944937", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7138307842015277, "ground_truth": 0}, {"key": "23944937", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2240554638953111, "ground_truth": 0}, {"key": "23944937", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5964331362779871, "ground_truth": 0}, {"key": "23944937", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108711349121, "ground_truth": 0}, {"key": "23944937", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423540596104605, "ground_truth": 0}, {"key": "31753944", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22678363333312196, "ground_truth": 0}, {"key": "31753944", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14223190224252763, "ground_truth": 0}, {"key": "31753944", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23510841059034018, "ground_truth": 0}, {"key": "31753944", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938986505902, "ground_truth": 0}, {"key": "31753944", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091277828050446, "ground_truth": 0}, {"key": "35527214", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3276682999157282, "ground_truth": 0}, {"key": "35527214", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41111086047000733, "ground_truth": 0}, {"key": "35527214", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2893716958622153, "ground_truth": 0}, {"key": "35527214", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934935051542625, "ground_truth": 0}, {"key": "35527214", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944725878519539, "ground_truth": 0}, {"key": "40400404", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8596637499839803, "ground_truth": 0}, {"key": "40400404", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.746139002514509, "ground_truth": 0}, {"key": "40400404", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7704647767878745, "ground_truth": 0}, {"key": "40400404", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897219683492, "ground_truth": 0}, {"key": "40400404", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760310696828, "ground_truth": 0}, {"key": "21713119", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22270014876873337, "ground_truth": 0}, {"key": "21713119", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16026603789446925, "ground_truth": 0}, {"key": "21713119", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1907240289412481, "ground_truth": 0}, {"key": "21713119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213315870492, "ground_truth": 0}, {"key": "21713119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12940272721064333, "ground_truth": 0}, {"key": "28730678", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6566582629586132, "ground_truth": 0}, {"key": "28730678", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7401743361855861, "ground_truth": 0}, {"key": "28730678", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8164063894308735, "ground_truth": 0}, {"key": "28730678", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512023033978, "ground_truth": 0}, {"key": "28730678", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601376031618, "ground_truth": 0}, {"key": "36823733", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708944769685, "ground_truth": 0}, {"key": "36823733", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4513264980491531, "ground_truth": 0}, {"key": "36823733", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29259528444317157, "ground_truth": 0}, {"key": "36823733", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.542863305393179, "ground_truth": 0}, {"key": "36823733", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893716993767609, "ground_truth": 0}, {"key": "35988862", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25683202078331985, "ground_truth": 0}, {"key": "35988862", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31742626562073134, "ground_truth": 0}, {"key": "35988862", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31236999611045274, "ground_truth": 0}, {"key": "35988862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002867798668, "ground_truth": 0}, {"key": "35988862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336562344864546, "ground_truth": 0}, {"key": "40499665", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6740504964526189, "ground_truth": 0}, {"key": "40499665", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6057990162595058, "ground_truth": 0}, {"key": "40499665", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6808785954718053, "ground_truth": 0}, {"key": "40499665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919871884182, "ground_truth": 0}, {"key": "40499665", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316903106461, "ground_truth": 0}, {"key": "32829820", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315942956297118, "ground_truth": 0}, {"key": "32829820", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.515619934021027, "ground_truth": 0}, {"key": "32829820", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48242910119416377, "ground_truth": 0}, {"key": "32829820", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942800843206, "ground_truth": 0}, {"key": "32829820", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842639999327346, "ground_truth": 0}, {"key": "20583553", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12592276258255022, "ground_truth": 0}, {"key": "20583553", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16238003926034253, "ground_truth": 0}, {"key": "20583553", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.0809367048804901, "ground_truth": 0}, {"key": "20583553", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504680040887, "ground_truth": 0}, {"key": "20583553", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11047115905855169, "ground_truth": 0}, {"key": "30501550", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6279512046078913, "ground_truth": 0}, {"key": "30501550", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7648916006790554, "ground_truth": 0}, {"key": "30501550", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7170118804012315, "ground_truth": 0}, {"key": "30501550", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743649326699, "ground_truth": 0}, {"key": "30501550", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.633410275467293, "ground_truth": 0}, {"key": "38755897", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208212884907463, "ground_truth": 0}, {"key": "38755897", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31573596422084843, "ground_truth": 0}, {"key": "38755897", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584175062140875, "ground_truth": 0}, {"key": "38755897", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668450615257, "ground_truth": 0}, {"key": "38755897", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594948967807086, "ground_truth": 0}, {"key": "35507201", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5945512653260039, "ground_truth": 0}, {"key": "35507201", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5888891347339937, "ground_truth": 0}, {"key": "35507201", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7416740043095007, "ground_truth": 0}, {"key": "35507201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786297751919, "ground_truth": 0}, {"key": "35507201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324542392559, "ground_truth": 0}, {"key": "36453511", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6842640428341447, "ground_truth": 0}, {"key": "36453511", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7248702774307948, "ground_truth": 0}, {"key": "36453511", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5964331558079059, "ground_truth": 0}, {"key": "36453511", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213622391248, "ground_truth": 0}, {"key": "36453511", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058590991755612, "ground_truth": 0}, {"key": "38066835", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40922078004045775, "ground_truth": 0}, {"key": "38066835", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241588811069, "ground_truth": 0}, {"key": "38066835", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487714125012, "ground_truth": 0}, {"key": "38066835", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618512471742, "ground_truth": 0}, {"key": "38066835", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974734900852985, "ground_truth": 0}, {"key": "39697181", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3738758024165338, "ground_truth": 0}, {"key": "39697181", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40356684214569005, "ground_truth": 0}, {"key": "39697181", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3757064753432327, "ground_truth": 0}, {"key": "39697181", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237002559646454, "ground_truth": 0}, {"key": "39697181", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213471351375, "ground_truth": 0}, {"key": "21820893", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6095241869943921, "ground_truth": 0}, {"key": "21820893", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6076631753817284, "ground_truth": 0}, {"key": "21820893", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4765796353197557, "ground_truth": 0}, {"key": "21820893", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441199846078403, "ground_truth": 0}, {"key": "21820893", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359824687122, "ground_truth": 0}, {"key": "40519933", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5832033785743442, "ground_truth": 0}, {"key": "40519933", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3007455595027592, "ground_truth": 0}, {"key": "40519933", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46684562814795516, "ground_truth": 0}, {"key": "40519933", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167774221756, "ground_truth": 0}, {"key": "40519933", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814524635625, "ground_truth": 0}, {"key": "30446033", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5869964400871933, "ground_truth": 0}, {"key": "30446033", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3849121460564198, "ground_truth": 0}, {"key": "30446033", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46879064155998035, "ground_truth": 0}, {"key": "30446033", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073334253697181, "ground_truth": 0}, {"key": "30446033", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059959379213757, "ground_truth": 0}, {"key": "40216291", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7892336801423284, "ground_truth": 0}, {"key": "40216291", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7534666520693929, "ground_truth": 0}, {"key": "40216291", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8152324789142811, "ground_truth": 0}, {"key": "40216291", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767876078858, "ground_truth": 0}, {"key": "40216291", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.869714579823336, "ground_truth": 0}, {"key": "33479118", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36840569817721963, "ground_truth": 0}, {"key": "33479118", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2877678239867295, "ground_truth": 0}, {"key": "33479118", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3942009385112455, "ground_truth": 0}, {"key": "33479118", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359014998598861, "ground_truth": 0}, {"key": "33479118", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406483547305, "ground_truth": 0}, {"key": "22297373", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08269734072283651, "ground_truth": 0}, {"key": "22297373", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07159120082505391, "ground_truth": 0}, {"key": "22297373", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10374862617781591, "ground_truth": 0}, {"key": "22297373", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.05582314165546699, "ground_truth": 0}, {"key": "22297373", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.04603390528752139, "ground_truth": 0}, {"key": "36463668", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09268777652149134, "ground_truth": 0}, {"key": "36463668", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22000708772409366, "ground_truth": 0}, {"key": "36463668", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07585817676237634, "ground_truth": 0}, {"key": "36463668", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.02387083821418743, "ground_truth": 0}, {"key": "36463668", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713685452347348, "ground_truth": 0}, {"key": "35264615", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43974732039993336, "ground_truth": 0}, {"key": "35264615", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5234203421581709, "ground_truth": 0}, {"key": "35264615", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39793842735165924, "ground_truth": 0}, {"key": "35264615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.384912175535947, "ground_truth": 0}, {"key": "35264615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491213157559906, "ground_truth": 0}, {"key": "39898482", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6859494676298004, "ground_truth": 0}, {"key": "39898482", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8019358239490633, "ground_truth": 0}, {"key": "39898482", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7732163709318421, "ground_truth": 0}, {"key": "39898482", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936169133943, "ground_truth": 0}, {"key": "39898482", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721915093414, "ground_truth": 0}, {"key": "37228721", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5774953631087378, "ground_truth": 0}, {"key": "37228721", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6261241855219648, "ground_truth": 0}, {"key": "37228721", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6315943080444117, "ground_truth": 0}, {"key": "37228721", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593331004019, "ground_truth": 0}, {"key": "37228721", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677608314967, "ground_truth": 0}, {"key": "24535799", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9546474214048662, "ground_truth": 0}, {"key": "24535799", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9462003510328509, "ground_truth": 0}, {"key": "24535799", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9294403923617117, "ground_truth": 0}, {"key": "24535799", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9884918510732013, "ground_truth": 0}, {"key": "24535799", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263321938295, "ground_truth": 0}, {"key": "35177759", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6688802749420781, "ground_truth": 0}, {"key": "35177759", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6150878262617806, "ground_truth": 0}, {"key": "35177759", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6261241612026514, "ground_truth": 0}, {"key": "35177759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581759090077, "ground_truth": 0}, {"key": "35177759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681147912294, "ground_truth": 0}, {"key": "34364829", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4824291190355958, "ground_truth": 0}, {"key": "34364829", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3979384340221589, "ground_truth": 0}, {"key": "34364829", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5506073715042337, "ground_truth": 0}, {"key": "34364829", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073333945558775, "ground_truth": 0}, {"key": "34364829", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398146062656945, "ground_truth": 0}, {"key": "38090732", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6584174978059861, "ground_truth": 0}, {"key": "38090732", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6388352802077809, "ground_truth": 0}, {"key": "38090732", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4416729982808753, "ground_truth": 0}, {"key": "38090732", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468923168898, "ground_truth": 0}, {"key": "38090732", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073661263426986, "ground_truth": 0}, {"key": "30651479", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358327649322, "ground_truth": 0}, {"key": "30651479", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.724870272374182, "ground_truth": 0}, {"key": "30651479", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7074046971178508, "ground_truth": 0}, {"key": "30651479", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185262022323, "ground_truth": 0}, {"key": "30651479", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737186841607, "ground_truth": 0}, {"key": "39380921", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37754063689382583, "ground_truth": 0}, {"key": "39380921", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4474603005058233, "ground_truth": 0}, {"key": "39380921", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1666753993762546, "ground_truth": 0}, {"key": "39380921", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081742227695, "ground_truth": 0}, {"key": "39380921", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2436424544169541, "ground_truth": 0}, {"key": "39037490", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20055768753077302, "ground_truth": 0}, {"key": "39037490", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1127954045489685, "ground_truth": 0}, {"key": "39037490", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1721718516453964, "ground_truth": 0}, {"key": "39037490", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217184769542176, "ground_truth": 0}, {"key": "39037490", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270014506676816, "ground_truth": 0}, {"key": "35917499", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5019530977137039, "ground_truth": 0}, {"key": "35917499", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7185943725505156, "ground_truth": 0}, {"key": "35917499", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4378234901297087, "ground_truth": 0}, {"key": "35917499", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632965422348, "ground_truth": 0}, {"key": "35917499", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273164892443503, "ground_truth": 0}, {"key": "34908073", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.674050484662653, "ground_truth": 0}, {"key": "34908073", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6370307840187559, "ground_truth": 0}, {"key": "34908073", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6187804387881499, "ground_truth": 0}, {"key": "34908073", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704580757991, "ground_truth": 0}, {"key": "34908073", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269925868116, "ground_truth": 0}, {"key": "36344759", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3276682853951954, "ground_truth": 0}, {"key": "36344759", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25832599593531896, "ground_truth": 0}, {"key": "36344759", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3157359642544479, "ground_truth": 0}, {"key": "36344759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091977305424974, "ground_truth": 0}, {"key": "36344759", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534365321567604, "ground_truth": 0}, {"key": "39984637", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.372048776276045, "ground_truth": 0}, {"key": "39984637", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2974699434349993, "ground_truth": 0}, {"key": "39984637", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18952109621784272, "ground_truth": 0}, {"key": "39984637", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15102780311474276, "ground_truth": 0}, {"key": "39984637", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667541567142047, "ground_truth": 0}, {"key": "17917326", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.145115355419672, "ground_truth": 0}, {"key": "17917326", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30239109079380605, "ground_truth": 0}, {"key": "17917326", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40922078389787325, "ground_truth": 0}, {"key": "17917326", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3007455751735568, "ground_truth": 0}, {"key": "17917326", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179908934086, "ground_truth": 0}, {"key": "32193638", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4960938132340288, "ground_truth": 0}, {"key": "32193638", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49414093536537496, "ground_truth": 0}, {"key": "32193638", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6477982466374342, "ground_truth": 0}, {"key": "32193638", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165484153595, "ground_truth": 0}, {"key": "32193638", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118794111538, "ground_truth": 0}, {"key": "34564692", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2861692310329429, "ground_truth": 0}, {"key": "34564692", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7606506373164613, "ground_truth": 0}, {"key": "34564692", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093690545678, "ground_truth": 0}, {"key": "34564692", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786211772472, "ground_truth": 0}, {"key": "34564692", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704725994819, "ground_truth": 0}, {"key": "39329284", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8714748663679217, "ground_truth": 0}, {"key": "39329284", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9766692308675358, "ground_truth": 0}, {"key": "39329284", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9911526446449881, "ground_truth": 0}, {"key": "39329284", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.944994712696137, "ground_truth": 0}, {"key": "39329284", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9875683490177155, "ground_truth": 0}, {"key": "37438541", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451442645342, "ground_truth": 0}, {"key": "37438541", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4054487254169826, "ground_truth": 0}, {"key": "37438541", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2583259781595742, "ground_truth": 0}, {"key": "37438541", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106119140673282, "ground_truth": 0}, {"key": "37438541", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667158952957823, "ground_truth": 0}, {"key": "34652757", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6477982194444053, "ground_truth": 0}, {"key": "34652757", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938251248429, "ground_truth": 0}, {"key": "34652757", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5755880220140409, "ground_truth": 0}, {"key": "34652757", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883266762364, "ground_truth": 0}, {"key": "34652757", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786246325254, "ground_truth": 0}, {"key": "31361004", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44167300479302507, "ground_truth": 0}, {"key": "31361004", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47852883674441604, "ground_truth": 0}, {"key": "31361004", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6424324868105427, "ground_truth": 0}, {"key": "31361004", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833742013322, "ground_truth": 0}, {"key": "31361004", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702534320368, "ground_truth": 0}, {"key": "26150727", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18713267345627563, "ground_truth": 0}, {"key": "26150727", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1895210830205837, "ground_truth": 0}, {"key": "26150727", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15405757048767896, "ground_truth": 0}, {"key": "26150727", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539586354194, "ground_truth": 0}, {"key": "26150727", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651622349086765, "ground_truth": 0}, {"key": "36997402", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.640635846482728, "ground_truth": 0}, {"key": "36997402", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241671159571, "ground_truth": 0}, {"key": "36997402", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6706082604318823, "ground_truth": 0}, {"key": "36997402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689398243049, "ground_truth": 0}, {"key": "36997402", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389726827062, "ground_truth": 0}, {"key": "37430643", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4843801152795406, "ground_truth": 0}, {"key": "37430643", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880348751949, "ground_truth": 0}, {"key": "37430643", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7233094496021286, "ground_truth": 0}, {"key": "37430643", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765016016573, "ground_truth": 0}, {"key": "37430643", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744735772953, "ground_truth": 0}, {"key": "36964631", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6584175213315939, "ground_truth": 0}, {"key": "36964631", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7122322136506211, "ground_truth": 0}, {"key": "36964631", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5983121963214275, "ground_truth": 0}, {"key": "36964631", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867862496854, "ground_truth": 0}, {"key": "36964631", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416407135122, "ground_truth": 0}, {"key": "35502013", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4629586124173056, "ground_truth": 0}, {"key": "35502013", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4513265031253738, "ground_truth": 0}, {"key": "35502013", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2925952807188273, "ground_truth": 0}, {"key": "35502013", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213926604412, "ground_truth": 0}, {"key": "35502013", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711613332067, "ground_truth": 0}, {"key": "33987664", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5602526640955372, "ground_truth": 0}, {"key": "33987664", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7074046913319901, "ground_truth": 0}, {"key": "33987664", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584175161614445, "ground_truth": 0}, {"key": "33987664", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061582637351, "ground_truth": 0}, {"key": "33987664", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935292394707, "ground_truth": 0}, {"key": "35203721", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42823338743029776, "ground_truth": 0}, {"key": "35203721", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.517570882130143, "ground_truth": 0}, {"key": "35203721", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30404169156390737, "ground_truth": 0}, {"key": "35203721", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416729953732482, "ground_truth": 0}, {"key": "35203721", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687307853943233, "ground_truth": 0}, {"key": "39028348", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6261241627692142, "ground_truth": 0}, {"key": "39028348", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7310585582192022, "ground_truth": 0}, {"key": "39028348", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7490871882038275, "ground_truth": 0}, {"key": "39028348", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513264785930815, "ground_truth": 0}, {"key": "39028348", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935292807907, "ground_truth": 0}, {"key": "37459383", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.616935820810667, "ground_truth": 0}, {"key": "37459383", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7401743645661576, "ground_truth": 0}, {"key": "37459383", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6513548565353293, "ground_truth": 0}, {"key": "37459383", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701101119957, "ground_truth": 0}, {"key": "37459383", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787442934099, "ground_truth": 0}, {"key": "34020070", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047584956134834, "ground_truth": 0}, {"key": "34020070", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29259530339315115, "ground_truth": 0}, {"key": "34020070", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3345894314887427, "ground_truth": 0}, {"key": "34020070", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922081090506196, "ground_truth": 0}, {"key": "34020070", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490155081038187, "ground_truth": 0}, {"key": "35176615", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7279754649312749, "ground_truth": 0}, {"key": "35176615", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7356416356417862, "ground_truth": 0}, {"key": "35176615", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4649015606931008, "ground_truth": 0}, {"key": "35176615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.622459341017425, "ground_truth": 0}, {"key": "35176615", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416500541076, "ground_truth": 0}, {"key": "33296389", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48047867757274926, "ground_truth": 0}, {"key": "33296389", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6279512089379714, "ground_truth": 0}, {"key": "33296389", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7461389694587706, "ground_truth": 0}, {"key": "33296389", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990142750086, "ground_truth": 0}, {"key": "33296389", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389998248452, "ground_truth": 0}, {"key": "35399504", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4726834783198206, "ground_truth": 0}, {"key": "35399504", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7310586069191483, "ground_truth": 0}, {"key": "35399504", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8661325144923689, "ground_truth": 0}, {"key": "35399504", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321854650196, "ground_truth": 0}, {"key": "35399504", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619141302175, "ground_truth": 0}, {"key": "34807886", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26133091475450054, "ground_truth": 0}, {"key": "34807886", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3575675524256989, "ground_truth": 0}, {"key": "34807886", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3007455719782825, "ground_truth": 0}, {"key": "34807886", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357437829034326, "ground_truth": 0}, {"key": "34807886", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3504214079058184, "ground_truth": 0}, {"key": "37629813", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3720487723898403, "ground_truth": 0}, {"key": "37629813", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34510526294774196, "ground_truth": 0}, {"key": "37629813", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3923367999046138, "ground_truth": 0}, {"key": "37629813", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108738725888, "ground_truth": 0}, {"key": "37629813", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423542102918423, "ground_truth": 0}, {"key": "28084389", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2509127671165832, "ground_truth": 0}, {"key": "28084389", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5506073507517221, "ground_truth": 0}, {"key": "28084389", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4629586253114976, "ground_truth": 0}, {"key": "28084389", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307653335715, "ground_truth": 0}, {"key": "28084389", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242912054426207, "ground_truth": 0}, {"key": "35391734", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11357959294823936, "ground_truth": 0}, {"key": "35391734", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46879062968445945, "ground_truth": 0}, {"key": "35391734", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47657964849089884, "ground_truth": 0}, {"key": "35391734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679365999517374, "ground_truth": 0}, {"key": "35391734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761114774581, "ground_truth": 0}, {"key": "40214591", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48438009811054755, "ground_truth": 0}, {"key": "40214591", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25683197462863033, "ground_truth": 0}, {"key": "40214591", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31573597025681926, "ground_truth": 0}, {"key": "40214591", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937838723720635, "ground_truth": 0}, {"key": "40214591", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314737307280347, "ground_truth": 0}, {"key": "26283171", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819575530621, "ground_truth": 0}, {"key": "26283171", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5409238744896979, "ground_truth": 0}, {"key": "26283171", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33982761292139624, "ground_truth": 0}, {"key": "26283171", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723729743578, "ground_truth": 0}, {"key": "26283171", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870291279141, "ground_truth": 0}, {"key": "37084030", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20181320522890012, "ground_truth": 0}, {"key": "37084030", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2523840405105019, "ground_truth": 0}, {"key": "37084030", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2958398653625838, "ground_truth": 0}, {"key": "37084030", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077460247895324, "ground_truth": 0}, {"key": "37084030", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930801041175797, "ground_truth": 0}, {"key": "39027295", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10970577704302317, "ground_truth": 0}, {"key": "39027295", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2309197686963594, "ground_truth": 0}, {"key": "39027295", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24220560884478387, "ground_truth": 0}, {"key": "39027295", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244119912378966, "ground_truth": 0}, {"key": "39027295", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733339217250447, "ground_truth": 0}, {"key": "14018647", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2751297310383534, "ground_truth": 0}, {"key": "14018647", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1460872365364184, "ground_truth": 0}, {"key": "14018647", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18952110062543487, "ground_truth": 0}, {"key": "14018647", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946967977517822, "ground_truth": 0}, {"key": "14018647", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2186693803341305, "ground_truth": 0}, {"key": "37424289", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.74908723292774, "ground_truth": 0}, {"key": "37424289", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7648916110805843, "ground_truth": 0}, {"key": "37424289", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8311430346133946, "ground_truth": 0}, {"key": "37424289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894602833613, "ground_truth": 0}, {"key": "37424289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321968540127, "ground_truth": 0}, {"key": "37498031", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0920328506921794, "ground_truth": 0}, {"key": "37498031", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11279540501623074, "ground_truth": 0}, {"key": "37498031", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1530421561552975, "ground_truth": 0}, {"key": "37498031", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895587522775136, "ground_truth": 0}, {"key": "37498031", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132024100527464, "ground_truth": 0}, {"key": "30104095", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7520125876138704, "ground_truth": 0}, {"key": "30104095", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8255897162987059, "ground_truth": 0}, {"key": "30104095", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5195213323374612, "ground_truth": 0}, {"key": "30104095", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073834903791, "ground_truth": 0}, {"key": "30104095", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995567050729, "ground_truth": 0}, {"key": "37911407", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.824461914539713, "ground_truth": 0}, {"key": "37911407", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7041601238220716, "ground_truth": 0}, {"key": "37911407", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7799929105826983, "ground_truth": 0}, {"key": "37911407", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122865454109, "ground_truth": 0}, {"key": "37911407", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325196322713, "ground_truth": 0}, {"key": "39177472", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.631594301329246, "ground_truth": 0}, {"key": "39177472", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6636689551193196, "ground_truth": 0}, {"key": "39177472", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5136684819679406, "ground_truth": 0}, {"key": "39177472", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358559527979, "ground_truth": 0}, {"key": "39177472", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216114004316, "ground_truth": 0}, {"key": "32325454", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8006919950288884, "ground_truth": 0}, {"key": "32325454", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40356684187826564, "ground_truth": 0}, {"key": "32325454", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.546738194804445, "ground_truth": 0}, {"key": "32325454", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233683006626874, "ground_truth": 0}, {"key": "32325454", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793841162589666, "ground_truth": 0}, {"key": "38395319", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48047869117931163, "ground_truth": 0}, {"key": "38395319", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756750556548317, "ground_truth": 0}, {"key": "38395319", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3720487768554799, "ground_truth": 0}, {"key": "38395319", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315503839435, "ground_truth": 0}, {"key": "38395319", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.594551245209881, "ground_truth": 0}, {"key": "38235895", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20181323835205012, "ground_truth": 0}, {"key": "38235895", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1329642373073931, "ground_truth": 0}, {"key": "38235895", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2814056146053416, "ground_truth": 0}, {"key": "38235895", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133092225116733, "ground_truth": 0}, {"key": "38235895", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081388596171, "ground_truth": 0}, {"key": "26543267", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16132022882025662, "ground_truth": 0}, {"key": "26543267", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26284185250882947, "ground_truth": 0}, {"key": "26543267", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19930798818376816, "ground_truth": 0}, {"key": "26543267", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19682620398176656, "ground_truth": 0}, {"key": "26543267", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1699562246705429, "ground_truth": 0}, {"key": "39054728", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9826909044826856, "ground_truth": 0}, {"key": "39054728", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9804313242361623, "ground_truth": 0}, {"key": "39054728", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9224823413264436, "ground_truth": 0}, {"key": "39054728", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813523079626, "ground_truth": 0}, {"key": "39054728", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9764905488796337, "ground_truth": 0}, {"key": "39158443", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7341195118443006, "ground_truth": 0}, {"key": "39158443", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48633153728641526, "ground_truth": 0}, {"key": "39158443", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6909762683042756, "ground_truth": 0}, {"key": "39158443", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210766495534, "ground_truth": 0}, {"key": "39158443", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324636973997, "ground_truth": 0}, {"key": "36254201", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4455295398661148, "ground_truth": 0}, {"key": "36254201", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3468730965541212, "ground_truth": 0}, {"key": "36254201", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.581303093449843, "ground_truth": 0}, {"key": "36254201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684559090737004, "ground_truth": 0}, {"key": "36254201", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4493926191849534, "ground_truth": 0}, {"key": "23434347", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43974732874321387, "ground_truth": 0}, {"key": "23434347", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1931473824044123, "ground_truth": 0}, {"key": "23434347", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6150878417079864, "ground_truth": 0}, {"key": "23434347", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906462927728, "ground_truth": 0}, {"key": "23434347", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543989406645, "ground_truth": 0}, {"key": "34397620", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29098084043718137, "ground_truth": 0}, {"key": "34397620", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15610490595198875, "ground_truth": 0}, {"key": "34397620", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3276682949765886, "ground_truth": 0}, {"key": "34397620", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782568135660094, "ground_truth": 0}, {"key": "34397620", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730883781571, "ground_truth": 0}, {"key": "34340916", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39793839494234184, "ground_truth": 0}, {"key": "34340916", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1907240294170039, "ground_truth": 0}, {"key": "34340916", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24798742236266558, "ground_truth": 0}, {"key": "34340916", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195966085224, "ground_truth": 0}, {"key": "34340916", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681409861306, "ground_truth": 0}, {"key": "30375089", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5350984185877605, "ground_truth": 0}, {"key": "30375089", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3328523154095701, "ground_truth": 0}, {"key": "30375089", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3415824848165336, "ground_truth": 0}, {"key": "30375089", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917171652965, "ground_truth": 0}, {"key": "30375089", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165600443073, "ground_truth": 0}, {"key": "35807797", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5506073234066303, "ground_truth": 0}, {"key": "35807797", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058591050584824, "ground_truth": 0}, {"key": "35807797", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8333245935206821, "ground_truth": 0}, {"key": "35807797", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545507432512, "ground_truth": 0}, {"key": "35807797", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673137898984, "ground_truth": 0}, {"key": "34188172", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5195212994945797, "ground_truth": 0}, {"key": "34188172", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3363310705080811, "ground_truth": 0}, {"key": "34188172", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40922077540885293, "ground_truth": 0}, {"key": "34188172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047868177023767, "ground_truth": 0}, {"key": "34188172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921739326547485, "ground_truth": 0}, {"key": "37075567", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8354835451143393, "ground_truth": 0}, {"key": "37075567", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8267117904509252, "ground_truth": 0}, {"key": "37075567", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8652240822934855, "ground_truth": 0}, {"key": "37075567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942090484845, "ground_truth": 0}, {"key": "37075567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037365288207, "ground_truth": 0}, {"key": "35559735", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5312093686962036, "ground_truth": 0}, {"key": "35559735", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476839887954, "ground_truth": 0}, {"key": "35559735", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6406358444157019, "ground_truth": 0}, {"key": "35559735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981868103254433, "ground_truth": 0}, {"key": "35559735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601320481005, "ground_truth": 0}, {"key": "33005019", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4765796575844681, "ground_truth": 0}, {"key": "33005019", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263215850924159, "ground_truth": 0}, {"key": "33005019", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8333245886335847, "ground_truth": 0}, {"key": "33005019", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585891017753, "ground_truth": 0}, {"key": "33005019", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880012729362, "ground_truth": 0}, {"key": "30808252", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3174262454554883, "ground_truth": 0}, {"key": "30808252", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34687309891042434, "ground_truth": 0}, {"key": "30808252", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35042139808540224, "ground_truth": 0}, {"key": "30808252", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.466845607140811, "ground_truth": 0}, {"key": "30808252", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042139243423376, "ground_truth": 0}, {"key": "15159017", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526700615683, "ground_truth": 0}, {"key": "15159017", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5331543691936795, "ground_truth": 0}, {"key": "15159017", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058591031122601, "ground_truth": 0}, {"key": "15159017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791777451209, "ground_truth": 0}, {"key": "15159017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082902796657, "ground_truth": 0}, {"key": "24493400", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2974699441366037, "ground_truth": 0}, {"key": "24493400", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568319731785578, "ground_truth": 0}, {"key": "24493400", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38121955397085283, "ground_truth": 0}, {"key": "24493400", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825678711135043, "ground_truth": 0}, {"key": "24493400", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4205996099082356, "ground_truth": 0}, {"key": "37791071", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6723317163071985, "ground_truth": 0}, {"key": "37791071", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6169358409794969, "ground_truth": 0}, {"key": "37791071", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7490872045912886, "ground_truth": 0}, {"key": "37791071", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.783988473635665, "ground_truth": 0}, {"key": "37791071", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030907625804, "ground_truth": 0}, {"key": "33528627", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5389832239922502, "ground_truth": 0}, {"key": "33528627", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241481952223, "ground_truth": 0}, {"key": "33528627", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6654105616461381, "ground_truth": 0}, {"key": "33528627", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366058884517, "ground_truth": 0}, {"key": "33528627", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585897357729, "ground_truth": 0}, {"key": "39925662", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7905303122338391, "ground_truth": 0}, {"key": "39925662", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8807970766572799, "ground_truth": 0}, {"key": "39925662", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7592254099233339, "ground_truth": 0}, {"key": "39925662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267118084693825, "ground_truth": 0}, {"key": "39925662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637514433365, "ground_truth": 0}, {"key": "29213416", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08035746706200352, "ground_truth": 0}, {"key": "29213416", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28776779833658, "ground_truth": 0}, {"key": "29213416", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33982759507998844, "ground_truth": 0}, {"key": "29213416", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953522855699213, "ground_truth": 0}, {"key": "29213416", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27982849104361496, "ground_truth": 0}, {"key": "34492745", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231014196814984, "ground_truth": 0}, {"key": "34492745", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12765261891726956, "ground_truth": 0}, {"key": "34492745", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38306419369083367, "ground_truth": 0}, {"key": "34492745", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850362277874, "ground_truth": 0}, {"key": "34492745", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881427894279, "ground_truth": 0}, {"key": "34191937", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32594952512917635, "ground_truth": 0}, {"key": "34191937", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10374862602895983, "ground_truth": 0}, {"key": "34191937", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869690867053405, "ground_truth": 0}, {"key": "34191937", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276061113392, "ground_truth": 0}, {"key": "34191937", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912138771837895, "ground_truth": 0}, {"key": "34933372", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5660185485635177, "ground_truth": 0}, {"key": "34933372", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5195213228815987, "ground_truth": 0}, {"key": "34933372", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44552952499565757, "ground_truth": 0}, {"key": "34933372", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746126330601, "ground_truth": 0}, {"key": "34933372", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891086688303, "ground_truth": 0}, {"key": "38714379", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8322366507442412, "ground_truth": 0}, {"key": "38714379", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7620701112461572, "ground_truth": 0}, {"key": "38714379", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8723473778230441, "ground_truth": 0}, {"key": "38714379", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445520057011, "ground_truth": 0}, {"key": "38714379", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737954451312, "ground_truth": 0}, {"key": "39220660", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7490872022168054, "ground_truth": 0}, {"key": "39220660", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7813306288697789, "ground_truth": 0}, {"key": "39220660", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7505527694787469, "ground_truth": 0}, {"key": "39220660", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527970310888, "ground_truth": 0}, {"key": "39220660", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195142830378, "ground_truth": 0}, {"key": "41028780", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6224593212261368, "ground_truth": 0}, {"key": "41028780", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7008948209369494, "ground_truth": 0}, {"key": "41028780", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7090191333548143, "ground_truth": 0}, {"key": "41028780", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094761833185, "ground_truth": 0}, {"key": "41028780", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118908225375, "ground_truth": 0}, {"key": "39457108", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5019531189308041, "ground_truth": 0}, {"key": "39457108", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4493926427943439, "ground_truth": 0}, {"key": "39457108", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5195212997761447, "ground_truth": 0}, {"key": "39457108", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.816406373614518, "ground_truth": 0}, {"key": "39457108", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.519521321429688, "ground_truth": 0}, {"key": "38288018", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21206882181834089, "ground_truth": 0}, {"key": "38288018", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.056236347031632127, "ground_truth": 0}, {"key": "38288018", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10447731568604736, "ground_truth": 0}, {"key": "38288018", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1721718435571313, "ground_truth": 0}, {"key": "38288018", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575739914733, "ground_truth": 0}, {"key": "40106293", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2766905217466145, "ground_truth": 0}, {"key": "40106293", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47073662814716605, "ground_truth": 0}, {"key": "40106293", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3242354119343485, "ground_truth": 0}, {"key": "40106293", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633103674541653, "ground_truth": 0}, {"key": "40106293", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051940332528, "ground_truth": 0}, {"key": "39948797", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7476159450395218, "ground_truth": 0}, {"key": "39948797", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8300437629175521, "ground_truth": 0}, {"key": "39948797", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6688802686288843, "ground_truth": 0}, {"key": "39948797", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759865876081, "ground_truth": 0}, {"key": "39948797", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445497295056, "ground_truth": 0}, {"key": "31853399", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9407897474387213, "ground_truth": 0}, {"key": "31853399", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7981867903594466, "ground_truth": 0}, {"key": "31853399", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8955226783017203, "ground_truth": 0}, {"key": "31853399", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840454267346, "ground_truth": 0}, {"key": "31853399", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907177446604, "ground_truth": 0}, {"key": "35273252", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06142404495903616, "ground_truth": 0}, {"key": "35273252", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.08210663350153519, "ground_truth": 0}, {"key": "35273252", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.0940101775698911, "ground_truth": 0}, {"key": "35273252", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08329192597421924, "ground_truth": 0}, {"key": "35273252", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.06512754147498663, "ground_truth": 0}, {"key": "37130459", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621764974440631, "ground_truth": 0}, {"key": "37130459", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582743360649, "ground_truth": 0}, {"key": "37130459", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5563995707454695, "ground_truth": 0}, {"key": "37130459", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121956151511016, "ground_truth": 0}, {"key": "37130459", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786116182913, "ground_truth": 0}, {"key": "21734003", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3611647243998756, "ground_truth": 0}, {"key": "21734003", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6774739790947295, "ground_truth": 0}, {"key": "21734003", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6477982180058377, "ground_truth": 0}, {"key": "21734003", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.535098425966061, "ground_truth": 0}, {"key": "21734003", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881466007849, "ground_truth": 0}, {"key": "33990737", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.287767788559732, "ground_truth": 0}, {"key": "33990737", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47268346724347526, "ground_truth": 0}, {"key": "33990737", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39606817577064485, "ground_truth": 0}, {"key": "33990737", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618508060392, "ground_truth": 0}, {"key": "33990737", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.507811875612108, "ground_truth": 0}, {"key": "34559912", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8006919926392053, "ground_truth": 0}, {"key": "34559912", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7201714893832779, "ground_truth": 0}, {"key": "34559912", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8872045925440316, "ground_truth": 0}, {"key": "34559912", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631485412511, "ground_truth": 0}, {"key": "34559912", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416656192881, "ground_truth": 0}, {"key": "39820439", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13386749883764565, "ground_truth": 0}, {"key": "39820439", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2643583307326838, "ground_truth": 0}, {"key": "39820439", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3867634460007818, "ground_truth": 0}, {"key": "39820439", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307463280211455, "ground_truth": 0}, {"key": "39820439", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469140819482976, "ground_truth": 0}, {"key": "34759328", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7577943580361384, "ground_truth": 0}, {"key": "34759328", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8187367880913284, "ground_truth": 0}, {"key": "34759328", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6424325017842688, "ground_truth": 0}, {"key": "34759328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673201349297, "ground_truth": 0}, {"key": "34759328", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849752181528, "ground_truth": 0}, {"key": "36939137", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653333577652098, "ground_truth": 0}, {"key": "36939137", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5851011364653368, "ground_truth": 0}, {"key": "36939137", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186969191578906, "ground_truth": 0}, {"key": "36939137", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634418807708, "ground_truth": 0}, {"key": "36939137", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218815806073196, "ground_truth": 0}, {"key": "35851522", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7732163796658134, "ground_truth": 0}, {"key": "35851522", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5717665867421566, "ground_truth": 0}, {"key": "35851522", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4921881242559767, "ground_truth": 0}, {"key": "35851522", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487612345899, "ground_truth": 0}, {"key": "35851522", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527554289861, "ground_truth": 0}, {"key": "22412782", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.573678427344031, "ground_truth": 0}, {"key": "22412782", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40356684212111893, "ground_truth": 0}, {"key": "22412782", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3225259794374314, "ground_truth": 0}, {"key": "22412782", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093594304559, "ground_truth": 0}, {"key": "22412782", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270060730714, "ground_truth": 0}, {"key": "38579227", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47463117497029345, "ground_truth": 0}, {"key": "38579227", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880074865697, "ground_truth": 0}, {"key": "38579227", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30074558667321427, "ground_truth": 0}, {"key": "38579227", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004196911744, "ground_truth": 0}, {"key": "38579227", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118447412004, "ground_truth": 0}, {"key": "37206995", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46684556208161154, "ground_truth": 0}, {"key": "37206995", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5078118436298743, "ground_truth": 0}, {"key": "37206995", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4902356041482164, "ground_truth": 0}, {"key": "37206995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632940729086, "ground_truth": 0}, {"key": "37206995", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413875117976, "ground_truth": 0}, {"key": "38700847", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6636689590929035, "ground_truth": 0}, {"key": "38700847", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8376199824995665, "ground_truth": 0}, {"key": "38700847", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8278281406865308, "ground_truth": 0}, {"key": "38700847", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.762070106905053, "ground_truth": 0}, {"key": "38700847", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984148381993, "ground_truth": 0}, {"key": "20246590", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.958537727763743, "ground_truth": 0}, {"key": "20246590", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9850429143050855, "ground_truth": 0}, {"key": "20246590", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9902161237038564, "ground_truth": 0}, {"key": "20246590", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9726235099833406, "ground_truth": 0}, {"key": "20246590", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9778834109260022, "ground_truth": 0}, {"key": "39141360", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6959583360255939, "ground_truth": 0}, {"key": "39141360", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6774740291985302, "ground_truth": 0}, {"key": "39141360", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7786493284043594, "ground_truth": 0}, {"key": "39141360", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070058768508, "ground_truth": 0}, {"key": "39141360", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583286643474, "ground_truth": 0}, {"key": "37906226", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19193279092597967, "ground_truth": 0}, {"key": "37906226", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23370636090270216, "ground_truth": 0}, {"key": "37906226", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13117322627647965, "ground_truth": 0}, {"key": "37906226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.06804041692108992, "ground_truth": 0}, {"key": "37906226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08389039189461965, "ground_truth": 0}, {"key": "16201033", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2160115311610536, "ground_truth": 0}, {"key": "16201033", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3191213773128205, "ground_truth": 0}, {"key": "16201033", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3923368329687432, "ground_truth": 0}, {"key": "16201033", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681882923411, "ground_truth": 0}, {"key": "16201033", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733340386008016, "ground_truth": 0}, {"key": "36469022", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6619228833736236, "ground_truth": 0}, {"key": "36469022", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4980468833536435, "ground_truth": 0}, {"key": "36469022", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.583203338091487, "ground_truth": 0}, {"key": "36469022", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982095663827, "ground_truth": 0}, {"key": "36469022", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324500271871, "ground_truth": 0}, {"key": "31295270", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11279541461257427, "ground_truth": 0}, {"key": "31295270", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35398630698404265, "ground_truth": 0}, {"key": "31295270", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08389037683739281, "ground_truth": 0}, {"key": "31295270", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073549545835717, "ground_truth": 0}, {"key": "31295270", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.06512754631258812, "ground_truth": 0}, {"key": "35360689", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30902370256451767, "ground_truth": 0}, {"key": "35360689", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15713685797425092, "ground_truth": 0}, {"key": "35360689", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1259227635648397, "ground_truth": 0}, {"key": "35360689", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733754011322115, "ground_truth": 0}, {"key": "35360689", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792992653792322, "ground_truth": 0}, {"key": "29202793", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3398276157240406, "ground_truth": 0}, {"key": "29202793", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13846179166145053, "ground_truth": 0}, {"key": "29202793", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2568319940402842, "ground_truth": 0}, {"key": "29202793", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077459708235371, "ground_truth": 0}, {"key": "29202793", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407745976067892, "ground_truth": 0}, {"key": "35999008", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318414676467, "ground_truth": 0}, {"key": "35999008", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756752343135634, "ground_truth": 0}, {"key": "35999008", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7620700946846978, "ground_truth": 0}, {"key": "35999008", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850120128595, "ground_truth": 0}, {"key": "35999008", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548831117592, "ground_truth": 0}, {"key": "31797119", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7620701018789997, "ground_truth": 0}, {"key": "31797119", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4016878066162757, "ground_truth": 0}, {"key": "31797119", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6926419886603998, "ground_truth": 0}, {"key": "31797119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723869948887, "ground_truth": 0}, {"key": "31797119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.538983228320767, "ground_truth": 0}, {"key": "26711893", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2583259791432011, "ground_truth": 0}, {"key": "26711893", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49609384624623065, "ground_truth": 0}, {"key": "26711893", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37204879170135624, "ground_truth": 0}, {"key": "26711893", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.377540655225768, "ground_truth": 0}, {"key": "26711893", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19806416603847102, "ground_truth": 0}, {"key": "35348288", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3259495155966391, "ground_truth": 0}, {"key": "35348288", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4804786927107644, "ground_truth": 0}, {"key": "35348288", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4244119801278424, "ground_truth": 0}, {"key": "35348288", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017613971394, "ground_truth": 0}, {"key": "35348288", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939261722827806, "ground_truth": 0}, {"key": "38124131", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0881900402954718, "ground_truth": 0}, {"key": "38124131", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07263669876337503, "ground_truth": 0}, {"key": "38124131", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.082106624221845, "ground_truth": 0}, {"key": "38124131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405756411711496, "ground_truth": 0}, {"key": "38124131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421299841335945, "ground_truth": 0}, {"key": "20285901", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4921881221935903, "ground_truth": 0}, {"key": "20285901", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3073580110202409, "ground_truth": 0}, {"key": "20285901", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3123699977764373, "ground_truth": 0}, {"key": "20285901", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225260029252173, "ground_truth": 0}, {"key": "20285901", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569734953078675, "ground_truth": 0}, {"key": "35633632", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117166267136585, "ground_truth": 0}, {"key": "35633632", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5370413986927894, "ground_truth": 0}, {"key": "35633632", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48047867950074685, "ground_truth": 0}, {"key": "35633632", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.403566865692371, "ground_truth": 0}, {"key": "35633632", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761436377277, "ground_truth": 0}, {"key": "10741274", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4092207958172939, "ground_truth": 0}, {"key": "10741274", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26588049628756605, "ground_truth": 0}, {"key": "10741274", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30735800171329763, "ground_truth": 0}, {"key": "10741274", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011782346875, "ground_truth": 0}, {"key": "10741274", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206339158501533, "ground_truth": 0}, {"key": "30605795", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117165800710145, "ground_truth": 0}, {"key": "30605795", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5156199052576658, "ground_truth": 0}, {"key": "30605795", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6132365271162092, "ground_truth": 0}, {"key": "30605795", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791935081457, "ground_truth": 0}, {"key": "30605795", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631590138942, "ground_truth": 0}, {"key": "30539722", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "30539722", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5832033455787307, "ground_truth": 0}, {"key": "30539722", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4474602945392827, "ground_truth": 0}, {"key": "30539722", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.418696882522783, "ground_truth": 0}, {"key": "30539722", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765206467066, "ground_truth": 0}, {"key": "18639299", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23370634272351076, "ground_truth": 0}, {"key": "18639299", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539863127441539, "ground_truth": 0}, {"key": "18639299", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18594721282025353, "ground_truth": 0}, {"key": "18639299", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245364250183, "ground_truth": 0}, {"key": "18639299", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364243469062694, "ground_truth": 0}, {"key": "39773552", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5058591187655412, "ground_truth": 0}, {"key": "39773552", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48438007163416386, "ground_truth": 0}, {"key": "39773552", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3812195773835612, "ground_truth": 0}, {"key": "39773552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758165532013, "ground_truth": 0}, {"key": "39773552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165899992291, "ground_truth": 0}, {"key": "34086410", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26284185558078377, "ground_truth": 0}, {"key": "34086410", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09334687832312387, "ground_truth": 0}, {"key": "34086410", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34334173913349064, "ground_truth": 0}, {"key": "34086410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16885695509286636, "ground_truth": 0}, {"key": "34086410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754069669414975, "ground_truth": 0}, {"key": "35454652", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4416730123608033, "ground_truth": 0}, {"key": "35454652", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7563575579131451, "ground_truth": 0}, {"key": "35454652", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5331544227861714, "ground_truth": 0}, {"key": "35454652", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218814555207546, "ground_truth": 0}, {"key": "35454652", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413951159697, "ground_truth": 0}, {"key": "36158310", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49218813292859964, "ground_truth": 0}, {"key": "36158310", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37937838402289215, "ground_truth": 0}, {"key": "36158310", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3979384179777053, "ground_truth": 0}, {"key": "36158310", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35042137563718806, "ground_truth": 0}, {"key": "36158310", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512973186005324, "ground_truth": 0}, {"key": "35688387", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.032100706776657016, "ground_truth": 0}, {"key": "35688387", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061602876838, "ground_truth": 0}, {"key": "35688387", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.046724958436877136, "ground_truth": 0}, {"key": "35688387", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.04742587067984774, "ground_truth": 0}, {"key": "35688387", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.038756194485828274, "ground_truth": 0}, {"key": "34209292", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8407825996476154, "ground_truth": 0}, {"key": "34209292", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21866939548676373, "ground_truth": 0}, {"key": "34209292", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7025300650071198, "ground_truth": 0}, {"key": "34209292", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199549412296, "ground_truth": 0}, {"key": "34209292", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762936832652, "ground_truth": 0}, {"key": "25037859", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4320633689272633, "ground_truth": 0}, {"key": "25037859", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46295860448298815, "ground_truth": 0}, {"key": "25037859", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487204436436, "ground_truth": 0}, {"key": "25037859", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022538497791585, "ground_truth": 0}, {"key": "25037859", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508500403124997, "ground_truth": 0}, {"key": "36412121", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7476159478749558, "ground_truth": 0}, {"key": "36412121", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442251162406893, "ground_truth": 0}, {"key": "36412121", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7620700990117913, "ground_truth": 0}, {"key": "36412121", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089090555756, "ground_truth": 0}, {"key": "36412121", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688316255591, "ground_truth": 0}, {"key": "34909172", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5869964388735351, "ground_truth": 0}, {"key": "34909172", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4359015419693738, "ground_truth": 0}, {"key": "34909172", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4436004153988167, "ground_truth": 0}, {"key": "34909172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408797625663, "ground_truth": 0}, {"key": "34909172", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014734628880924, "ground_truth": 0}, {"key": "39011806", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2553436607275658, "ground_truth": 0}, {"key": "39011806", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42823340168979934, "ground_truth": 0}, {"key": "39011806", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487359215385, "ground_truth": 0}, {"key": "39011806", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713269308943442, "ground_truth": 0}, {"key": "39011806", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14033624680647544, "ground_truth": 0}, {"key": "33096163", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4571367355375298, "ground_truth": 0}, {"key": "33096163", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6279512383355292, "ground_truth": 0}, {"key": "33096163", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.552539700865981, "ground_truth": 0}, {"key": "33096163", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123699781986756, "ground_truth": 0}, {"key": "33096163", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531365853274, "ground_truth": 0}, {"key": "38762205", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7170118644370423, "ground_truth": 0}, {"key": "38762205", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7325918294847228, "ground_truth": 0}, {"key": "38762205", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6842640255730653, "ground_truth": 0}, {"key": "38762205", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714981114997, "ground_truth": 0}, {"key": "38762205", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.741673999919705, "ground_truth": 0}, {"key": "35519177", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4359015202158414, "ground_truth": 0}, {"key": "35519177", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1732882170075862, "ground_truth": 0}, {"key": "35519177", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6132365524987526, "ground_truth": 0}, {"key": "35519177", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350561444694, "ground_truth": 0}, {"key": "35519177", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033623664806, "ground_truth": 0}, {"key": "36192531", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39793841605435143, "ground_truth": 0}, {"key": "36192531", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4590761542365221, "ground_truth": 0}, {"key": "36192531", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4397473588614245, "ground_truth": 0}, {"key": "36192531", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238771236691, "ground_truth": 0}, {"key": "36192531", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.484380080968595, "ground_truth": 0}, {"key": "33160852", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19193280916159464, "ground_truth": 0}, {"key": "33160852", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7264255909215723, "ground_truth": 0}, {"key": "33160852", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5136684761590969, "ground_truth": 0}, {"key": "33160852", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539862812564256, "ground_truth": 0}, {"key": "33160852", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43782350696984346, "ground_truth": 0}, {"key": "36312304", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2735743668801248, "ground_truth": 0}, {"key": "36312304", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3345894564964899, "ground_truth": 0}, {"key": "36312304", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5869964536950834, "ground_truth": 0}, {"key": "36312304", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073662142120065, "ground_truth": 0}, {"key": "36312304", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180366830267, "ground_truth": 0}, {"key": "33773343", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3647775716385815, "ground_truth": 0}, {"key": "33773343", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30902370666764484, "ground_truth": 0}, {"key": "33773343", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953519929856414, "ground_truth": 0}, {"key": "33773343", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744337288015, "ground_truth": 0}, {"key": "33773343", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223188496578396, "ground_truth": 0}, {"key": "34913320", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6876299819874654, "ground_truth": 0}, {"key": "34913320", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5370413910684787, "ground_truth": 0}, {"key": "34913320", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43206339648341663, "ground_truth": 0}, {"key": "34913320", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082571234432, "ground_truth": 0}, {"key": "34913320", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306139248621, "ground_truth": 0}, {"key": "33784155", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.544801384288695, "ground_truth": 0}, {"key": "33784155", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.740174355407908, "ground_truth": 0}, {"key": "33784155", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6619228807569263, "ground_truth": 0}, {"key": "33784155", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358463377676, "ground_truth": 0}, {"key": "33784155", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512344292879, "ground_truth": 0}, {"key": "24085062", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9637799428989817, "ground_truth": 0}, {"key": "24085062", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9855521489002551, "ground_truth": 0}, {"key": "24085062", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9671630444134811, "ground_truth": 0}, {"key": "24085062", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892688464559, "ground_truth": 0}, {"key": "24085062", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.934872456624119, "ground_truth": 0}, {"key": "33893487", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14223190834804242, "ground_truth": 0}, {"key": "33893487", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10017221337848736, "ground_truth": 0}, {"key": "33893487", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1602660298080258, "ground_truth": 0}, {"key": "33893487", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168575599105623, "ground_truth": 0}, {"key": "33893487", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781088370464201, "ground_truth": 0}, {"key": "40913011", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8397339498317713, "ground_truth": 0}, {"key": "40913011", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8031737820914575, "ground_truth": 0}, {"key": "40913011", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7217432255638654, "ground_truth": 0}, {"key": "40913011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366502832389, "ground_truth": 0}, {"key": "40913011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.685949465909386, "ground_truth": 0}, {"key": "29642545", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25386100127509675, "ground_truth": 0}, {"key": "29642545", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2379299024131259, "ground_truth": 0}, {"key": "29642545", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2845760034982519, "ground_truth": 0}, {"key": "29642545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276682695479573, "ground_truth": 0}, {"key": "29642545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756750728941555, "ground_truth": 0}, {"key": "35969159", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4493926196040516, "ground_truth": 0}, {"key": "35969159", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43974735387780794, "ground_truth": 0}, {"key": "35969159", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4130035599244096, "ground_truth": 0}, {"key": "35969159", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121348187765, "ground_truth": 0}, {"key": "35969159", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571366980334706, "ground_truth": 0}, {"key": "37081669", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18242550420260412, "ground_truth": 0}, {"key": "37081669", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6909763051994405, "ground_truth": 0}, {"key": "37081669", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3593641496214937, "ground_truth": 0}, {"key": "37081669", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758386034665, "ground_truth": 0}, {"key": "37081669", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917210883621, "ground_truth": 0}, {"key": "40048022", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6495786297344208, "ground_truth": 0}, {"key": "40048022", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5640984896570725, "ground_truth": 0}, {"key": "40048022", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6636689288010176, "ground_truth": 0}, {"key": "40048022", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.60018836305455, "ground_truth": 0}, {"key": "40048022", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241740131722, "ground_truth": 0}, {"key": "32884004", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46295859247009336, "ground_truth": 0}, {"key": "32884004", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6315942821599247, "ground_truth": 0}, {"key": "32884004", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6513548567520955, "ground_truth": 0}, {"key": "32884004", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137293065156, "ground_truth": 0}, {"key": "32884004", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633154044187266, "ground_truth": 0}, {"key": "39022490", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6531269053592178, "ground_truth": 0}, {"key": "39022490", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6601723616543017, "ground_truth": 0}, {"key": "39022490", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4941408987457198, "ground_truth": 0}, {"key": "39022490", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.594551261298249, "ground_truth": 0}, {"key": "39022490", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.426321580432563, "ground_truth": 0}, {"key": "35159385", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5679366145664045, "ground_truth": 0}, {"key": "35159385", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7732163739004206, "ground_truth": 0}, {"key": "35159385", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7490872126542566, "ground_truth": 0}, {"key": "35159385", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762726384965, "ground_truth": 0}, {"key": "35159385", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.800692016017833, "ground_truth": 0}, {"key": "34363669", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6740504807651949, "ground_truth": 0}, {"key": "34363669", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49609383095871495, "ground_truth": 0}, {"key": "34363669", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5660185285781673, "ground_truth": 0}, {"key": "34363669", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185397640545, "ground_truth": 0}, {"key": "34363669", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4649015616604877, "ground_truth": 0}, {"key": "36119687", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7866228265508114, "ground_truth": 0}, {"key": "36119687", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6477982040919962, "ground_truth": 0}, {"key": "36119687", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9273632844863965, "ground_truth": 0}, {"key": "36119687", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933093963928814, "ground_truth": 0}, {"key": "36119687", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531128488133, "ground_truth": 0}, {"key": "35217446", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7866228145664257, "ground_truth": 0}, {"key": "35217446", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7217431848344562, "ground_truth": 0}, {"key": "35217446", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8766343601515727, "ground_truth": 0}, {"key": "35217446", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833653110838, "ground_truth": 0}, {"key": "35217446", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.884039275607037, "ground_truth": 0}, {"key": "39049331", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2829881306064399, "ground_truth": 0}, {"key": "39049331", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49804686663492914, "ground_truth": 0}, {"key": "39049331", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3593641460953092, "ground_truth": 0}, {"key": "39049331", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902371125987144, "ground_truth": 0}, {"key": "39049331", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268348588515413, "ground_truth": 0}, {"key": "36472242", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995738620319, "ground_truth": 0}, {"key": "36472242", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6825737418967627, "ground_truth": 0}, {"key": "36472242", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7759445653860076, "ground_truth": 0}, {"key": "36472242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245859426744, "ground_truth": 0}, {"key": "36472242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430459189533, "ground_truth": 0}, {"key": "31854721", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6909762699093114, "ground_truth": 0}, {"key": "31854721", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42632159166652894, "ground_truth": 0}, {"key": "31854721", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7813306097082204, "ground_truth": 0}, {"key": "31854721", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548445514372, "ground_truth": 0}, {"key": "31854721", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723793331481, "ground_truth": 0}, {"key": "18725849", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21469141244599022, "ground_truth": 0}, {"key": "18725849", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2751297163438558, "ground_truth": 0}, {"key": "18725849", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25534366522754326, "ground_truth": 0}, {"key": "18725849", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25683198527932216, "ground_truth": 0}, {"key": "18725849", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1666753927669047, "ground_truth": 0}, {"key": "36883179", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2674081545525012, "ground_truth": 0}, {"key": "36883179", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.670608261064651, "ground_truth": 0}, {"key": "36883179", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5506073743583261, "ground_truth": 0}, {"key": "36883179", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982760962700115, "ground_truth": 0}, {"key": "36883179", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457602597651144, "ground_truth": 0}, {"key": "34266359", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4765796382128637, "ground_truth": 0}, {"key": "34266359", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5717665959473298, "ground_truth": 0}, {"key": "34266359", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5175708939359934, "ground_truth": 0}, {"key": "34266359", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782348827831913, "ground_truth": 0}, {"key": "34266359", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468881456714, "ground_truth": 0}, {"key": "31920289", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1500288185721955, "ground_truth": 0}, {"key": "31920289", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25238402235483587, "ground_truth": 0}, {"key": "31920289", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487021050567, "ground_truth": 0}, {"key": "31920289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.216011521134613, "ground_truth": 0}, {"key": "31920289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2337063433789949, "ground_truth": 0}, {"key": "36292997", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5019531221370727, "ground_truth": 0}, {"key": "36292997", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5851011568709655, "ground_truth": 0}, {"key": "36292997", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7025300687650157, "ground_truth": 0}, {"key": "36292997", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432072211581, "ground_truth": 0}, {"key": "36292997", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228875591745, "ground_truth": 0}, {"key": "30412533", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6584175029429554, "ground_truth": 0}, {"key": "30412533", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5888891270305812, "ground_truth": 0}, {"key": "30412533", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7233094754471538, "ground_truth": 0}, {"key": "30412533", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804007667862, "ground_truth": 0}, {"key": "30412533", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762667014029, "ground_truth": 0}, {"key": "40433191", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7879311898354, "ground_truth": 0}, {"key": "40433191", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6460137386449788, "ground_truth": 0}, {"key": "40433191", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6150878521998883, "ground_truth": 0}, {"key": "40433191", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258193607097, "ground_truth": 0}, {"key": "40433191", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637484875164, "ground_truth": 0}, {"key": "34565591", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3056973037719861, "ground_truth": 0}, {"key": "34565591", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23231013262116704, "ground_truth": 0}, {"key": "34565591", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.279828482620086, "ground_truth": 0}, {"key": "34565591", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25091277715725646, "ground_truth": 0}, {"key": "34565591", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895033858088, "ground_truth": 0}, {"key": "36062480", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6548947282212911, "ground_truth": 0}, {"key": "36062480", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7201715146516153, "ground_truth": 0}, {"key": "36062480", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8140527975516688, "ground_truth": 0}, {"key": "36062480", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833890185253, "ground_truth": 0}, {"key": "36062480", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210780181982, "ground_truth": 0}, {"key": "37276883", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5409238458122825, "ground_truth": 0}, {"key": "37276883", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5851011484481441, "ground_truth": 0}, {"key": "37276883", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44552956287776974, "ground_truth": 0}, {"key": "37276883", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643860737444, "ground_truth": 0}, {"key": "37276883", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414068757201, "ground_truth": 0}, {"key": "38509260", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5736784139918719, "ground_truth": 0}, {"key": "38509260", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3775406929451434, "ground_truth": 0}, {"key": "38509260", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44360041398815653, "ground_truth": 0}, {"key": "38509260", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861802766370623, "ground_truth": 0}, {"key": "38509260", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687307263380557, "ground_truth": 0}, {"key": "37139607", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5350984165999774, "ground_truth": 0}, {"key": "37139607", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5832033611406292, "ground_truth": 0}, {"key": "37139607", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5195213469248938, "ground_truth": 0}, {"key": "37139607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381538113878, "ground_truth": 0}, {"key": "37139607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953793820935, "ground_truth": 0}, {"key": "37092824", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7185943978981246, "ground_truth": 0}, {"key": "37092824", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6261241905353352, "ground_truth": 0}, {"key": "37092824", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2704802408310856, "ground_truth": 0}, {"key": "37092824", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203229037008, "ground_truth": 0}, {"key": "37092824", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004033206726, "ground_truth": 0}, {"key": "32191802", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8210441081626503, "ground_truth": 0}, {"key": "32191802", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7892336792385642, "ground_truth": 0}, {"key": "32191802", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8848377705157635, "ground_truth": 0}, {"key": "32191802", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943810353699, "ground_truth": 0}, {"key": "32191802", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517045166484, "ground_truth": 0}, {"key": "39396038", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9353465166223125, "ground_truth": 0}, {"key": "39396038", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.833324590685819, "ground_truth": 0}, {"key": "39396038", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8418256493830685, "ground_truth": 0}, {"key": "39396038", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675389544644, "ground_truth": 0}, {"key": "39396038", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228323880003, "ground_truth": 0}, {"key": "39076884", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117165987483431, "ground_truth": 0}, {"key": "39076884", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6095241440907297, "ground_truth": 0}, {"key": "39076884", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7634837395064743, "ground_truth": 0}, {"key": "39076884", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136954644395, "ground_truth": 0}, {"key": "39076884", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765028540388, "ground_truth": 0}, {"key": "27763432", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2735743966424861, "ground_truth": 0}, {"key": "27763432", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4244119846799241, "ground_truth": 0}, {"key": "27763432", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3123700213215622, "ground_truth": 0}, {"key": "27763432", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881518592778, "ground_truth": 0}, {"key": "27763432", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34510527003217156, "ground_truth": 0}, {"key": "37806929", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42250463844764563, "ground_truth": 0}, {"key": "37806929", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4980468642499521, "ground_truth": 0}, {"key": "37806929", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4436003990207919, "ground_truth": 0}, {"key": "37806929", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786808201113, "ground_truth": 0}, {"key": "37806929", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378235022465921, "ground_truth": 0}, {"key": "32334186", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.720171502656693, "ground_truth": 0}, {"key": "32334186", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6370307941228331, "ground_truth": 0}, {"key": "32334186", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5945512642615278, "ground_truth": 0}, {"key": "32334186", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026712995508, "ground_truth": 0}, {"key": "32334186", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640155097417, "ground_truth": 0}, {"key": "36187324", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48633152648368405, "ground_truth": 0}, {"key": "36187324", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117165726605641, "ground_truth": 0}, {"key": "36187324", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.61693583502057, "ground_truth": 0}, {"key": "36187324", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132653056051847, "ground_truth": 0}, {"key": "36187324", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392849169794, "ground_truth": 0}, {"key": "35306009", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8679338392791582, "ground_truth": 0}, {"key": "35306009", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8056321904266789, "ground_truth": 0}, {"key": "35306009", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9252299537250918, "ground_truth": 0}, {"key": "35306009", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067183000924, "ground_truth": 0}, {"key": "35306009", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.891054941465462, "ground_truth": 0}, {"key": "39490050", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16667541257981527, "ground_truth": 0}, {"key": "39490050", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38491213830814064, "ground_truth": 0}, {"key": "39490050", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2658804520834085, "ground_truth": 0}, {"key": "39490050", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11676401818489876, "ground_truth": 0}, {"key": "39490050", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594952275744404, "ground_truth": 0}, {"key": "38072149", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5058590828762075, "ground_truth": 0}, {"key": "38072149", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40733341794117056, "ground_truth": 0}, {"key": "38072149", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26588046211836003, "ground_truth": 0}, {"key": "38072149", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544872474044796, "ground_truth": 0}, {"key": "38072149", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119988728138, "ground_truth": 0}, {"key": "35899689", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26284187346735954, "ground_truth": 0}, {"key": "35899689", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34510528500696735, "ground_truth": 0}, {"key": "35899689", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38861803177566373, "ground_truth": 0}, {"key": "35899689", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953742022814, "ground_truth": 0}, {"key": "35899689", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869688946820816, "ground_truth": 0}, {"key": "27994518", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38121958056758287, "ground_truth": 0}, {"key": "27994518", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39981166577479443, "ground_truth": 0}, {"key": "27994518", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4148988571529781, "ground_truth": 0}, {"key": "27994518", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090236902166221, "ground_truth": 0}, {"key": "27994518", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544873267710096, "ground_truth": 0}, {"key": "10615479", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12421301081034272, "ground_truth": 0}, {"key": "10615479", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11838510409636364, "ground_truth": 0}, {"key": "10615479", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.0803574774725266, "ground_truth": 0}, {"key": "10615479", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.0913821002554589, "ground_truth": 0}, {"key": "10615479", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451646229436, "ground_truth": 0}, {"key": "40186667", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6926419731938267, "ground_truth": 0}, {"key": "40186667", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4186969006308111, "ground_truth": 0}, {"key": "40186667", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5253688206252107, "ground_truth": 0}, {"key": "40186667", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.656658238857049, "ground_truth": 0}, {"key": "40186667", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37022537340105355, "ground_truth": 0}, {"key": "38622886", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7341195175468589, "ground_truth": 0}, {"key": "38622886", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29583986043662824, "ground_truth": 0}, {"key": "38622886", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7074046916711163, "ground_truth": 0}, {"key": "38622886", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825957837437, "ground_truth": 0}, {"key": "38622886", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159444741443, "ground_truth": 0}, {"key": "40686943", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6584174961961115, "ground_truth": 0}, {"key": "40686943", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.718594384116536, "ground_truth": 0}, {"key": "40686943", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5019531037170156, "ground_truth": 0}, {"key": "40686943", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786404130289, "ground_truth": 0}, {"key": "40686943", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.723309469795295, "ground_truth": 0}, {"key": "30604567", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7772998695127882, "ground_truth": 0}, {"key": "30604567", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7799928964048962, "ground_truth": 0}, {"key": "30604567", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6636689329775504, "ground_truth": 0}, {"key": "30604567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.746138994260599, "ground_truth": 0}, {"key": "30604567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317058860251, "ground_truth": 0}, {"key": "35440903", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6842640478819223, "ground_truth": 0}, {"key": "35440903", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48047864739559276, "ground_truth": 0}, {"key": "35440903", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6723316777313102, "ground_truth": 0}, {"key": "35440903", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "35440903", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224479879813, "ground_truth": 0}, {"key": "37219533", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.388618033597546, "ground_truth": 0}, {"key": "37219533", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4416729677913096, "ground_truth": 0}, {"key": "37219533", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.462958602636887, "ground_truth": 0}, {"key": "37219533", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3486451402730235, "ground_truth": 0}, {"key": "37219533", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864512864719, "ground_truth": 0}, {"key": "40178965", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6566582687936106, "ground_truth": 0}, {"key": "40178965", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4205995732890436, "ground_truth": 0}, {"key": "40178965", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7201715090695382, "ground_truth": 0}, {"key": "40178965", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382060103959, "ground_truth": 0}, {"key": "40178965", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438950793351494, "ground_truth": 0}, {"key": "13750468", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010667192640212, "ground_truth": 0}, {"key": "13750468", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2658804868490114, "ground_truth": 0}, {"key": "13750468", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19072403660173046, "ground_truth": 0}, {"key": "13750468", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1561049062924932, "ground_truth": 0}, {"key": "13750468", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689403867994235, "ground_truth": 0}, {"key": "17754949", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117165955726427, "ground_truth": 0}, {"key": "17754949", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4921881282569155, "ground_truth": 0}, {"key": "17754949", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5078118470952445, "ground_truth": 0}, {"key": "17754949", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389896434075, "ground_truth": 0}, {"key": "17754949", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506320204516, "ground_truth": 0}, {"key": "36675623", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8962513864651799, "ground_truth": 0}, {"key": "36675623", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8740772397817662, "ground_truth": 0}, {"key": "36675623", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7931059535089287, "ground_truth": 0}, {"key": "36675623", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677566804037, "ground_truth": 0}, {"key": "36675623", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894700676322, "ground_truth": 0}, {"key": "40035440", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8925625211441736, "ground_truth": 0}, {"key": "40035440", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7732163521760339, "ground_truth": 0}, {"key": "40035440", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.646013684800502, "ground_truth": 0}, {"key": "40035440", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759624668114, "ground_truth": 0}, {"key": "40035440", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105590563121, "ground_truth": 0}, {"key": "37685909", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2583259997070171, "ground_truth": 0}, {"key": "37685909", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20817892863695384, "ground_truth": 0}, {"key": "37685909", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22678364815328705, "ground_truth": 0}, {"key": "37685909", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238401122670656, "ground_truth": 0}, {"key": "37685909", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476753322662473, "ground_truth": 0}, {"key": "36938787", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526546066695, "ground_truth": 0}, {"key": "36938787", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880192049891, "ground_truth": 0}, {"key": "36938787", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.418696906994834, "ground_truth": 0}, {"key": "36938787", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.562176492109106, "ground_truth": 0}, {"key": "36938787", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632973969318, "ground_truth": 0}, {"key": "39398068", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25534365320359836, "ground_truth": 0}, {"key": "39398068", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35398632156142307, "ground_truth": 0}, {"key": "39398068", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4436004215599607, "ground_truth": 0}, {"key": "39398068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414089777805903, "ground_truth": 0}, {"key": "39398068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633788651782, "ground_truth": 0}, {"key": "39926408", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44552953321242533, "ground_truth": 0}, {"key": "39926408", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6909763016627606, "ground_truth": 0}, {"key": "39926408", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231015601411456, "ground_truth": 0}, {"key": "39926408", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531156678132, "ground_truth": 0}, {"key": "39926408", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734983968092, "ground_truth": 0}, {"key": "40465336", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3468730595761272, "ground_truth": 0}, {"key": "40465336", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5097643595128374, "ground_truth": 0}, {"key": "40465336", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43014734056753406, "ground_truth": 0}, {"key": "40465336", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828339631341094, "ground_truth": 0}, {"key": "40465336", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944725287227074, "ground_truth": 0}, {"key": "34173549", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7634837663043913, "ground_truth": 0}, {"key": "34173549", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48438005886104885, "ground_truth": 0}, {"key": "34173549", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.607663163640064, "ground_truth": 0}, {"key": "34173549", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437201916231, "ground_truth": 0}, {"key": "34173549", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517175160198, "ground_truth": 0}, {"key": "33541535", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6584174933138186, "ground_truth": 0}, {"key": "33541535", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185415918306, "ground_truth": 0}, {"key": "33541535", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7122321830856286, "ground_truth": 0}, {"key": "33541535", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093574977743, "ground_truth": 0}, {"key": "33541535", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046903198069, "ground_truth": 0}, {"key": "35685195", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.670608280093699, "ground_truth": 0}, {"key": "35685195", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6926419899504882, "ground_truth": 0}, {"key": "35685195", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7648916150718975, "ground_truth": 0}, {"key": "35685195", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254008331101, "ground_truth": 0}, {"key": "35685195", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943792462835, "ground_truth": 0}, {"key": "28440730", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18952108933395903, "ground_truth": 0}, {"key": "28440730", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37570646654283607, "ground_truth": 0}, {"key": "28440730", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26435838025780295, "ground_truth": 0}, {"key": "28440730", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864512918584645, "ground_truth": 0}, {"key": "28440730", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421499977110455, "ground_truth": 0}, {"key": "38338714", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315942974726467, "ground_truth": 0}, {"key": "38338714", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7201715059932343, "ground_truth": 0}, {"key": "38338714", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7057850049542175, "ground_truth": 0}, {"key": "38338714", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764606831482, "ground_truth": 0}, {"key": "38338714", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918276489044, "ground_truth": 0}, {"key": "32191881", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28937167581433165, "ground_truth": 0}, {"key": "32191881", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.154057550904896, "ground_truth": 0}, {"key": "32191881", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12765263185525988, "ground_truth": 0}, {"key": "32191881", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509905213112935, "ground_truth": 0}, {"key": "32191881", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1592174056893529, "ground_truth": 0}, {"key": "37707251", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15713686432746662, "ground_truth": 0}, {"key": "37707251", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26588045598096804, "ground_truth": 0}, {"key": "37707251", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24220562410670574, "ground_truth": 0}, {"key": "37707251", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1732882126287403, "ground_truth": 0}, {"key": "37707251", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434189492691662, "ground_truth": 0}, {"key": "40172567", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3629692090857865, "ground_truth": 0}, {"key": "40172567", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38121955976230704, "ground_truth": 0}, {"key": "40172567", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5370413832771722, "ground_truth": 0}, {"key": "40172567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488465222296, "ground_truth": 0}, {"key": "40172567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668456101432378, "ground_truth": 0}, {"key": "33113255", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8128673042068302, "ground_truth": 0}, {"key": "33113255", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7106282969997276, "ground_truth": 0}, {"key": "33113255", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6893056156880711, "ground_truth": 0}, {"key": "33113255", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094578902273, "ground_truth": 0}, {"key": "33113255", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104788921924114, "ground_truth": 0}, {"key": "33022143", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49023561850607317, "ground_truth": 0}, {"key": "33022143", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5428632861954374, "ground_truth": 0}, {"key": "33022143", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3539863288508467, "ground_truth": 0}, {"key": "33022143", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058590925567429, "ground_truth": 0}, {"key": "33022143", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641806231622, "ground_truth": 0}, {"key": "32084473", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6706082795770398, "ground_truth": 0}, {"key": "32084473", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7025300565641508, "ground_truth": 0}, {"key": "32084473", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7620700975907548, "ground_truth": 0}, {"key": "32084473", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802474328571, "ground_truth": 0}, {"key": "32084473", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321905048705, "ground_truth": 0}, {"key": "40564245", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11357959349459906, "ground_truth": 0}, {"key": "40564245", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2909808686802568, "ground_truth": 0}, {"key": "40564245", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17441027218482646, "ground_truth": 0}, {"key": "40564245", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2568320160441412, "ground_truth": 0}, {"key": "40564245", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135071113905, "ground_truth": 0}, {"key": "31717213", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48633154973326254, "ground_truth": 0}, {"key": "31717213", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3522017861881379, "ground_truth": 0}, {"key": "31717213", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3056973282001081, "ground_truth": 0}, {"key": "31717213", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473280679395, "ground_truth": 0}, {"key": "31717213", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634405551714, "ground_truth": 0}, {"key": "34861894", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34864514262422946, "ground_truth": 0}, {"key": "34861894", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45907612435631406, "ground_truth": 0}, {"key": "34861894", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6261241865774656, "ground_truth": 0}, {"key": "34861894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792028097743, "ground_truth": 0}, {"key": "34861894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891281126881, "ground_truth": 0}, {"key": "40838760", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7248702713433093, "ground_truth": 0}, {"key": "40838760", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7786493084028413, "ground_truth": 0}, {"key": "40838760", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7041601210691335, "ground_truth": 0}, {"key": "40838760", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680059114326, "ground_truth": 0}, {"key": "40838760", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548700960731, "ground_truth": 0}, {"key": "40044849", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6513548534169462, "ground_truth": 0}, {"key": "40044849", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7264256301606993, "ground_truth": 0}, {"key": "40044849", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7090191346489385, "ground_truth": 0}, {"key": "40044849", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256253397254, "ground_truth": 0}, {"key": "40044849", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883534161975, "ground_truth": 0}, {"key": "30296116", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25683198154243125, "ground_truth": 0}, {"key": "30296116", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33982760739670564, "ground_truth": 0}, {"key": "30296116", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.509764421904635, "ground_truth": 0}, {"key": "30296116", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796476099942, "ground_truth": 0}, {"key": "30296116", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090236763421727, "ground_truth": 0}, {"key": "34931360", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331543665266755, "ground_truth": 0}, {"key": "34931360", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23792990412850884, "ground_truth": 0}, {"key": "34931360", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3522017740279217, "ground_truth": 0}, {"key": "34931360", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384255270266, "ground_truth": 0}, {"key": "34931360", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881369983647, "ground_truth": 0}, {"key": "18862422", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3140505434020163, "ground_truth": 0}, {"key": "18862422", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4513264883065652, "ground_truth": 0}, {"key": "18862422", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26588047140315585, "ground_truth": 0}, {"key": "18862422", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081700412056, "ground_truth": 0}, {"key": "18862422", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360043651670356, "ground_truth": 0}, {"key": "36361140", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6959583190525142, "ground_truth": 0}, {"key": "36361140", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5019530999115172, "ground_truth": 0}, {"key": "36361140", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7386690676627593, "ground_truth": 0}, {"key": "36361140", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057849864398472, "ground_truth": 0}, {"key": "36361140", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367166714562, "ground_truth": 0}, {"key": "39703329", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010664905800589, "ground_truth": 0}, {"key": "39703329", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21076631384415326, "ground_truth": 0}, {"key": "39703329", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10230471602683636, "ground_truth": 0}, {"key": "39703329", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159119525229646, "ground_truth": 0}, {"key": "39703329", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676401227781294, "ground_truth": 0}, {"key": "34033324", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9465966687524722, "ground_truth": 0}, {"key": "34033324", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8233284021540642, "ground_truth": 0}, {"key": "34033324", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953821986629, "ground_truth": 0}, {"key": "34033324", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9314625140670881, "ground_truth": 0}, {"key": "34033324", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321991832693, "ground_truth": 0}, {"key": "35658862", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5813031266782116, "ground_truth": 0}, {"key": "35658862", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32082130964766625, "ground_truth": 0}, {"key": "35658862", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6740504862269892, "ground_truth": 0}, {"key": "35658862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609379840387763, "ground_truth": 0}, {"key": "35658862", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711584336045, "ground_truth": 0}, {"key": "36092657", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6279512216744362, "ground_truth": 0}, {"key": "36092657", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7371581413833314, "ground_truth": 0}, {"key": "36092657", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6723316865868896, "ground_truth": 0}, {"key": "36092657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004138444068, "ground_truth": 0}, {"key": "36092657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.616935852414732, "ground_truth": 0}, {"key": "26333438", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18713267745678436, "ground_truth": 0}, {"key": "26333438", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4167966412228593, "ground_truth": 0}, {"key": "26333438", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3415825039443352, "ground_truth": 0}, {"key": "26333438", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2689414234235691, "ground_truth": 0}, {"key": "26333438", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36116471833920566, "ground_truth": 0}, {"key": "34184963", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3174262838906843, "ground_truth": 0}, {"key": "34184963", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582567993093, "ground_truth": 0}, {"key": "34184963", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32766831038269256, "ground_truth": 0}, {"key": "34184963", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3056973225803264, "ground_truth": 0}, {"key": "34184963", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804904654752, "ground_truth": 0}, {"key": "35069975", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331544060593563, "ground_truth": 0}, {"key": "35069975", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5214711602624598, "ground_truth": 0}, {"key": "35069975", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5869964231787467, "ground_truth": 0}, {"key": "35069975", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398147701612366, "ground_truth": 0}, {"key": "35069975", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052754469879, "ground_truth": 0}, {"key": "36443950", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2689414415994634, "ground_truth": 0}, {"key": "36443950", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22815652818943513, "ground_truth": 0}, {"key": "36443950", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21601154512675164, "ground_truth": 0}, {"key": "36443950", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806417435636273, "ground_truth": 0}, {"key": "36443950", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370636051108262, "ground_truth": 0}, {"key": "29460858", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21076631391999123, "ground_truth": 0}, {"key": "29460858", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16132024771811224, "ground_truth": 0}, {"key": "29460858", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2893716896111021, "ground_truth": 0}, {"key": "29460858", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847675226462119, "ground_truth": 0}, {"key": "29460858", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534367141039016, "ground_truth": 0}, {"key": "36155704", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41489885041710145, "ground_truth": 0}, {"key": "36155704", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2861692590037174, "ground_truth": 0}, {"key": "36155704", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3522017716349547, "ground_truth": 0}, {"key": "36155704", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2436424296014824, "ground_truth": 0}, {"key": "36155704", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416900989962, "ground_truth": 0}, {"key": "37185211", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7122321889565073, "ground_truth": 0}, {"key": "37185211", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4668455983390547, "ground_truth": 0}, {"key": "37185211", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4921881431402208, "ground_truth": 0}, {"key": "37185211", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707366159372879, "ground_truth": 0}, {"key": "37185211", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317043866034, "ground_truth": 0}, {"key": "36454885", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5926666077264016, "ground_truth": 0}, {"key": "36454885", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45907613076749687, "ground_truth": 0}, {"key": "36454885", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5117166092553809, "ground_truth": 0}, {"key": "36454885", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519861924502053, "ground_truth": 0}, {"key": "36454885", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708808604799, "ground_truth": 0}, {"key": "33148906", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0888202868604171, "ground_truth": 0}, {"key": "33148906", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10302441833223722, "ground_truth": 0}, {"key": "33148906", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08449274931949045, "ground_truth": 0}, {"key": "33148906", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592276850183362, "ground_truth": 0}, {"key": "33148906", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2323101416307887, "ground_truth": 0}, {"key": "18086604", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13477591226524685, "ground_truth": 0}, {"key": "18086604", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13568954230955227, "ground_truth": 0}, {"key": "18086604", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000710061904313, "ground_truth": 0}, {"key": "18086604", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279539926099273, "ground_truth": 0}, {"key": "18086604", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357958589673553, "ground_truth": 0}, {"key": "33693397", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45713671554998636, "ground_truth": 0}, {"key": "33693397", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41869690750832234, "ground_truth": 0}, {"key": "33693397", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3793784108789999, "ground_truth": 0}, {"key": "33693397", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017736554763, "ground_truth": 0}, {"key": "33693397", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014197498193, "ground_truth": 0}, {"key": "39501530", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2254166281341112, "ground_truth": 0}, {"key": "39501530", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1338674748562959, "ground_truth": 0}, {"key": "39501530", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16995624258070743, "ground_truth": 0}, {"key": "39501530", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314736345302452, "ground_truth": 0}, {"key": "39501530", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1602660249418901, "ground_truth": 0}, {"key": "30948874", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5389831994280712, "ground_truth": 0}, {"key": "30948874", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058591169227514, "ground_truth": 0}, {"key": "30948874", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5679366219448956, "ground_truth": 0}, {"key": "30948874", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.476579660090668, "ground_truth": 0}, {"key": "30948874", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365564666477, "ground_truth": 0}, {"key": "39410675", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6825737242489042, "ground_truth": 0}, {"key": "39410675", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7025300459164121, "ground_truth": 0}, {"key": "39410675", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8354835367278244, "ground_truth": 0}, {"key": "39410675", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743766901119, "ground_truth": 0}, {"key": "39410675", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148246941037, "ground_truth": 0}, {"key": "32903337", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38306414885715584, "ground_truth": 0}, {"key": "32903337", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29421497629008886, "ground_truth": 0}, {"key": "32903337", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.338077137319901, "ground_truth": 0}, {"key": "32903337", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237397462623, "ground_truth": 0}, {"key": "32903337", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052481414735, "ground_truth": 0}, {"key": "27685132", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6548947334427773, "ground_truth": 0}, {"key": "27685132", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3486451448952597, "ground_truth": 0}, {"key": "27685132", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4863315420296241, "ground_truth": 0}, {"key": "27685132", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132648241682555, "ground_truth": 0}, {"key": "27685132", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064747731801, "ground_truth": 0}, {"key": "22791471", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38306413620879287, "ground_truth": 0}, {"key": "22791471", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4455295327591753, "ground_truth": 0}, {"key": "22791471", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6242935393062947, "ground_truth": 0}, {"key": "22791471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365398629298, "ground_truth": 0}, {"key": "22791471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.517570904037918, "ground_truth": 0}, {"key": "32292348", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2267836346895404, "ground_truth": 0}, {"key": "32292348", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.397938386920649, "ground_truth": 0}, {"key": "32292348", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3242354090727612, "ground_truth": 0}, {"key": "32292348", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.253861028692717, "ground_truth": 0}, {"key": "32292348", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573598224043203, "ground_truth": 0}, {"key": "20482930", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5467381357188753, "ground_truth": 0}, {"key": "20482930", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331724966754, "ground_truth": 0}, {"key": "20482930", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28457599759952823, "ground_truth": 0}, {"key": "20482930", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647488498929, "ground_truth": 0}, {"key": "20482930", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974733288726287, "ground_truth": 0}, {"key": "11635754", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4551986176579014, "ground_truth": 0}, {"key": "11635754", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2479874387595249, "ground_truth": 0}, {"key": "11635754", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5273165448676631, "ground_truth": 0}, {"key": "11635754", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791966397345, "ground_truth": 0}, {"key": "11635754", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.707404672698377, "ground_truth": 0}, {"key": "40029096", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41869691093951283, "ground_truth": 0}, {"key": "40029096", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4882833888996392, "ground_truth": 0}, {"key": "40029096", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717665977512023, "ground_truth": 0}, {"key": "40029096", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368267108845, "ground_truth": 0}, {"key": "40029096", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819690304954, "ground_truth": 0}, {"key": "40414719", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7994422958492425, "ground_truth": 0}, {"key": "40414719", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5926666049457285, "ground_truth": 0}, {"key": "40414719", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6334102676126916, "ground_truth": 0}, {"key": "40414719", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740013555003, "ground_truth": 0}, {"key": "40414719", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117956699562, "ground_truth": 0}, {"key": "39537616", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7248702971847107, "ground_truth": 0}, {"key": "39537616", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5640984683510801, "ground_truth": 0}, {"key": "39537616", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6774740144680166, "ground_truth": 0}, {"key": "39537616", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706083023568281, "ground_truth": 0}, {"key": "39537616", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819504600051, "ground_truth": 0}, {"key": "33245830", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3056973041182065, "ground_truth": 0}, {"key": "33245830", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2173375188650611, "ground_truth": 0}, {"key": "33245830", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20946967914278236, "ground_truth": 0}, {"key": "33245830", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601155033635902, "ground_truth": 0}, {"key": "33245830", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1895211038175583, "ground_truth": 0}, {"key": "39243601", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43206341108321755, "ground_truth": 0}, {"key": "39243601", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568320064802744, "ground_truth": 0}, {"key": "39243601", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49414090407923605, "ground_truth": 0}, {"key": "39243601", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009852511346, "ground_truth": 0}, {"key": "39243601", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36116469876736046, "ground_truth": 0}, {"key": "35815905", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2958398393798029, "ground_truth": 0}, {"key": "35815905", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3090236889661765, "ground_truth": 0}, {"key": "35815905", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2553436669925667, "ground_truth": 0}, {"key": "35815905", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327952194878, "ground_truth": 0}, {"key": "35815905", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23231015179991357, "ground_truth": 0}, {"key": "35260212", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5640984795681675, "ground_truth": 0}, {"key": "35260212", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32594951579867026, "ground_truth": 0}, {"key": "35260212", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6242935229586216, "ground_truth": 0}, {"key": "35260212", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593351414704, "ground_truth": 0}, {"key": "35260212", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.63703080117211, "ground_truth": 0}, {"key": "39193924", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7008948113835359, "ground_truth": 0}, {"key": "39193924", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5097644100538717, "ground_truth": 0}, {"key": "39193924", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6020615961427909, "ground_truth": 0}, {"key": "39193924", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684057066455872, "ground_truth": 0}, {"key": "39193924", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586095166548, "ground_truth": 0}, {"key": "40658569", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3259495104774656, "ground_truth": 0}, {"key": "40658569", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32252598603962307, "ground_truth": 0}, {"key": "40658569", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35577492222034796, "ground_truth": 0}, {"key": "40658569", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2005576650278019, "ground_truth": 0}, {"key": "40658569", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36840569399094314, "ground_truth": 0}, {"key": "33497596", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3023910730280002, "ground_truth": 0}, {"key": "33497596", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568319848087032, "ground_truth": 0}, {"key": "33497596", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4590760975828598, "ground_truth": 0}, {"key": "33497596", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937839867605866, "ground_truth": 0}, {"key": "33497596", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893716838118953, "ground_truth": 0}, {"key": "40339241", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7905303238630706, "ground_truth": 0}, {"key": "40339241", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6187804472517833, "ground_truth": 0}, {"key": "40339241", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6757646132126173, "ground_truth": 0}, {"key": "40339241", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063693716882, "ground_truth": 0}, {"key": "40339241", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.727975442161595, "ground_truth": 0}, {"key": "31792608", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.226783628753232, "ground_truth": 0}, {"key": "31792608", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32766830567970245, "ground_truth": 0}, {"key": "31792608", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20946970797324374, "ground_truth": 0}, {"key": "31792608", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353995048312, "ground_truth": 0}, {"key": "31792608", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682618854551684, "ground_truth": 0}, {"key": "33132662", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3415824853196419, "ground_truth": 0}, {"key": "33132662", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25982562663866754, "ground_truth": 0}, {"key": "33132662", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4941408785844017, "ground_truth": 0}, {"key": "33132662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557749014823886, "ground_truth": 0}, {"key": "33132662", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004353859136, "ground_truth": 0}, {"key": "37577457", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49414090441897046, "ground_truth": 0}, {"key": "37577457", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44167303553357307, "ground_truth": 0}, {"key": "37577457", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.282988125917836, "ground_truth": 0}, {"key": "37577457", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282333993624746, "ground_truth": 0}, {"key": "37577457", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676343922508133, "ground_truth": 0}, {"key": "38701278", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23934936185235908, "ground_truth": 0}, {"key": "38701278", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27982847505349573, "ground_truth": 0}, {"key": "38701278", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5156199191192049, "ground_truth": 0}, {"key": "38701278", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798285017096621, "ground_truth": 0}, {"key": "38701278", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561504817125176, "ground_truth": 0}, {"key": "34570783", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.724870262770896, "ground_truth": 0}, {"key": "34570783", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5736784072570746, "ground_truth": 0}, {"key": "34570783", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7853085917336019, "ground_truth": 0}, {"key": "34570783", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563421440221, "ground_truth": 0}, {"key": "34570783", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089041084248, "ground_truth": 0}, {"key": "39064526", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4035668457445343, "ground_truth": 0}, {"key": "39064526", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3023910788957953, "ground_truth": 0}, {"key": "39064526", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337716244505406, "ground_truth": 0}, {"key": "39064526", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.258325980985916, "ground_truth": 0}, {"key": "39064526", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320634047806743, "ground_truth": 0}, {"key": "40741545", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43974734844576324, "ground_truth": 0}, {"key": "40741545", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6584175086003655, "ground_truth": 0}, {"key": "40741545", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6150878414057132, "ground_truth": 0}, {"key": "40741545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093503660579, "ground_truth": 0}, {"key": "40741545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358574522079, "ground_truth": 0}, {"key": "36929751", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5253688426757955, "ground_truth": 0}, {"key": "36929751", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5448013957604315, "ground_truth": 0}, {"key": "36929751", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6513548790825294, "ground_truth": 0}, {"key": "36929751", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358360629633, "ground_truth": 0}, {"key": "36929751", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014099088494, "ground_truth": 0}, {"key": "23984730", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0888202913190189, "ground_truth": 0}, {"key": "23984730", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24220563419690272, "ground_truth": 0}, {"key": "23984730", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1480472125089363, "ground_truth": 0}, {"key": "23984730", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357960350648542, "ground_truth": 0}, {"key": "23984730", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601153797131792, "ground_truth": 0}, {"key": "36007415", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7461389851119667, "ground_truth": 0}, {"key": "36007415", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9046505256394922, "ground_truth": 0}, {"key": "36007415", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9252299550097602, "ground_truth": 0}, {"key": "36007415", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419968091779, "ground_truth": 0}, {"key": "36007415", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.956957154570458, "ground_truth": 0}, {"key": "38875041", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358601116646, "ground_truth": 0}, {"key": "38875041", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.548673534738502, "ground_truth": 0}, {"key": "38875041", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6926419849215849, "ground_truth": 0}, {"key": "38875041", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504782568119, "ground_truth": 0}, {"key": "38875041", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834163954101, "ground_truth": 0}]