[{"key": "35232142", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09739039913991475, "ground_truth": 0}, {"key": "35232142", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16132024611902185, "ground_truth": 0}, {"key": "35232142", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19559408650290036, "ground_truth": 0}, {"key": "35232142", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14511536367621047, "ground_truth": 0}, {"key": "35232142", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.08882028854207102, "ground_truth": 0}, {"key": "40143035", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45132653343779316, "ground_truth": 0}, {"key": "40143035", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2814056060548279, "ground_truth": 0}, {"key": "40143035", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4513265388896658, "ground_truth": 0}, {"key": "40143035", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2583259961125988, "ground_truth": 0}, {"key": "40143035", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295860150020696, "ground_truth": 0}, {"key": "35951548", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1699562336421884, "ground_truth": 0}, {"key": "35951548", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14414884548831217, "ground_truth": 0}, {"key": "35951548", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940273345221398, "ground_truth": 0}, {"key": "35951548", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369627635053697, "ground_truth": 0}, {"key": "35951548", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1183850921058667, "ground_truth": 0}, {"key": "36266422", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559408174201146, "ground_truth": 0}, {"key": "36266422", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2643583489463604, "ground_truth": 0}, {"key": "36266422", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10970576936091611, "ground_truth": 0}, {"key": "36266422", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577056270127, "ground_truth": 0}, {"key": "36266422", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1259227656870677, "ground_truth": 0}, {"key": "38826984", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33111974517802717, "ground_truth": 0}, {"key": "38826984", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44360040623089736, "ground_truth": 0}, {"key": "38826984", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4111108569663157, "ground_truth": 0}, {"key": "38826984", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629691883982172, "ground_truth": 0}, {"key": "38826984", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44746028025685025, "ground_truth": 0}, {"key": "34540833", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2043419083622694, "ground_truth": 0}, {"key": "34540833", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45713670267397827, "ground_truth": 0}, {"key": "34540833", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3208213077747246, "ground_truth": 0}, {"key": "34540833", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832597494435855, "ground_truth": 0}, {"key": "34540833", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.255343649461367, "ground_truth": 0}, {"key": "20836172", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35577486184628304, "ground_truth": 0}, {"key": "20836172", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40733340817181807, "ground_truth": 0}, {"key": "20836172", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40922079273972584, "ground_truth": 0}, {"key": "20836172", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.348645153801162, "ground_truth": 0}, {"key": "20836172", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910518817900866, "ground_truth": 0}, {"key": "35932467", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20307462115843045, "ground_truth": 0}, {"key": "35932467", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3702254179434023, "ground_truth": 0}, {"key": "35932467", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3040416885994462, "ground_truth": 0}, {"key": "35932467", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327894729671, "ground_truth": 0}, {"key": "35932467", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1320661477164125, "ground_truth": 0}, {"key": "40758845", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1835936264944796, "ground_truth": 0}, {"key": "40758845", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32423541681268453, "ground_truth": 0}, {"key": "40758845", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4474603026143953, "ground_truth": 0}, {"key": "40758845", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447731828420856, "ground_truth": 0}, {"key": "40758845", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952109821804108, "ground_truth": 0}, {"key": "30358490", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2120687985995859, "ground_truth": 0}, {"key": "30358490", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24508502815063546, "ground_truth": 0}, {"key": "30358490", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23651623858351742, "ground_truth": 0}, {"key": "30358490", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510839255498012, "ground_truth": 0}, {"key": "30358490", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616923728667654, "ground_truth": 0}, {"key": "34615665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6688802534833233, "ground_truth": 0}, {"key": "34615665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.567936614761065, "ground_truth": 0}, {"key": "34615665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8187368147100035, "ground_truth": 0}, {"key": "34615665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587921378263, "ground_truth": 0}, {"key": "34615665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063751465885, "ground_truth": 0}, {"key": "35890902", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486734794765268, "ground_truth": 0}, {"key": "35890902", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21866938544410125, "ground_truth": 0}, {"key": "35890902", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4035668349569231, "ground_truth": 0}, {"key": "35890902", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.624293547404287, "ground_truth": 0}, {"key": "35890902", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069563193474, "ground_truth": 0}, {"key": "37922330", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35220179754310216, "ground_truth": 0}, {"key": "37922330", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3942009738333173, "ground_truth": 0}, {"key": "37922330", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4610167587746556, "ground_truth": 0}, {"key": "37922330", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413977813633, "ground_truth": 0}, {"key": "37922330", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458943595909607, "ground_truth": 0}, {"key": "30844962", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32594953304888247, "ground_truth": 0}, {"key": "30844962", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12252320910929276, "ground_truth": 0}, {"key": "30844962", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.04434858236168769, "ground_truth": 0}, {"key": "30844962", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623311127178, "ground_truth": 0}, {"key": "30844962", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10447731499430414, "ground_truth": 0}, {"key": "36217333", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.06142404311172037, "ground_truth": 0}, {"key": "36217333", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07004895882873384, "ground_truth": 0}, {"key": "36217333", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14223188270065448, "ground_truth": 0}, {"key": "36217333", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.259825651586389, "ground_truth": 0}, {"key": "36217333", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920292052615043, "ground_truth": 0}, {"key": "30816523", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2814056212826157, "ground_truth": 0}, {"key": "30816523", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22270014109493164, "ground_truth": 0}, {"key": "30816523", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2005576698039553, "ground_truth": 0}, {"key": "30816523", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.299105180100697, "ground_truth": 0}, {"key": "30816523", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16026602886027025, "ground_truth": 0}, {"key": "38900884", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.790530291730276, "ground_truth": 0}, {"key": "38900884", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4668455856376632, "ground_truth": 0}, {"key": "38900884", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7217432104948328, "ground_truth": 0}, {"key": "38900884", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020616039103602, "ground_truth": 0}, {"key": "38900884", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548534833701, "ground_truth": 0}, {"key": "13890581", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3886180367940306, "ground_truth": 0}, {"key": "13890581", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35756751091884287, "ground_truth": 0}, {"key": "13890581", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3157359689794279, "ground_truth": 0}, {"key": "13890581", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295601018002, "ground_truth": 0}, {"key": "13890581", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1699562176555699, "ground_truth": 0}, {"key": "40194700", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.509764371831468, "ground_truth": 0}, {"key": "40194700", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4668456105766453, "ground_truth": 0}, {"key": "40194700", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5755880064852862, "ground_truth": 0}, {"key": "40194700", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804507558095, "ground_truth": 0}, {"key": "40194700", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014192784616, "ground_truth": 0}, {"key": "37903647", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0660853740104279, "ground_truth": 0}, {"key": "37903647", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12002563680530015, "ground_truth": 0}, {"key": "37903647", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09073548815530834, "ground_truth": 0}, {"key": "37903647", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0960254934820971, "ground_truth": 0}, {"key": "37903647", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336561413876224, "ground_truth": 0}, {"key": "13291223", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3998116306860021, "ground_truth": 0}, {"key": "13291223", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27512975499931097, "ground_truth": 0}, {"key": "13291223", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19436782167658373, "ground_truth": 0}, {"key": "13291223", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2018132185467044, "ground_truth": 0}, {"key": "13291223", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733340773843163, "ground_truth": 0}, {"key": "36052570", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13939638580500763, "ground_truth": 0}, {"key": "36052570", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16451645065206946, "ground_truth": 0}, {"key": "36052570", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845760156279339, "ground_truth": 0}, {"key": "36052570", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451646559271518, "ground_truth": 0}, {"key": "36052570", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14706450595108128, "ground_truth": 0}, {"key": "34944735", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.264358370933927, "ground_truth": 0}, {"key": "34944735", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643656867505, "ground_truth": 0}, {"key": "34944735", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736784079029206, "ground_truth": 0}, {"key": "34944735", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512722574111, "ground_truth": 0}, {"key": "34944735", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578621048131, "ground_truth": 0}, {"key": "32159602", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15817436256617132, "ground_truth": 0}, {"key": "32159602", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.451326518025921, "ground_truth": 0}, {"key": "32159602", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.484380073261415, "ground_truth": 0}, {"key": "32159602", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678141952147, "ground_truth": 0}, {"key": "32159602", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519861593367306, "ground_truth": 0}, {"key": "34988915", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2094697031551239, "ground_truth": 0}, {"key": "34988915", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18242553449212792, "ground_truth": 0}, {"key": "34988915", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08945459782988832, "ground_truth": 0}, {"key": "34988915", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1267851670641365, "ground_truth": 0}, {"key": "34988915", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676400853623295, "ground_truth": 0}, {"key": "37889203", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165274925791, "ground_truth": 0}, {"key": "37889203", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.527316529213247, "ground_truth": 0}, {"key": "37889203", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43782349427788475, "ground_truth": 0}, {"key": "37889203", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633651759767, "ground_truth": 0}, {"key": "37889203", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356686995043783, "ground_truth": 0}, {"key": "33609927", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3702253827701347, "ground_truth": 0}, {"key": "33609927", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43398148448469775, "ground_truth": 0}, {"key": "33609927", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2553436470460017, "ground_truth": 0}, {"key": "33609927", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.264358356008019, "ground_truth": 0}, {"key": "33609927", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436483534247, "ground_truth": 0}, {"key": "33578778", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2422056408964898, "ground_truth": 0}, {"key": "33578778", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2081789254984409, "ground_truth": 0}, {"key": "33578778", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27048022873367356, "ground_truth": 0}, {"key": "33578778", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1732882006005596, "ground_truth": 0}, {"key": "33578778", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10970577255265326, "ground_truth": 0}, {"key": "36888270", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39606815585872773, "ground_truth": 0}, {"key": "36888270", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3468730930479531, "ground_truth": 0}, {"key": "36888270", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5448013818352238, "ground_truth": 0}, {"key": "36888270", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404167344506083, "ground_truth": 0}, {"key": "36888270", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601152740381305, "ground_truth": 0}, {"key": "36846007", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6959583345790792, "ground_truth": 0}, {"key": "36846007", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6548947124026583, "ground_truth": 0}, {"key": "36846007", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7008947808270318, "ground_truth": 0}, {"key": "36846007", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637608116162, "ground_truth": 0}, {"key": "36846007", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701032407908, "ground_truth": 0}, {"key": "31723471", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.411110853124729, "ground_truth": 0}, {"key": "31723471", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5698526423862266, "ground_truth": 0}, {"key": "31723471", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.540923848172202, "ground_truth": 0}, {"key": "31723471", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687307743077883, "ground_truth": 0}, {"key": "31723471", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397334289552, "ground_truth": 0}, {"key": "15921828", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24798745109975584, "ground_truth": 0}, {"key": "15921828", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41489886610602694, "ground_truth": 0}, {"key": "15921828", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6334102652191124, "ground_truth": 0}, {"key": "15921828", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651622736402242, "ground_truth": 0}, {"key": "15921828", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398629323943326, "ground_truth": 0}, {"key": "39109408", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2295352065644833, "ground_truth": 0}, {"key": "39109408", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34158249827267656, "ground_truth": 0}, {"key": "39109408", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3738758260548005, "ground_truth": 0}, {"key": "39109408", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919328003346172, "ground_truth": 0}, {"key": "39109408", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193278701395988, "ground_truth": 0}, {"key": "20936833", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08632347713404377, "ground_truth": 0}, {"key": "20936833", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08449276199124996, "ground_truth": 0}, {"key": "20936833", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07751765528493326, "ground_truth": 0}, {"key": "20936833", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.05791808712922381, "ground_truth": 0}, {"key": "20936833", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11047114252247939, "ground_truth": 0}, {"key": "36832879", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2553436569294673, "ground_truth": 0}, {"key": "36832879", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3056973163105271, "ground_truth": 0}, {"key": "36832879", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3433417013920091, "ground_truth": 0}, {"key": "36832879", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405545139802568, "ground_truth": 0}, {"key": "36832879", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398328545879, "ground_truth": 0}, {"key": "14958201", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2958398577376692, "ground_truth": 0}, {"key": "14958201", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733750880943437, "ground_truth": 0}, {"key": "14958201", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17895590880602522, "ground_truth": 0}, {"key": "14958201", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256354688675, "ground_truth": 0}, {"key": "14958201", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580116333903, "ground_truth": 0}, {"key": "34352262", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594721222570013, "ground_truth": 0}, {"key": "34352262", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45713672786705856, "ground_truth": 0}, {"key": "34352262", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3259495240467938, "ground_truth": 0}, {"key": "34352262", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386101882207773, "ground_truth": 0}, {"key": "34352262", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2643583635006885, "ground_truth": 0}, {"key": "39805395", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15304215953255565, "ground_truth": 0}, {"key": "39805395", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16238002465864768, "ground_truth": 0}, {"key": "39805395", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36116471853004267, "ground_truth": 0}, {"key": "39805395", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776335001455772, "ground_truth": 0}, {"key": "39805395", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651623449103357, "ground_truth": 0}, {"key": "34303109", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23510839285678914, "ground_truth": 0}, {"key": "34303109", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1470645335607896, "ground_truth": 0}, {"key": "34303109", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2720245688062062, "ground_truth": 0}, {"key": "34303109", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077461036220985, "ground_truth": 0}, {"key": "34303109", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2043418995392781, "ground_truth": 0}, {"key": "39939090", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7577943618290114, "ground_truth": 0}, {"key": "39939090", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6893056091203263, "ground_truth": 0}, {"key": "39939090", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43782349411848526, "ground_truth": 0}, {"key": "39939090", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746024733869866, "ground_truth": 0}, {"key": "39939090", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632895698464, "ground_truth": 0}, {"key": "29347771", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19314737716161767, "ground_truth": 0}, {"key": "29347771", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2254166110393699, "ground_truth": 0}, {"key": "29347771", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2213506729279327, "ground_truth": 0}, {"key": "29347771", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730029973905, "ground_truth": 0}, {"key": "29347771", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434189932011962, "ground_truth": 0}, {"key": "36783415", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7386690833304894, "ground_truth": 0}, {"key": "36783415", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441201371569914, "ground_truth": 0}, {"key": "36783415", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.544801401777712, "ground_truth": 0}, {"key": "36783415", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681577792589, "ground_truth": 0}, {"key": "36783415", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406784395163, "ground_truth": 0}, {"key": "37935687", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16667541470467243, "ground_truth": 0}, {"key": "37935687", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1710611946319191, "ground_truth": 0}, {"key": "37935687", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17441027468292788, "ground_truth": 0}, {"key": "37935687", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13206614728423607, "ground_truth": 0}, {"key": "37935687", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.206894061506053, "ground_truth": 0}, {"key": "40260829", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5331543734066381, "ground_truth": 0}, {"key": "40260829", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5058590719185839, "ground_truth": 0}, {"key": "40260829", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3007455880739295, "ground_truth": 0}, {"key": "40260829", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907616310457316, "ground_truth": 0}, {"key": "40260829", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.531209354546443, "ground_truth": 0}, {"key": "36478199", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3191213718247343, "ground_truth": 0}, {"key": "36478199", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4167966324664342, "ground_truth": 0}, {"key": "36478199", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2081789321262516, "ground_truth": 0}, {"key": "36478199", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31236999458173287, "ground_truth": 0}, {"key": "36478199", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792987479768454, "ground_truth": 0}, {"key": "34541803", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3757064598250455, "ground_truth": 0}, {"key": "34541803", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12940272363005095, "ground_truth": 0}, {"key": "34541803", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29583988568164504, "ground_truth": 0}, {"key": "34541803", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213300762315, "ground_truth": 0}, {"key": "34541803", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682620982277377, "ground_truth": 0}, {"key": "35360841", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37754067074291797, "ground_truth": 0}, {"key": "35360841", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389832516527977, "ground_truth": 0}, {"key": "35360841", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1347759200244433, "ground_truth": 0}, {"key": "35360841", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939171849422894, "ground_truth": 0}, {"key": "35360841", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132649675560643, "ground_truth": 0}, {"key": "35550407", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15921741910486037, "ground_truth": 0}, {"key": "35550407", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14804719425921836, "ground_truth": 0}, {"key": "35550407", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28776782220066455, "ground_truth": 0}, {"key": "35550407", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10521053741302978, "ground_truth": 0}, {"key": "35550407", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13028542200064616, "ground_truth": 0}, {"key": "37561590", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1907240215945426, "ground_truth": 0}, {"key": "37561590", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.525368803550176, "ground_truth": 0}, {"key": "37561590", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688394471414, "ground_truth": 0}, {"key": "37561590", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519862780783554, "ground_truth": 0}, {"key": "37561590", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917021727362, "ground_truth": 0}, {"key": "39328843", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3830641675257258, "ground_truth": 0}, {"key": "39328843", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5679365847460612, "ground_truth": 0}, {"key": "39328843", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6261242178339792, "ground_truth": 0}, {"key": "39328843", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015688942225, "ground_truth": 0}, {"key": "39328843", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852882930693974, "ground_truth": 0}, {"key": "35389665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7704647761318106, "ground_truth": 0}, {"key": "35389665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7371581714982821, "ground_truth": 0}, {"key": "35389665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8679338439104308, "ground_truth": 0}, {"key": "35389665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526275210904, "ground_truth": 0}, {"key": "35389665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784143196828, "ground_truth": 0}, {"key": "33080187", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25832598738149437, "ground_truth": 0}, {"key": "33080187", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17106117772941784, "ground_truth": 0}, {"key": "33080187", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21337717421536334, "ground_truth": 0}, {"key": "33080187", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306417708017826, "ground_truth": 0}, {"key": "33080187", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27982850374467466, "ground_truth": 0}, {"key": "38636995", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.240774591994917, "ground_truth": 0}, {"key": "38636995", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.212068800511518, "ground_truth": 0}, {"key": "38636995", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14033624875767495, "ground_truth": 0}, {"key": "38636995", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.130285426703943, "ground_truth": 0}, {"key": "38636995", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09073548708537688, "ground_truth": 0}, {"key": "18536236", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29098086077008833, "ground_truth": 0}, {"key": "18536236", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34158248666460234, "ground_truth": 0}, {"key": "18536236", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24077459141662205, "ground_truth": 0}, {"key": "18536236", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1755380681089309, "ground_truth": 0}, {"key": "18536236", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16559311404634777, "ground_truth": 0}, {"key": "36289151", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16026603154789695, "ground_truth": 0}, {"key": "36289151", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20434190443656147, "ground_truth": 0}, {"key": "36289151", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1789558899323135, "ground_truth": 0}, {"key": "36289151", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13206615048147932, "ground_truth": 0}, {"key": "36289151", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641741249544, "ground_truth": 0}, {"key": "23017045", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33807713231788356, "ground_truth": 0}, {"key": "23017045", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5156198978374846, "ground_truth": 0}, {"key": "23017045", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5832033532463377, "ground_truth": 0}, {"key": "23017045", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935497835209, "ground_truth": 0}, {"key": "23017045", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408655362767, "ground_truth": 0}, {"key": "36418082", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2450849998645161, "ground_truth": 0}, {"key": "36418082", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14414884992295257, "ground_truth": 0}, {"key": "36418082", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3259495244855009, "ground_truth": 0}, {"key": "36418082", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047115355086749, "ground_truth": 0}, {"key": "36418082", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1044773209106948, "ground_truth": 0}, {"key": "34396551", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16026603873563666, "ground_truth": 0}, {"key": "34396551", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26740816495571035, "ground_truth": 0}, {"key": "34396551", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2133771694182138, "ground_truth": 0}, {"key": "34396551", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0670562836641826, "ground_truth": 0}, {"key": "34396551", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757214395103333, "ground_truth": 0}, {"key": "39720944", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6132365550748609, "ground_truth": 0}, {"key": "39720944", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4882833737579502, "ground_truth": 0}, {"key": "39720944", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5717666016766035, "ground_truth": 0}, {"key": "39720944", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539862947713545, "ground_truth": 0}, {"key": "39720944", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742627205834073, "ground_truth": 0}, {"key": "35884842", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13939638185246853, "ground_truth": 0}, {"key": "35884842", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11124122310089167, "ground_truth": 0}, {"key": "35884842", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07807816174381157, "ground_truth": 0}, {"key": "35884842", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954195413968, "ground_truth": 0}, {"key": "35884842", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12852512793546964, "ground_truth": 0}, {"key": "35403375", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07978201609680159, "ground_truth": 0}, {"key": "35403375", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1613202334825838, "ground_truth": 0}, {"key": "35403375", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940272945532322, "ground_truth": 0}, {"key": "35403375", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071004685464, "ground_truth": 0}, {"key": "35403375", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127974426343, "ground_truth": 0}, {"key": "26341324", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4339814327560797, "ground_truth": 0}, {"key": "26341324", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.533154430196423, "ground_truth": 0}, {"key": "26341324", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3886180287933552, "ground_truth": 0}, {"key": "26341324", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990400464895, "ground_truth": 0}, {"key": "26341324", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740360022766, "ground_truth": 0}, {"key": "19212345", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22000709976445434, "ground_truth": 0}, {"key": "19212345", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.292595287946842, "ground_truth": 0}, {"key": "19212345", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3157359920992328, "ground_truth": 0}, {"key": "19212345", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035935845827, "ground_truth": 0}, {"key": "19212345", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256282106206, "ground_truth": 0}, {"key": "30548367", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30239107258075054, "ground_truth": 0}, {"key": "30548367", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28776783017645396, "ground_truth": 0}, {"key": "30548367", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39047583353225584, "ground_truth": 0}, {"key": "30548367", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687310552570627, "ground_truth": 0}, {"key": "30548367", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.203074623886376, "ground_truth": 0}, {"key": "37919402", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6584174789158962, "ground_truth": 0}, {"key": "37919402", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.525368824250221, "ground_truth": 0}, {"key": "37919402", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6926419900540394, "ground_truth": 0}, {"key": "37919402", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881427554195, "ground_truth": 0}, {"key": "37919402", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526681099049, "ground_truth": 0}, {"key": "39995133", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891457735516, "ground_truth": 0}, {"key": "39995133", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7279754492620093, "ground_truth": 0}, {"key": "39995133", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3720487995234934, "ground_truth": 0}, {"key": "39995133", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526204465404, "ground_truth": 0}, {"key": "39995133", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512972382098766, "ground_truth": 0}, {"key": "40249088", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.320821294484828, "ground_truth": 0}, {"key": "40249088", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38861801504440374, "ground_truth": 0}, {"key": "40249088", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2146914132572006, "ground_truth": 0}, {"key": "40249088", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386101894045116, "ground_truth": 0}, {"key": "40249088", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357436690141407, "ground_truth": 0}, {"key": "40254388", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2974699432286959, "ground_truth": 0}, {"key": "40254388", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2674081603094842, "ground_truth": 0}, {"key": "40254388", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22000710732768097, "ground_truth": 0}, {"key": "40254388", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231015922196924, "ground_truth": 0}, {"key": "40254388", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259832111719, "ground_truth": 0}, {"key": "31995230", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19682620591524028, "ground_truth": 0}, {"key": "31995230", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19682620762916905, "ground_truth": 0}, {"key": "31995230", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19314738891203034, "ground_truth": 0}, {"key": "31995230", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897079814173, "ground_truth": 0}, {"key": "31995230", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118645023283, "ground_truth": 0}, {"key": "38632129", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4513265390937719, "ground_truth": 0}, {"key": "38632129", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4378234890252344, "ground_truth": 0}, {"key": "38632129", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6388352835409264, "ground_truth": 0}, {"key": "38632129", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213357297424, "ground_truth": 0}, {"key": "38632129", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291151603621, "ground_truth": 0}, {"key": "35720795", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4980468426203611, "ground_truth": 0}, {"key": "35720795", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26284180989477857, "ground_truth": 0}, {"key": "35720795", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4571366882614033, "ground_truth": 0}, {"key": "35720795", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149666333034, "ground_truth": 0}, {"key": "35720795", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588048680100124, "ground_truth": 0}, {"key": "23906759", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09534946147395813, "ground_truth": 0}, {"key": "23906759", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12592276668424005, "ground_truth": 0}, {"key": "23906759", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14128142381961617, "ground_truth": 0}, {"key": "23906759", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720117951768, "ground_truth": 0}, {"key": "23906759", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076630121334217, "ground_truth": 0}, {"key": "19410108", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10017222320399649, "ground_truth": 0}, {"key": "19410108", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.747615967848332, "ground_truth": 0}, {"key": "19410108", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3757064629133685, "ground_truth": 0}, {"key": "19410108", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748462282687, "ground_truth": 0}, {"key": "19410108", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940588363884, "ground_truth": 0}, {"key": "30745137", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37204876037286483, "ground_truth": 0}, {"key": "30745137", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925952657458149, "ground_truth": 0}, {"key": "30745137", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16995624605996706, "ground_truth": 0}, {"key": "30745137", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509790841184, "ground_truth": 0}, {"key": "30745137", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017724530566, "ground_truth": 0}, {"key": "26553115", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4668456190900027, "ground_truth": 0}, {"key": "26553115", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3140505560826782, "ground_truth": 0}, {"key": "26553115", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4746311813101187, "ground_truth": 0}, {"key": "26553115", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356105518612, "ground_truth": 0}, {"key": "26553115", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2281564871175333, "ground_truth": 0}, {"key": "37872311", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6706082717003473, "ground_truth": 0}, {"key": "37872311", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381630801625, "ground_truth": 0}, {"key": "37872311", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4111108810823205, "ground_truth": 0}, {"key": "37872311", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125886182796, "ground_truth": 0}, {"key": "37872311", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127606923057, "ground_truth": 0}, {"key": "35553131", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6315943192266049, "ground_truth": 0}, {"key": "35553131", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6992544336025828, "ground_truth": 0}, {"key": "35553131", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5602526340498794, "ground_truth": 0}, {"key": "35553131", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570648664379735, "ground_truth": 0}, {"key": "35553131", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318189059529, "ground_truth": 0}, {"key": "39038936", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19682620388933555, "ground_truth": 0}, {"key": "39038936", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22678362931022666, "ground_truth": 0}, {"key": "39038936", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18832398441988848, "ground_truth": 0}, {"key": "39038936", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10017222348646328, "ground_truth": 0}, {"key": "39038936", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000710354918468, "ground_truth": 0}, {"key": "38735486", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9304582558189854, "ground_truth": 0}, {"key": "38735486", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9693241980768337, "ground_truth": 0}, {"key": "38735486", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9358173580592933, "ground_truth": 0}, {"key": "38735486", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.942081913069703, "ground_truth": 0}, {"key": "38735486", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896785442605, "ground_truth": 0}, {"key": "17087845", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3380771253119647, "ground_truth": 0}, {"key": "17087845", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14414885203612254, "ground_truth": 0}, {"key": "17087845", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1422318870696165, "ground_truth": 0}, {"key": "17087845", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2365162228202365, "ground_truth": 0}, {"key": "17087845", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316472067715733, "ground_truth": 0}, {"key": "37443011", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2766905441887886, "ground_truth": 0}, {"key": "37443011", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1907240228956286, "ground_truth": 0}, {"key": "37443011", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940272947110537, "ground_truth": 0}, {"key": "37443011", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116473626138257, "ground_truth": 0}, {"key": "37443011", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3157359701675129, "ground_truth": 0}, {"key": "36855749", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667160435387919, "ground_truth": 0}, {"key": "36855749", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2337063545700276, "ground_truth": 0}, {"key": "36855749", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798284860459195, "ground_truth": 0}, {"key": "36855749", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259530318837745, "ground_truth": 0}, {"key": "36855749", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939170323979045, "ground_truth": 0}, {"key": "35613141", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24220562887153246, "ground_truth": 0}, {"key": "35613141", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4571367268075765, "ground_truth": 0}, {"key": "35613141", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523277517786, "ground_truth": 0}, {"key": "35613141", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937837126160645, "ground_truth": 0}, {"key": "35613141", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09534945691479778, "ground_truth": 0}, {"key": "39088847", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5350984191344951, "ground_truth": 0}, {"key": "39088847", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3575675109894073, "ground_truth": 0}, {"key": "39088847", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5175709148252166, "ground_truth": 0}, {"key": "39088847", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995950095801, "ground_truth": 0}, {"key": "39088847", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791897803935, "ground_truth": 0}, {"key": "33197277", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5292633818451026, "ground_truth": 0}, {"key": "33197277", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.569852648381013, "ground_truth": 0}, {"key": "33197277", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6654105561573248, "ground_truth": 0}, {"key": "33197277", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350696146916, "ground_truth": 0}, {"key": "33197277", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765003145679, "ground_truth": 0}, {"key": "33815489", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18359362895242268, "ground_truth": 0}, {"key": "33815489", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14128141686379303, "ground_truth": 0}, {"key": "33815489", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.024237634663290635, "ground_truth": 0}, {"key": "33815489", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.04401865472370283, "ground_truth": 0}, {"key": "33815489", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.04603389869259908, "ground_truth": 0}, {"key": "35862754", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2814056304312818, "ground_truth": 0}, {"key": "35862754", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3242353891744722, "ground_truth": 0}, {"key": "35862754", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32766829207573783, "ground_truth": 0}, {"key": "35862754", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590149550261514, "ground_truth": 0}, {"key": "35862754", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2043418781335822, "ground_truth": 0}, {"key": "36080615", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2281565136959298, "ground_truth": 0}, {"key": "36080615", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15304215829600118, "ground_truth": 0}, {"key": "36080615", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2186693873835058, "ground_truth": 0}, {"key": "36080615", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.314050540839862, "ground_truth": 0}, {"key": "36080615", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1943678124479533, "ground_truth": 0}, {"key": "22822742", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7401743632466145, "ground_truth": 0}, {"key": "22822742", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6601723668377205, "ground_truth": 0}, {"key": "22822742", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6388353102690841, "ground_truth": 0}, {"key": "22822742", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633151961607934, "ground_truth": 0}, {"key": "22822742", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688166242325, "ground_truth": 0}, {"key": "39747536", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.52147116624344, "ground_truth": 0}, {"key": "39747536", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36116471501211594, "ground_truth": 0}, {"key": "39747536", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310356071519, "ground_truth": 0}, {"key": "39747536", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881432981937, "ground_truth": 0}, {"key": "39747536", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606817461628113, "ground_truth": 0}, {"key": "34218396", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10302443509442637, "ground_truth": 0}, {"key": "34218396", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2689414473276533, "ground_truth": 0}, {"key": "34218396", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2942149630100806, "ground_truth": 0}, {"key": "34218396", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468730684630908, "ground_truth": 0}, {"key": "34218396", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601153991504815, "ground_truth": 0}, {"key": "39150388", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18952109534747463, "ground_truth": 0}, {"key": "39150388", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.09807932250553626, "ground_truth": 0}, {"key": "39150388", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16667540377274076, "ground_truth": 0}, {"key": "39150388", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334898707263, "ground_truth": 0}, {"key": "39150388", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930801295301012, "ground_truth": 0}, {"key": "28765782", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3242353740748275, "ground_truth": 0}, {"key": "28765782", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40168780170304247, "ground_truth": 0}, {"key": "28765782", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1581743521345285, "ground_truth": 0}, {"key": "28765782", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356045124186, "ground_truth": 0}, {"key": "28765782", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861801994691786, "ground_truth": 0}, {"key": "35828022", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0973903969339297, "ground_truth": 0}, {"key": "35828022", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35756754735561364, "ground_truth": 0}, {"key": "35828022", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5175708782675803, "ground_truth": 0}, {"key": "35828022", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2240554660816199, "ground_truth": 0}, {"key": "35828022", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "27717735", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1081889557041774, "ground_truth": 0}, {"key": "27717735", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30735801524777745, "ground_truth": 0}, {"key": "27717735", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10521054151839965, "ground_truth": 0}, {"key": "27717735", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685297890503, "ground_truth": 0}, {"key": "27717735", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238003020975164, "ground_truth": 0}, {"key": "37977826", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.299105193020409, "ground_truth": 0}, {"key": "37977826", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38491215522883204, "ground_truth": 0}, {"key": "37977826", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24798742998377157, "ground_truth": 0}, {"key": "37977826", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583454733456, "ground_truth": 0}, {"key": "37977826", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1677633597263936, "ground_truth": 0}, {"key": "31768588", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8311430595139997, "ground_truth": 0}, {"key": "31768588", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7310585879455728, "ground_truth": 0}, {"key": "31768588", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4765796375060498, "ground_truth": 0}, {"key": "31768588", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030966281725, "ground_truth": 0}, {"key": "31768588", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.720171517492238, "ground_truth": 0}, {"key": "37183351", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1530421598597695, "ground_truth": 0}, {"key": "37183351", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23370636300266867, "ground_truth": 0}, {"key": "37183351", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.053403330997504474, "ground_truth": 0}, {"key": "37183351", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958787852462, "ground_truth": 0}, {"key": "37183351", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1242130047573806, "ground_truth": 0}, {"key": "39622090", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22541660982158623, "ground_truth": 0}, {"key": "39622090", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16451647910905934, "ground_truth": 0}, {"key": "39622090", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17441028664561467, "ground_truth": 0}, {"key": "39622090", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553807974146116, "ground_truth": 0}, {"key": "39622090", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357959378364968, "ground_truth": 0}, {"key": "39272756", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3363310379673188, "ground_truth": 0}, {"key": "39272756", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41679665347795813, "ground_truth": 0}, {"key": "39272756", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523173189939, "ground_truth": 0}, {"key": "39272756", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052532305674, "ground_truth": 0}, {"key": "39272756", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046276914603, "ground_truth": 0}, {"key": "32138822", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2583259729881354, "ground_truth": 0}, {"key": "32138822", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37570647246427635, "ground_truth": 0}, {"key": "32138822", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27048021789124094, "ground_truth": 0}, {"key": "32138822", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938309736023, "ground_truth": 0}, {"key": "32138822", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276682813311431, "ground_truth": 0}, {"key": "31070114", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2925953155607703, "ground_truth": 0}, {"key": "31070114", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398789171859, "ground_truth": 0}, {"key": "31070114", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2553436374589788, "ground_truth": 0}, {"key": "31070114", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610490332253935, "ground_truth": 0}, {"key": "31070114", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270013582713039, "ground_truth": 0}, {"key": "39652762", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5448013911351323, "ground_truth": 0}, {"key": "39652762", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5195213282735889, "ground_truth": 0}, {"key": "39652762", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7106283311111108, "ground_truth": 0}, {"key": "39652762", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679073835433, "ground_truth": 0}, {"key": "39652762", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526373077833, "ground_truth": 0}, {"key": "33258866", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1375324723253263, "ground_truth": 0}, {"key": "33258866", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32082129688520755, "ground_truth": 0}, {"key": "33258866", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13753245812731268, "ground_truth": 0}, {"key": "33258866", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2583259786004904, "ground_truth": 0}, {"key": "33258866", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328819557043332, "ground_truth": 0}, {"key": "36962388", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17441028090402397, "ground_truth": 0}, {"key": "36962388", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17217185642826524, "ground_truth": 0}, {"key": "36962388", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310349178419, "ground_truth": 0}, {"key": "36962388", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386748691301975, "ground_truth": 0}, {"key": "36962388", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709274372435, "ground_truth": 0}, {"key": "32282272", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09203286027661835, "ground_truth": 0}, {"key": "32282272", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06008665108901299, "ground_truth": 0}, {"key": "32282272", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1847675126479812, "ground_truth": 0}, {"key": "32282272", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06371499394748716, "ground_truth": 0}, {"key": "32282272", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608723837995274, "ground_truth": 0}, {"key": "36093072", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7356416352385465, "ground_truth": 0}, {"key": "36093072", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5755880063809939, "ground_truth": 0}, {"key": "36093072", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6001883456463778, "ground_truth": 0}, {"key": "36093072", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640087195039, "ground_truth": 0}, {"key": "36093072", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819703908234, "ground_truth": 0}, {"key": "38879972", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4416730094897662, "ground_truth": 0}, {"key": "38879972", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3486451400907329, "ground_truth": 0}, {"key": "38879972", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42059957336628084, "ground_truth": 0}, {"key": "38879972", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4225046126264121, "ground_truth": 0}, {"key": "38879972", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982761824127106, "ground_truth": 0}, {"key": "32106473", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11357958571009863, "ground_truth": 0}, {"key": "32106473", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19193279565125929, "ground_truth": 0}, {"key": "32106473", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940273687387302, "ground_truth": 0}, {"key": "32106473", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074556331005897, "ground_truth": 0}, {"key": "32106473", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838510473090998, "ground_truth": 0}, {"key": "40415815", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09739039760330369, "ground_truth": 0}, {"key": "40415815", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13386749367466552, "ground_truth": 0}, {"key": "40415815", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10594827610899542, "ground_truth": 0}, {"key": "40415815", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934932017522417, "ground_truth": 0}, {"key": "40415815", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10374863178021043, "ground_truth": 0}, {"key": "34581918", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08269734573276767, "ground_truth": 0}, {"key": "34581918", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12085322702367786, "ground_truth": 0}, {"key": "34581918", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15203224731685738, "ground_truth": 0}, {"key": "34581918", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.049222113658127405, "ground_truth": 0}, {"key": "34581918", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072402156081264, "ground_truth": 0}, {"key": "33004157", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4186969243379915, "ground_truth": 0}, {"key": "33004157", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033800943561, "ground_truth": 0}, {"key": "33004157", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6388352536713336, "ground_truth": 0}, {"key": "33004157", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690871293687, "ground_truth": 0}, {"key": "33004157", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224305064224, "ground_truth": 0}, {"key": "30334943", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7264256287241629, "ground_truth": 0}, {"key": "30334943", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7233094853740193, "ground_truth": 0}, {"key": "30334943", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936414635740765, "ground_truth": 0}, {"key": "30334943", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539563709325, "ground_truth": 0}, {"key": "30334943", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.540923892826697, "ground_truth": 0}, {"key": "33280503", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43398146752831784, "ground_truth": 0}, {"key": "33280503", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41300357826040507, "ground_truth": 0}, {"key": "33280503", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910939382595, "ground_truth": 0}, {"key": "33280503", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25683200556064933, "ground_truth": 0}, {"key": "33280503", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056117797927, "ground_truth": 0}, {"key": "25726782", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.449392633769293, "ground_truth": 0}, {"key": "25726782", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31405055085751105, "ground_truth": 0}, {"key": "25726782", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5019530914827602, "ground_truth": 0}, {"key": "25726782", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519859796800893, "ground_truth": 0}, {"key": "25726782", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477755489456076, "ground_truth": 0}, {"key": "35479854", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22541660984097345, "ground_truth": 0}, {"key": "35479854", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47657965807072317, "ground_truth": 0}, {"key": "35479854", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4687906300014284, "ground_truth": 0}, {"key": "35479854", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.48242911014115536, "ground_truth": 0}, {"key": "35479854", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922079617930524, "ground_truth": 0}, {"key": "32716226", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35936416188412706, "ground_truth": 0}, {"key": "32716226", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25832598166397225, "ground_truth": 0}, {"key": "32716226", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1677633400012255, "ground_truth": 0}, {"key": "32716226", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832598735820406, "ground_truth": 0}, {"key": "32716226", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506791205277, "ground_truth": 0}, {"key": "37047554", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3106943936841978, "ground_truth": 0}, {"key": "37047554", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49804688606231723, "ground_truth": 0}, {"key": "37047554", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26894142838896684, "ground_truth": 0}, {"key": "37047554", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1320661535924646, "ground_truth": 0}, {"key": "37047554", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575750995791, "ground_truth": 0}, {"key": "36565290", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15203224413318053, "ground_truth": 0}, {"key": "36565290", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1366083934185915, "ground_truth": 0}, {"key": "36565290", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3451052512460832, "ground_truth": 0}, {"key": "36565290", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.531209369083145, "ground_truth": 0}, {"key": "36565290", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678291992479, "ground_truth": 0}, {"key": "27758640", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.397938394476218, "ground_truth": 0}, {"key": "27758640", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2861692511639468, "ground_truth": 0}, {"key": "27758640", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34334171498404475, "ground_truth": 0}, {"key": "27758640", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845760072283618, "ground_truth": 0}, {"key": "27758640", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879064739315557, "ground_truth": 0}, {"key": "28897118", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5467381707717728, "ground_truth": 0}, {"key": "28897118", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4378234955251584, "ground_truth": 0}, {"key": "28897118", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7732163729283523, "ground_truth": 0}, {"key": "28897118", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.616935825379364, "ground_truth": 0}, {"key": "28897118", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2227001465421589, "ground_truth": 0}, {"key": "38452661", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4493926419143526, "ground_truth": 0}, {"key": "38452661", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019530926164414, "ground_truth": 0}, {"key": "38452661", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29098088482489953, "ground_truth": 0}, {"key": "38452661", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588046820680805, "ground_truth": 0}, {"key": "38452661", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09401018514408722, "ground_truth": 0}, {"key": "38033492", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1801066639937661, "ground_truth": 0}, {"key": "38033492", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2751297237553127, "ground_truth": 0}, {"key": "38033492", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4167966462341659, "ground_truth": 0}, {"key": "38033492", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109420382976, "ground_truth": 0}, {"key": "38033492", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825680089675003, "ground_truth": 0}, {"key": "35949555", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8940517209666122, "ground_truth": 0}, {"key": "35949555", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7943849543027428, "ground_truth": 0}, {"key": "35949555", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6636689489813378, "ground_truth": 0}, {"key": "35949555", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493099260662, "ground_truth": 0}, {"key": "35949555", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.638835279925839, "ground_truth": 0}, {"key": "15263826", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24077460354015418, "ground_truth": 0}, {"key": "15263826", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26588047611490595, "ground_truth": 0}, {"key": "15263826", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2643583577285959, "ground_truth": 0}, {"key": "15263826", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337717024531327, "ground_truth": 0}, {"key": "15263826", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455691061981, "ground_truth": 0}, {"key": "37313866", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41679663869309747, "ground_truth": 0}, {"key": "37313866", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14223189274193984, "ground_truth": 0}, {"key": "37313866", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10158945445002834, "ground_truth": 0}, {"key": "37313866", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15507847669281483, "ground_truth": 0}, {"key": "37313866", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421302610232948, "ground_truth": 0}, {"key": "13911157", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5621764791798728, "ground_truth": 0}, {"key": "13911157", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.749087230496969, "ground_truth": 0}, {"key": "13911157", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7606506504716798, "ground_truth": 0}, {"key": "13911157", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445502879011, "ground_truth": 0}, {"key": "13911157", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575751656154, "ground_truth": 0}, {"key": "39594894", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4590761285790887, "ground_truth": 0}, {"key": "39594894", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.585101142975492, "ground_truth": 0}, {"key": "39594894", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29098084958522696, "ground_truth": 0}, {"key": "39594894", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199244918035, "ground_truth": 0}, {"key": "39594894", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035767093148, "ground_truth": 0}, {"key": "34096170", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20434190197343166, "ground_truth": 0}, {"key": "34096170", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21076632110878807, "ground_truth": 0}, {"key": "34096170", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3242354131033384, "ground_truth": 0}, {"key": "34096170", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815651816725963, "ground_truth": 0}, {"key": "34096170", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678517288850838, "ground_truth": 0}, {"key": "37891952", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7295197892960547, "ground_truth": 0}, {"key": "37891952", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7662936351354676, "ground_truth": 0}, {"key": "37891952", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8633916165993032, "ground_truth": 0}, {"key": "37891952", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672048024601, "ground_truth": 0}, {"key": "37891952", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.734119527274072, "ground_truth": 0}, {"key": "40186158", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37387579552957756, "ground_truth": 0}, {"key": "40186158", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1208532368603261, "ground_truth": 0}, {"key": "40186158", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2861692624153417, "ground_truth": 0}, {"key": "40186158", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106118534381962, "ground_truth": 0}, {"key": "40186158", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676400153705133, "ground_truth": 0}, {"key": "37049719", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35042137698197845, "ground_truth": 0}, {"key": "37049719", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16995622525632165, "ground_truth": 0}, {"key": "37049719", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26588047099467066, "ground_truth": 0}, {"key": "37049719", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418474972515, "ground_truth": 0}, {"key": "37049719", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102779835251715, "ground_truth": 0}, {"key": "34610504", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.651354868555587, "ground_truth": 0}, {"key": "34610504", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7563575667624728, "ground_truth": 0}, {"key": "34610504", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5486735083920047, "ground_truth": 0}, {"key": "34610504", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44167301090092487, "ground_truth": 0}, {"key": "34610504", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056052627318, "ground_truth": 0}, {"key": "37595429", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6315943114968096, "ground_truth": 0}, {"key": "37595429", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "37595429", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33111973692310726, "ground_truth": 0}, {"key": "37595429", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035461497475, "ground_truth": 0}, {"key": "37595429", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310502430415, "ground_truth": 0}, {"key": "29772670", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4320633966774512, "ground_truth": 0}, {"key": "29772670", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6654105459217255, "ground_truth": 0}, {"key": "29772670", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7248702779604029, "ground_truth": 0}, {"key": "29772670", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474603186442195, "ground_truth": 0}, {"key": "29772670", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413934678951, "ground_truth": 0}, {"key": "36369872", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2553436631480954, "ground_truth": 0}, {"key": "36369872", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08449275887835941, "ground_truth": 0}, {"key": "36369872", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18359362714185526, "ground_truth": 0}, {"key": "36369872", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1581743431557138, "ground_truth": 0}, {"key": "36369872", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10970577217152526, "ground_truth": 0}, {"key": "34527433", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16559311493447593, "ground_truth": 0}, {"key": "34527433", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12421300697672752, "ground_truth": 0}, {"key": "34527433", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13568954549070678, "ground_truth": 0}, {"key": "34527433", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1441488611013147, "ground_truth": 0}, {"key": "34527433", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07807816640948573, "ground_truth": 0}, {"key": "31111734", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5679366026613073, "ground_truth": 0}, {"key": "31111734", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23370634639540494, "ground_truth": 0}, {"key": "31111734", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4882833870876048, "ground_truth": 0}, {"key": "31111734", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311931011434, "ground_truth": 0}, {"key": "31111734", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197745215202, "ground_truth": 0}, {"key": "40303872", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3106943677387422, "ground_truth": 0}, {"key": "40303872", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6334102469668604, "ground_truth": 0}, {"key": "40303872", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3345894379546889, "ground_truth": 0}, {"key": "40303872", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269911328321, "ground_truth": 0}, {"key": "40303872", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.468790643416022, "ground_truth": 0}, {"key": "33653553", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26133092630490284, "ground_truth": 0}, {"key": "33653553", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3073580195415546, "ground_truth": 0}, {"key": "33653553", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22815649704777657, "ground_truth": 0}, {"key": "33653553", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804718121339414, "ground_truth": 0}, {"key": "33653553", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1871326759722064, "ground_truth": 0}, {"key": "34404510", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21733751481675034, "ground_truth": 0}, {"key": "34404510", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23792987830487417, "ground_truth": 0}, {"key": "34404510", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24944722121416382, "ground_truth": 0}, {"key": "34404510", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2568319902268182, "ground_truth": 0}, {"key": "34404510", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408822945711, "ground_truth": 0}, {"key": "35568692", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.04958902386634072, "ground_truth": 0}, {"key": "35568692", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733752374304982, "ground_truth": 0}, {"key": "35568692", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.04813677061469274, "ground_truth": 0}, {"key": "35568692", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436852286175894, "ground_truth": 0}, {"key": "35568692", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.039048292477698754, "ground_truth": 0}, {"key": "39151664", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262893549077, "ground_truth": 0}, {"key": "39151664", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27357439721709953, "ground_truth": 0}, {"key": "39151664", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22953520393932328, "ground_truth": 0}, {"key": "39151664", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3056973280998232, "ground_truth": 0}, {"key": "39151664", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782567931329105, "ground_truth": 0}, {"key": "37493670", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9353465114836882, "ground_truth": 0}, {"key": "37493670", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9843363508947832, "ground_truth": 0}, {"key": "37493670", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9118099557462092, "ground_truth": 0}, {"key": "37493670", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9690910397782401, "ground_truth": 0}, {"key": "37493670", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9353465098904199, "ground_truth": 0}, {"key": "21935983", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1356895431451961, "ground_truth": 0}, {"key": "21935983", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3539862860004262, "ground_truth": 0}, {"key": "21935983", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26740815991863914, "ground_truth": 0}, {"key": "21935983", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13206616097698515, "ground_truth": 0}, {"key": "21935983", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766829909636613, "ground_truth": 0}, {"key": "38174214", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2450849965376273, "ground_truth": 0}, {"key": "38174214", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24944723759984389, "ground_truth": 0}, {"key": "38174214", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2861692524627477, "ground_truth": 0}, {"key": "38174214", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678174470819, "ground_truth": 0}, {"key": "38174214", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0960254901281135, "ground_truth": 0}, {"key": "40319923", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6893056040605778, "ground_truth": 0}, {"key": "40319923", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6723317086399724, "ground_truth": 0}, {"key": "40319923", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6169358250042049, "ground_truth": 0}, {"key": "40319923", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995854958895, "ground_truth": 0}, {"key": "40319923", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512677159314, "ground_truth": 0}, {"key": "36478264", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37937836583186874, "ground_truth": 0}, {"key": "36478264", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31405054181371655, "ground_truth": 0}, {"key": "36478264", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44939264278294405, "ground_truth": 0}, {"key": "36478264", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609383242515986, "ground_truth": 0}, {"key": "36478264", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27982850706345247, "ground_truth": 0}, {"key": "11935769", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1710611800107306, "ground_truth": 0}, {"key": "11935769", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32939171037223347, "ground_truth": 0}, {"key": "11935769", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3557748710725876, "ground_truth": 0}, {"key": "11935769", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610490687436612, "ground_truth": 0}, {"key": "11935769", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815650007285798, "ground_truth": 0}, {"key": "33373410", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12252320365266238, "ground_truth": 0}, {"key": "33373410", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17781087007218171, "ground_truth": 0}, {"key": "33373410", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18476750567239822, "ground_truth": 0}, {"key": "33373410", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1561048990397476, "ground_truth": 0}, {"key": "33373410", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1422318878332404, "ground_truth": 0}, {"key": "11130680", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262790626681, "ground_truth": 0}, {"key": "11130680", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12852513089788803, "ground_truth": 0}, {"key": "11130680", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.050330631286545614, "ground_truth": 0}, {"key": "11130680", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17328820956539556, "ground_truth": 0}, {"key": "11130680", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702253608851294, "ground_truth": 0}, {"key": "34868650", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24798744174977413, "ground_truth": 0}, {"key": "34868650", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21206879590678476, "ground_truth": 0}, {"key": "34868650", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823341936608345, "ground_truth": 0}, {"key": "34868650", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135069014429135, "ground_truth": 0}, {"key": "34868650", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202455635965983, "ground_truth": 0}, {"key": "33960561", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4590761395084464, "ground_truth": 0}, {"key": "33960561", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4073333983471299, "ground_truth": 0}, {"key": "33960561", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22953521118325715, "ground_truth": 0}, {"key": "33960561", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751237627785, "ground_truth": 0}, {"key": "33960561", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307463207042983, "ground_truth": 0}, {"key": "22504858", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39047584297818694, "ground_truth": 0}, {"key": "22504858", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41869692988352947, "ground_truth": 0}, {"key": "22504858", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3191213885736736, "ground_truth": 0}, {"key": "22504858", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108765933851, "ground_truth": 0}, {"key": "22504858", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740029532347, "ground_truth": 0}, {"key": "32283530", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2674081762548611, "ground_truth": 0}, {"key": "32283530", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.0869416578266453, "ground_truth": 0}, {"key": "32283530", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4320634029165263, "ground_truth": 0}, {"key": "32283530", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921740456918124, "ground_truth": 0}, {"key": "32283530", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417117817171, "ground_truth": 0}, {"key": "38377099", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25982563677807174, "ground_truth": 0}, {"key": "38377099", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3867634494288735, "ground_truth": 0}, {"key": "38377099", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2861692497970383, "ground_truth": 0}, {"key": "38377099", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25534365713207985, "ground_truth": 0}, {"key": "38377099", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1561049010809345, "ground_truth": 0}, {"key": "36105123", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.507811884083631, "ground_truth": 0}, {"key": "36105123", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7025300496820556, "ground_truth": 0}, {"key": "36105123", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5698526533380058, "ground_truth": 0}, {"key": "36105123", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634047822796, "ground_truth": 0}, {"key": "36105123", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101679032779413, "ground_truth": 0}, {"key": "33527826", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33633106080615865, "ground_truth": 0}, {"key": "33527826", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21469143352179562, "ground_truth": 0}, {"key": "33527826", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23231015291731286, "ground_truth": 0}, {"key": "33527826", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116181837766, "ground_truth": 0}, {"key": "33527826", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091276879295477, "ground_truth": 0}, {"key": "32349891", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6334102703213782, "ground_truth": 0}, {"key": "32349891", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48828340969772804, "ground_truth": 0}, {"key": "32349891", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41111087678696356, "ground_truth": 0}, {"key": "32349891", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073333969981275, "ground_truth": 0}, {"key": "32349891", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804237606436, "ground_truth": 0}, {"key": "34281974", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37570646870151997, "ground_truth": 0}, {"key": "34281974", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3904758367690478, "ground_truth": 0}, {"key": "34281974", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5097643945820416, "ground_truth": 0}, {"key": "34281974", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268348885448336, "ground_truth": 0}, {"key": "34281974", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474602633397035, "ground_truth": 0}, {"key": "29387866", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.54673815604561, "ground_truth": 0}, {"key": "29387866", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817893364422466, "ground_truth": 0}, {"key": "29387866", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.586996418422808, "ground_truth": 0}, {"key": "29387866", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047583261615637, "ground_truth": 0}, {"key": "29387866", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796510564194, "ground_truth": 0}, {"key": "35731925", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9473810458329022, "ground_truth": 0}, {"key": "35731925", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9294404029696643, "ground_truth": 0}, {"key": "35731925", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9046505397568212, "ground_truth": 0}, {"key": "35731925", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9462003549460828, "ground_truth": 0}, {"key": "35731925", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274089965171, "ground_truth": 0}, {"key": "38829733", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5640984817032335, "ground_truth": 0}, {"key": "38829733", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3720487673177516, "ground_truth": 0}, {"key": "38829733", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238841021983, "ground_truth": 0}, {"key": "38829733", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882834002643174, "ground_truth": 0}, {"key": "38829733", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544871549099853, "ground_truth": 0}, {"key": "24624736", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6513548691663079, "ground_truth": 0}, {"key": "24624736", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6206216523087719, "ground_truth": 0}, {"key": "24624736", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6261241599806195, "ground_truth": 0}, {"key": "24624736", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687307259600686, "ground_truth": 0}, {"key": "24624736", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218818054288777, "ground_truth": 0}, {"key": "36928562", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7994423204169115, "ground_truth": 0}, {"key": "36928562", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7154239871225923, "ground_truth": 0}, {"key": "36928562", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7648916048729113, "ground_truth": 0}, {"key": "36928562", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195255475802, "ground_truth": 0}, {"key": "36928562", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512095455606, "ground_truth": 0}, {"key": "34941119", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667160561372777, "ground_truth": 0}, {"key": "34941119", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832397609283671, "ground_truth": 0}, {"key": "34941119", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43398145173473984, "ground_truth": 0}, {"key": "34941119", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19682620110594104, "ground_truth": 0}, {"key": "34941119", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.282988089575483, "ground_truth": 0}, {"key": "30206231", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486735122994648, "ground_truth": 0}, {"key": "30206231", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4882834046848125, "ground_truth": 0}, {"key": "30206231", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4863315273884631, "ground_truth": 0}, {"key": "30206231", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792245317068, "ground_truth": 0}, {"key": "30206231", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880151511046, "ground_truth": 0}, {"key": "35584972", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4111108631611601, "ground_truth": 0}, {"key": "35584972", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31742629065256067, "ground_truth": 0}, {"key": "35584972", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37754067050751805, "ground_truth": 0}, {"key": "35584972", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091974462570222, "ground_truth": 0}, {"key": "35584972", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641254842696, "ground_truth": 0}, {"key": "39277709", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6671476819436035, "ground_truth": 0}, {"key": "39277709", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6531269310166231, "ground_truth": 0}, {"key": "39277709", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5621764971054855, "ground_truth": 0}, {"key": "39277709", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263216031740431, "ground_truth": 0}, {"key": "39277709", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234859894671, "ground_truth": 0}, {"key": "36123657", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6150878671837676, "ground_truth": 0}, {"key": "36123657", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49804687711421214, "ground_truth": 0}, {"key": "36123657", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3007455767413869, "ground_truth": 0}, {"key": "36123657", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016878022380628, "ground_truth": 0}, {"key": "36123657", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632636637444, "ground_truth": 0}, {"key": "33363938", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44939262231576516, "ground_truth": 0}, {"key": "33363938", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.05707140112327922, "ground_truth": 0}, {"key": "33363938", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47463116876929995, "ground_truth": 0}, {"key": "33363938", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9485372359657568, "ground_truth": 0}, {"key": "33363938", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783849419006, "ground_truth": 0}, {"key": "37349129", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12085323974005037, "ground_truth": 0}, {"key": "37349129", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18242552283342334, "ground_truth": 0}, {"key": "37349129", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3486451282600048, "ground_truth": 0}, {"key": "37349129", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559312200380713, "ground_truth": 0}, {"key": "37349129", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07640767806915248, "ground_truth": 0}, {"key": "37160199", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344542769847686, "ground_truth": 0}, {"key": "37160199", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2766905368173812, "ground_truth": 0}, {"key": "37160199", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2068940582933063, "ground_truth": 0}, {"key": "37160199", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140559707361423, "ground_truth": 0}, {"key": "37160199", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434190643163808, "ground_truth": 0}, {"key": "35891053", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891502677311, "ground_truth": 0}, {"key": "35891053", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7813306180758506, "ground_truth": 0}, {"key": "35891053", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5813031094187411, "ground_truth": 0}, {"key": "35891053", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316976759336, "ground_truth": 0}, {"key": "35891053", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618950679033, "ground_truth": 0}, {"key": "40694542", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6636689482168396, "ground_truth": 0}, {"key": "40694542", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49414089219150836, "ground_truth": 0}, {"key": "40694542", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6224593349115263, "ground_truth": 0}, {"key": "40694542", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.583203324305985, "ground_truth": 0}, {"key": "40694542", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "24645770", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2974699457943166, "ground_truth": 0}, {"key": "24645770", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25091278443053483, "ground_truth": 0}, {"key": "24645770", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5136684653160312, "ground_truth": 0}, {"key": "24645770", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641467000804, "ground_truth": 0}, {"key": "24645770", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629918828943, "ground_truth": 0}, {"key": "37974587", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5234203669558807, "ground_truth": 0}, {"key": "37974587", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6261241743722475, "ground_truth": 0}, {"key": "37974587", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5195213167028743, "ground_truth": 0}, {"key": "37974587", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802622491924, "ground_truth": 0}, {"key": "37974587", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476929582513, "ground_truth": 0}, {"key": "40354149", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4186969044575723, "ground_truth": 0}, {"key": "40354149", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39420092069270835, "ground_truth": 0}, {"key": "40354149", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6460137060782516, "ground_truth": 0}, {"key": "40354149", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880310504558, "ground_truth": 0}, {"key": "40354149", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397027257076, "ground_truth": 0}, {"key": "35519470", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.06418263714847225, "ground_truth": 0}, {"key": "35519470", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16667540300995748, "ground_truth": 0}, {"key": "35519470", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12336561809159487, "ground_truth": 0}, {"key": "35519470", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660840435142277, "ground_truth": 0}, {"key": "35519470", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09203285937882115, "ground_truth": 0}, {"key": "36185624", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48047865797060785, "ground_truth": 0}, {"key": "36185624", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5544705028014587, "ground_truth": 0}, {"key": "36185624", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6688802551936873, "ground_truth": 0}, {"key": "36185624", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.492188134447561, "ground_truth": 0}, {"key": "36185624", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358293722318, "ground_truth": 0}, {"key": "39306113", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2213506811012255, "ground_truth": 0}, {"key": "39306113", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18126321003698848, "ground_truth": 0}, {"key": "39306113", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1645164558079635, "ground_truth": 0}, {"key": "39306113", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.05665242259281477, "ground_truth": 0}, {"key": "39306113", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07585817937292823, "ground_truth": 0}, {"key": "19347718", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25386099460146366, "ground_truth": 0}, {"key": "19347718", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2523840374894608, "ground_truth": 0}, {"key": "19347718", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18832398379177037, "ground_truth": 0}, {"key": "19347718", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31236998557339535, "ground_truth": 0}, {"key": "19347718", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.262841829688492, "ground_truth": 0}, {"key": "21870064", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16451645819692715, "ground_truth": 0}, {"key": "21870064", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10374862865715721, "ground_truth": 0}, {"key": "21870064", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07263670486678214, "ground_truth": 0}, {"key": "21870064", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203285997654329, "ground_truth": 0}, {"key": "21870064", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0474258715999006, "ground_truth": 0}, {"key": "37675776", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6842640174535863, "ground_truth": 0}, {"key": "37675776", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5428632679916336, "ground_truth": 0}, {"key": "37675776", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7201715100443103, "ground_truth": 0}, {"key": "37675776", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936480495395, "ground_truth": 0}, {"key": "37675776", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791984791578, "ground_truth": 0}, {"key": "38107017", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20307462823685718, "ground_truth": 0}, {"key": "38107017", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.276690525546367, "ground_truth": 0}, {"key": "38107017", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952109031013967, "ground_truth": 0}, {"key": "38107017", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337717136710954, "ground_truth": 0}, {"key": "38107017", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2379298854904154, "ground_truth": 0}, {"key": "40046472", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5350984561810269, "ground_truth": 0}, {"key": "40046472", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7170118762361228, "ground_truth": 0}, {"key": "40046472", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2942149745470466, "ground_truth": 0}, {"key": "40046472", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548558792674, "ground_truth": 0}, {"key": "40046472", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984159323433, "ground_truth": 0}, {"key": "32157820", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4532618448419079, "ground_truth": 0}, {"key": "32157820", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5945512539397592, "ground_truth": 0}, {"key": "32157820", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47852881558245924, "ground_truth": 0}, {"key": "32157820", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704811851761, "ground_truth": 0}, {"key": "32157820", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878367265946, "ground_truth": 0}, {"key": "41004037", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22541661172318547, "ground_truth": 0}, {"key": "41004037", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2133771610005665, "ground_truth": 0}, {"key": "41004037", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2509127907742806, "ground_truth": 0}, {"key": "41004037", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1460872545078859, "ground_truth": 0}, {"key": "41004037", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304215758582587, "ground_truth": 0}, {"key": "21387993", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3451052806146676, "ground_truth": 0}, {"key": "21387993", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44360040310029586, "ground_truth": 0}, {"key": "21387993", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3259495165452839, "ground_truth": 0}, {"key": "21387993", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237199000929, "ground_truth": 0}, {"key": "21387993", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199379103287, "ground_truth": 0}, {"key": "34665539", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758356410865, "ground_truth": 0}, {"key": "34665539", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29910519156224796, "ground_truth": 0}, {"key": "34665539", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38491214857315764, "ground_truth": 0}, {"key": "34665539", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030614083872, "ground_truth": 0}, {"key": "34665539", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675123943979, "ground_truth": 0}, {"key": "37872111", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3539862914614632, "ground_truth": 0}, {"key": "37872111", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42632158321204106, "ground_truth": 0}, {"key": "37872111", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688235284468, "ground_truth": 0}, {"key": "37872111", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033625606142702, "ground_truth": 0}, {"key": "37872111", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366062081321, "ground_truth": 0}, {"key": "36629542", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3259494985068336, "ground_truth": 0}, {"key": "36629542", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4474602947355337, "ground_truth": 0}, {"key": "36629542", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2030746254517329, "ground_truth": 0}, {"key": "36629542", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.401687805934342, "ground_truth": 0}, {"key": "36629542", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946968413470302, "ground_truth": 0}, {"key": "36487527", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48438005627543373, "ground_truth": 0}, {"key": "36487527", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6261241654166712, "ground_truth": 0}, {"key": "36487527", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6909762929110752, "ground_truth": 0}, {"key": "36487527", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186969079115065, "ground_truth": 0}, {"key": "36487527", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902371652297056, "ground_truth": 0}, {"key": "37344756", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6370307645818216, "ground_truth": 0}, {"key": "37344756", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813031095689107, "ground_truth": 0}, {"key": "37344756", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "37344756", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298813083313484, "ground_truth": 0}, {"key": "37344756", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224293077802, "ground_truth": 0}, {"key": "38707722", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2877678185531476, "ground_truth": 0}, {"key": "38707722", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541661146811778, "ground_truth": 0}, {"key": "38707722", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27048021666115973, "ground_truth": 0}, {"key": "38707722", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938443963577, "ground_truth": 0}, {"key": "38707722", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973277489496, "ground_truth": 0}, {"key": "37093419", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10158945106513752, "ground_truth": 0}, {"key": "37093419", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14128142336541202, "ground_truth": 0}, {"key": "37093419", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15817434392817195, "ground_truth": 0}, {"key": "37093419", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08570928126007368, "ground_truth": 0}, {"key": "37093419", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880724512464, "ground_truth": 0}, {"key": "35547391", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3738758175865319, "ground_truth": 0}, {"key": "35547391", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3451052629104072, "ground_truth": 0}, {"key": "35547391", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11516223675857962, "ground_truth": 0}, {"key": "35547391", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902372028839725, "ground_truth": 0}, {"key": "35547391", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3242353938848665, "ground_truth": 0}, {"key": "37173168", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48242908629236364, "ground_truth": 0}, {"key": "37173168", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4416729837902862, "ground_truth": 0}, {"key": "37173168", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6370307714983986, "ground_truth": 0}, {"key": "37173168", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073648067046, "ground_truth": 0}, {"key": "37173168", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866937526066937, "ground_truth": 0}, {"key": "30725298", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24364243803386715, "ground_truth": 0}, {"key": "30725298", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4726834730663998, "ground_truth": 0}, {"key": "30725298", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31069438495881385, "ground_truth": 0}, {"key": "30725298", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633932625295, "ground_truth": 0}, {"key": "30725298", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017742699337, "ground_truth": 0}, {"key": "33830573", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5312093558651806, "ground_truth": 0}, {"key": "33830573", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.602061566558516, "ground_truth": 0}, {"key": "33830573", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5869964300462828, "ground_truth": 0}, {"key": "33830573", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.596433159808695, "ground_truth": 0}, {"key": "33830573", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.633410284698893, "ground_truth": 0}, {"key": "33415474", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12678517544351223, "ground_truth": 0}, {"key": "33415474", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1023047012265008, "ground_truth": 0}, {"key": "33415474", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07423137282298553, "ground_truth": 0}, {"key": "33415474", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10017222929350947, "ground_truth": 0}, {"key": "33415474", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.05665242298198525, "ground_truth": 0}, {"key": "37383994", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5253688115077536, "ground_truth": 0}, {"key": "37383994", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5660185348105367, "ground_truth": 0}, {"key": "37383994", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6477982160340954, "ground_truth": 0}, {"key": "37383994", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943506468114, "ground_truth": 0}, {"key": "37383994", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792121673303, "ground_truth": 0}, {"key": "38576819", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8670357561342572, "ground_truth": 0}, {"key": "38576819", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8807970801900159, "ground_truth": 0}, {"key": "38576819", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7122321810157073, "ground_truth": 0}, {"key": "38576819", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.915507242509579, "ground_truth": 0}, {"key": "38576819", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281485144007, "ground_truth": 0}, {"key": "34500226", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2227001128829503, "ground_truth": 0}, {"key": "34500226", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40922076668133683, "ground_truth": 0}, {"key": "34500226", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2814056086311059, "ground_truth": 0}, {"key": "34500226", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052854687725, "ground_truth": 0}, {"key": "34500226", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204879742484787, "ground_truth": 0}, {"key": "39856394", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35398628072354665, "ground_truth": 0}, {"key": "39856394", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771340967307, "ground_truth": 0}, {"key": "39856394", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49414089048174664, "ground_truth": 0}, {"key": "39856394", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24220562640984247, "ground_truth": 0}, {"key": "39856394", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245614528547, "ground_truth": 0}, {"key": "35499522", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12765262475752687, "ground_truth": 0}, {"key": "35499522", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21469141931919025, "ground_truth": 0}, {"key": "35499522", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07477005158834307, "ground_truth": 0}, {"key": "35499522", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0651275456908171, "ground_truth": 0}, {"key": "35499522", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0869416587465792, "ground_truth": 0}, {"key": "30157766", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5312093709269845, "ground_truth": 0}, {"key": "30157766", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4804786858717054, "ground_truth": 0}, {"key": "30157766", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4397472968015327, "ground_truth": 0}, {"key": "30157766", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583212738619, "ground_truth": 0}, {"key": "30157766", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238782760121, "ground_truth": 0}, {"key": "40472346", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.42823339395140786, "ground_truth": 0}, {"key": "40472346", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4225046549712001, "ground_truth": 0}, {"key": "40472346", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.366589741568762, "ground_truth": 0}, {"key": "40472346", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436780769819897, "ground_truth": 0}, {"key": "40472346", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907612212520094, "ground_truth": 0}, {"key": "35305635", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5389832104853661, "ground_truth": 0}, {"key": "35305635", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6001883368094793, "ground_truth": 0}, {"key": "35305635", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736783973309256, "ground_truth": 0}, {"key": "35305635", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634645318816, "ground_truth": 0}, {"key": "35305635", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548641363145, "ground_truth": 0}, {"key": "32495926", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25238404239250317, "ground_truth": 0}, {"key": "32495926", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21206880481255755, "ground_truth": 0}, {"key": "32495926", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23231012456396796, "ground_truth": 0}, {"key": "32495926", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14414886058171208, "ground_truth": 0}, {"key": "32495926", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055768707881969, "ground_truth": 0}, {"key": "37353801", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1847675126427606, "ground_truth": 0}, {"key": "37353801", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13117323140610404, "ground_truth": 0}, {"key": "37353801", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3208213276345869, "ground_truth": 0}, {"key": "37353801", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765262207901765, "ground_truth": 0}, {"key": "37353801", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.08882028610394256, "ground_truth": 0}, {"key": "30159904", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6224593169669397, "ground_truth": 0}, {"key": "30159904", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49609382127793294, "ground_truth": 0}, {"key": "30159904", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5525397228349419, "ground_truth": 0}, {"key": "30159904", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512706117025, "ground_truth": 0}, {"key": "30159904", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582588007001, "ground_truth": 0}, {"key": "33698679", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4339814443785183, "ground_truth": 0}, {"key": "33698679", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31573598704383876, "ground_truth": 0}, {"key": "33698679", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15817436143150335, "ground_truth": 0}, {"key": "33698679", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314737967535575, "ground_truth": 0}, {"key": "33698679", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434190228543153, "ground_truth": 0}, {"key": "40530172", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6001883400874903, "ground_truth": 0}, {"key": "40530172", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3345894502575783, "ground_truth": 0}, {"key": "40530172", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6976088925185043, "ground_truth": 0}, {"key": "40530172", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156198821366909, "ground_truth": 0}, {"key": "40530172", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.484380119593709, "ground_truth": 0}, {"key": "40652941", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6279512047500049, "ground_truth": 0}, {"key": "40652941", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.618780451938225, "ground_truth": 0}, {"key": "40652941", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7969253675552229, "ground_truth": 0}, {"key": "40652941", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819826924547, "ground_truth": 0}, {"key": "40652941", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468615148804, "ground_truth": 0}, {"key": "40122246", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3398276375758158, "ground_truth": 0}, {"key": "40122246", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5409238756092853, "ground_truth": 0}, {"key": "40122246", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32423540467190654, "ground_truth": 0}, {"key": "40122246", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09334687656299834, "ground_truth": 0}, {"key": "40122246", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406617046849, "ground_truth": 0}, {"key": "40032656", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43206338912011044, "ground_truth": 0}, {"key": "40032656", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6132365355298967, "ground_truth": 0}, {"key": "40032656", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6150878566729954, "ground_truth": 0}, {"key": "40032656", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629585946112257, "ground_truth": 0}, {"key": "40032656", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49609385197608485, "ground_truth": 0}, {"key": "38913680", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09670578765090622, "ground_truth": 0}, {"key": "38913680", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17895589000958595, "ground_truth": 0}, {"key": "38913680", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18832397606294593, "ground_truth": 0}, {"key": "38913680", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744028038408, "ground_truth": 0}, {"key": "38913680", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239107016396993, "ground_truth": 0}, {"key": "17608039", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07423137286846812, "ground_truth": 0}, {"key": "17608039", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6095241581727542, "ground_truth": 0}, {"key": "17608039", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14608723917662964, "ground_truth": 0}, {"key": "17608039", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608725005791703, "ground_truth": 0}, {"key": "17608039", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509844205991, "ground_truth": 0}, {"key": "40434901", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41111083786852365, "ground_truth": 0}, {"key": "40434901", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38121956453852474, "ground_truth": 0}, {"key": "40434901", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5755880196062995, "ground_truth": 0}, {"key": "40434901", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370414136370544, "ground_truth": 0}, {"key": "40434901", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936414402063643, "ground_truth": 0}, {"key": "37680058", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10447731826033858, "ground_truth": 0}, {"key": "37680058", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.045015535330681124, "ground_truth": 0}, {"key": "37680058", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.04995851975099821, "ground_truth": 0}, {"key": "37680058", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0411528867474818, "ground_truth": 0}, {"key": "37680058", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07004895786037553, "ground_truth": 0}, {"key": "37291821", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5544704545128059, "ground_truth": 0}, {"key": "37291821", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5136684351985645, "ground_truth": 0}, {"key": "37291821", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47073661574147996, "ground_truth": 0}, {"key": "37291821", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166103364905, "ground_truth": 0}, {"key": "37291821", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894390608359, "ground_truth": 0}, {"key": "41002743", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3886180221753902, "ground_truth": 0}, {"key": "41002743", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6406358602795568, "ground_truth": 0}, {"key": "41002743", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3468730840808441, "ground_truth": 0}, {"key": "41002743", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995963422218, "ground_truth": 0}, {"key": "41002743", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413807295845, "ground_truth": 0}, {"key": "36322869", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4092207979884161, "ground_truth": 0}, {"key": "36322869", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3539862771216909, "ground_truth": 0}, {"key": "36322869", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5370413624383777, "ground_truth": 0}, {"key": "36322869", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048022169069197, "ground_truth": 0}, {"key": "36322869", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814077402573, "ground_truth": 0}, {"key": "39459717", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3225259888708438, "ground_truth": 0}, {"key": "39459717", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3684056860177914, "ground_truth": 0}, {"key": "39459717", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4902356598828998, "ground_truth": 0}, {"key": "39459717", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256365171278, "ground_truth": 0}, {"key": "39459717", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051779947678, "ground_truth": 0}, {"key": "36503727", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2643583697736953, "ground_truth": 0}, {"key": "36503727", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.284576016969751, "ground_truth": 0}, {"key": "36503727", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.255343646427687, "ground_truth": 0}, {"key": "36503727", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1030244259791066, "ground_truth": 0}, {"key": "36503727", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771436691583, "ground_truth": 0}, {"key": "35682367", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4513265165433538, "ground_truth": 0}, {"key": "35682367", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061652164216, "ground_truth": 0}, {"key": "35682367", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20434188734289324, "ground_truth": 0}, {"key": "35682367", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771022293958, "ground_truth": 0}, {"key": "35682367", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.357567509991665, "ground_truth": 0}, {"key": "36472353", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4474603104756806, "ground_truth": 0}, {"key": "36472353", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5350984388786609, "ground_truth": 0}, {"key": "36472353", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20689403268621592, "ground_truth": 0}, {"key": "36472353", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026603375093237, "ground_truth": 0}, {"key": "36472353", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682620855522964, "ground_truth": 0}, {"key": "37651907", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21206881029566543, "ground_truth": 0}, {"key": "37651907", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28937169936762636, "ground_truth": 0}, {"key": "37651907", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15304215118403375, "ground_truth": 0}, {"key": "37651907", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.224055462251498, "ground_truth": 0}, {"key": "37651907", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06465348960469759, "ground_truth": 0}, {"key": "36255476", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17895589935682515, "ground_truth": 0}, {"key": "36255476", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2751297298662333, "ground_truth": 0}, {"key": "36255476", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1550784717866452, "ground_truth": 0}, {"key": "36255476", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469141620210777, "ground_truth": 0}, {"key": "36255476", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3106943717992146, "ground_truth": 0}, {"key": "37283518", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6566582587987373, "ground_truth": 0}, {"key": "37283518", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6548947375804962, "ground_truth": 0}, {"key": "37283518", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6976089134370166, "ground_truth": 0}, {"key": "37283518", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318492575839, "ground_truth": 0}, {"key": "37283518", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800633612615, "ground_truth": 0}, {"key": "34906785", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39233681292477907, "ground_truth": 0}, {"key": "34906785", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735744027296973, "ground_truth": 0}, {"key": "34906785", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936415722551523, "ground_truth": 0}, {"key": "34906785", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213248742508, "ground_truth": 0}, {"key": "34906785", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766830542467873, "ground_truth": 0}, {"key": "34965328", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6039318275671202, "ground_truth": 0}, {"key": "34965328", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381380311221, "ground_truth": 0}, {"key": "34965328", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32766830877165903, "ground_truth": 0}, {"key": "34965328", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269912779758, "ground_truth": 0}, {"key": "34965328", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320634035806301, "ground_truth": 0}, {"key": "38788440", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.05541279152062894, "ground_truth": 0}, {"key": "38788440", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06465349086957732, "ground_truth": 0}, {"key": "38788440", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1320661505135005, "ground_truth": 0}, {"key": "38788440", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347553689194, "ground_truth": 0}, {"key": "38788440", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.052618955885435914, "ground_truth": 0}, {"key": "35046866", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40733342403257683, "ground_truth": 0}, {"key": "35046866", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5544704476111082, "ground_truth": 0}, {"key": "35046866", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5964331542931298, "ground_truth": 0}, {"key": "35046866", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891488490083, "ground_truth": 0}, {"key": "35046866", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615854498997, "ground_truth": 0}, {"key": "37629558", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24798743094374448, "ground_truth": 0}, {"key": "37629558", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22135069177774133, "ground_truth": 0}, {"key": "37629558", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24653332668303887, "ground_truth": 0}, {"key": "37629558", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12421302671351947, "ground_truth": 0}, {"key": "37629558", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06560483701681037, "ground_truth": 0}, {"key": "33859914", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27982846980804843, "ground_truth": 0}, {"key": "33859914", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3775406554701468, "ground_truth": 0}, {"key": "33859914", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46295861700639845, "ground_truth": 0}, {"key": "33859914", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051811451008, "ground_truth": 0}, {"key": "33859914", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149905512824, "ground_truth": 0}, {"key": "39790523", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27202454633574585, "ground_truth": 0}, {"key": "39790523", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531170583635, "ground_truth": 0}, {"key": "39790523", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16885693671306445, "ground_truth": 0}, {"key": "39790523", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398144576088, "ground_truth": 0}, {"key": "39790523", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435835341430364, "ground_truth": 0}, {"key": "33509656", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23370635784072594, "ground_truth": 0}, {"key": "33509656", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4073333843088584, "ground_truth": 0}, {"key": "33509656", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14128142587035245, "ground_truth": 0}, {"key": "33509656", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1183850947545611, "ground_truth": 0}, {"key": "33509656", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368336769663, "ground_truth": 0}, {"key": "17380923", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4571367378133361, "ground_truth": 0}, {"key": "17380923", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6020615715664287, "ground_truth": 0}, {"key": "17380923", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45519862521882803, "ground_truth": 0}, {"key": "17380923", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.414898833376369, "ground_truth": 0}, {"key": "17380923", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061761180248, "ground_truth": 0}, {"key": "36202526", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20181322052025755, "ground_truth": 0}, {"key": "36202526", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32252596791090443, "ground_truth": 0}, {"key": "36202526", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14511535943571993, "ground_truth": 0}, {"key": "36202526", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197489025313, "ground_truth": 0}, {"key": "36202526", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692549734744, "ground_truth": 0}, {"key": "26419232", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4843801027768001, "ground_truth": 0}, {"key": "26419232", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5506073818160924, "ground_truth": 0}, {"key": "26419232", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47463114036876414, "ground_truth": 0}, {"key": "26419232", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.472683455909796, "ground_truth": 0}, {"key": "26419232", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616924019816475, "ground_truth": 0}, {"key": "34232398", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36296920359573415, "ground_truth": 0}, {"key": "34232398", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34158248465919666, "ground_truth": 0}, {"key": "34232398", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3793784147269618, "ground_truth": 0}, {"key": "34232398", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735234358936, "ground_truth": 0}, {"key": "34232398", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073659755508934, "ground_truth": 0}, {"key": "33586045", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893237623197, "ground_truth": 0}, {"key": "33586045", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6442251298590435, "ground_truth": 0}, {"key": "33586045", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20307462575305027, "ground_truth": 0}, {"key": "33586045", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832398938230197, "ground_truth": 0}, {"key": "33586045", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304214806744992, "ground_truth": 0}, {"key": "32281151", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2120688324025578, "ground_truth": 0}, {"key": "32281151", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14706453205476197, "ground_truth": 0}, {"key": "32281151", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132023409740442, "ground_truth": 0}, {"key": "32281151", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553808134477147, "ground_truth": 0}, {"key": "32281151", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944725120095879, "ground_truth": 0}, {"key": "37308159", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.459076152318793, "ground_truth": 0}, {"key": "37308159", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.690976298922355, "ground_truth": 0}, {"key": "37308159", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39981166362994597, "ground_truth": 0}, {"key": "37308159", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939171904881054, "ground_truth": 0}, {"key": "37308159", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834068659988, "ground_truth": 0}, {"key": "35694408", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4092207822972318, "ground_truth": 0}, {"key": "35694408", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7813306251531821, "ground_truth": 0}, {"key": "35694408", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41111087607942287, "ground_truth": 0}, {"key": "35694408", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730124585966, "ground_truth": 0}, {"key": "35694408", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864513179362716, "ground_truth": 0}, {"key": "39781995", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5195213293697561, "ground_truth": 0}, {"key": "39781995", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35936413931408523, "ground_truth": 0}, {"key": "39781995", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5525397143083217, "ground_truth": 0}, {"key": "39781995", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317029149167, "ground_truth": 0}, {"key": "39781995", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387581011086235, "ground_truth": 0}, {"key": "22799372", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8344068908337436, "ground_truth": 0}, {"key": "22799372", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.796925364849801, "ground_truth": 0}, {"key": "22799372", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8344068824863876, "ground_truth": 0}, {"key": "22799372", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307780109194, "ground_truth": 0}, {"key": "22799372", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976088849712483, "ground_truth": 0}, {"key": "37428240", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2598256234637954, "ground_truth": 0}, {"key": "37428240", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735743998375459, "ground_truth": 0}, {"key": "37428240", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15610490024317777, "ground_truth": 0}, {"key": "37428240", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487890543238, "ground_truth": 0}, {"key": "37428240", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441028006452067, "ground_truth": 0}, {"key": "40612657", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7732163718989999, "ground_truth": 0}, {"key": "40612657", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6531269100500579, "ground_truth": 0}, {"key": "40612657", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42441198193089635, "ground_truth": 0}, {"key": "40612657", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786153419812, "ground_truth": 0}, {"key": "40612657", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358461020867, "ground_truth": 0}, {"key": "34404662", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2450850160189696, "ground_truth": 0}, {"key": "34404662", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15405755121251083, "ground_truth": 0}, {"key": "34404662", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.65489472287662, "ground_truth": 0}, {"key": "34404662", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357436737426444, "ground_truth": 0}, {"key": "34404662", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758441029104, "ground_truth": 0}, {"key": "32619704", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34687309193110144, "ground_truth": 0}, {"key": "32619704", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21469141970466693, "ground_truth": 0}, {"key": "32619704", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3040416695854861, "ground_truth": 0}, {"key": "32619704", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252598846289154, "ground_truth": 0}, {"key": "32619704", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244120103165334, "ground_truth": 0}, {"key": "39014883", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3225259897554114, "ground_truth": 0}, {"key": "39014883", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.379378384848875, "ground_truth": 0}, {"key": "39014883", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29421495638765055, "ground_truth": 0}, {"key": "39014883", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474602971863884, "ground_truth": 0}, {"key": "39014883", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245710868454, "ground_truth": 0}, {"key": "37982812", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1571368601342807, "ground_truth": 0}, {"key": "37982812", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.372048792055172, "ground_truth": 0}, {"key": "37982812", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4551986075244629, "ground_truth": 0}, {"key": "37982812", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647222145325, "ground_truth": 0}, {"key": "37982812", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601153195847297, "ground_truth": 0}, {"key": "28123476", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3849121313393509, "ground_truth": 0}, {"key": "28123476", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24798739915552076, "ground_truth": 0}, {"key": "28123476", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40733339612271025, "ground_truth": 0}, {"key": "28123476", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676345315937377, "ground_truth": 0}, {"key": "28123476", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185402906961, "ground_truth": 0}, {"key": "39078849", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26740815769488396, "ground_truth": 0}, {"key": "39078849", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.161320235446756, "ground_truth": 0}, {"key": "39078849", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2337063656086745, "ground_truth": 0}, {"key": "39078849", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441027417783384, "ground_truth": 0}, {"key": "39078849", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16559310931772575, "ground_truth": 0}, {"key": "39414137", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.838679765280739, "ground_truth": 0}, {"key": "39414137", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7201715076976084, "ground_truth": 0}, {"key": "39414137", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8714748693168091, "ground_truth": 0}, {"key": "39414137", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545658175813, "ground_truth": 0}, {"key": "39414137", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253758029555, "ground_truth": 0}, {"key": "37371354", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33807712587946714, "ground_truth": 0}, {"key": "37371354", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3398276307420717, "ground_truth": 0}, {"key": "37371354", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3539863100149942, "ground_truth": 0}, {"key": "37371354", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357438354238384, "ground_truth": 0}, {"key": "37371354", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069426974704, "ground_truth": 0}, {"key": "29497179", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37387579642388236, "ground_truth": 0}, {"key": "29497179", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34864514377689687, "ground_truth": 0}, {"key": "29497179", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2479874220735799, "ground_truth": 0}, {"key": "29497179", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061425214659, "ground_truth": 0}, {"key": "29497179", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360040687155033, "ground_truth": 0}, {"key": "35908694", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6774740026647389, "ground_truth": 0}, {"key": "35908694", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6584174884994191, "ground_truth": 0}, {"key": "35908694", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5907792083359775, "ground_truth": 0}, {"key": "35908694", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300355977773784, "ground_truth": 0}, {"key": "35908694", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938378009148, "ground_truth": 0}, {"key": "37619358", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13386748458745287, "ground_truth": 0}, {"key": "37619358", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3225260019221684, "ground_truth": 0}, {"key": "37619358", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24798743413128102, "ground_truth": 0}, {"key": "37619358", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781087772095402, "ground_truth": 0}, {"key": "37619358", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.310694397793259, "ground_truth": 0}, {"key": "37293103", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5506073921671625, "ground_truth": 0}, {"key": "37293103", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5234203661791726, "ground_truth": 0}, {"key": "37293103", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7534666608012173, "ground_truth": 0}, {"key": "37293103", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786913434552, "ground_truth": 0}, {"key": "37293103", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159409135144, "ground_truth": 0}, {"key": "36883729", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1613202323691018, "ground_truth": 0}, {"key": "36883729", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10894505118995204, "ground_truth": 0}, {"key": "36883729", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21076630437185953, "ground_truth": 0}, {"key": "36883729", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608725649125362, "ground_truth": 0}, {"key": "36883729", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14903530270330573, "ground_truth": 0}, {"key": "39209521", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4707366224223106, "ground_truth": 0}, {"key": "39209521", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3023910703664466, "ground_truth": 0}, {"key": "39209521", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42059957814168086, "ground_truth": 0}, {"key": "39209521", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199241297942, "ground_truth": 0}, {"key": "39209521", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206340932875853, "ground_truth": 0}, {"key": "27792571", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43974734113697983, "ground_truth": 0}, {"key": "27792571", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4687906248839432, "ground_truth": 0}, {"key": "27792571", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2974699333159606, "ground_truth": 0}, {"key": "27792571", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746029701333573, "ground_truth": 0}, {"key": "27792571", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451327597224, "ground_truth": 0}, {"key": "39755647", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5832033450876802, "ground_truth": 0}, {"key": "39755647", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "39755647", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48047866876595774, "ground_truth": 0}, {"key": "39755647", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061911324251, "ground_truth": 0}, {"key": "39755647", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.74167399763393, "ground_truth": 0}, {"key": "40800537", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.04115288352688261, "ground_truth": 0}, {"key": "40800537", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1422318865348577, "ground_truth": 0}, {"key": "40800537", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11516223234781041, "ground_truth": 0}, {"key": "40800537", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807816200201469, "ground_truth": 0}, {"key": "40800537", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06187598763927282, "ground_truth": 0}, {"key": "14171461", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23091975906321124, "ground_truth": 0}, {"key": "14171461", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2379299031239573, "ground_truth": 0}, {"key": "14171461", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1550784646756935, "ground_truth": 0}, {"key": "14171461", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245688881602, "ground_truth": 0}, {"key": "14171461", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14903529379486205, "ground_truth": 0}, {"key": "36892440", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2689414384997494, "ground_truth": 0}, {"key": "36892440", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5736784064312432, "ground_truth": 0}, {"key": "36892440", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1895210903347415, "ground_truth": 0}, {"key": "36892440", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878653805849, "ground_truth": 0}, {"key": "36892440", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666161490528, "ground_truth": 0}, {"key": "33733410", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5698526458112986, "ground_truth": 0}, {"key": "33733410", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953520587222045, "ground_truth": 0}, {"key": "33733410", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41300359175809, "ground_truth": 0}, {"key": "33733410", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259530459562166, "ground_truth": 0}, {"key": "33733410", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804688035172084, "ground_truth": 0}, {"key": "38587765", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.05921025263247533, "ground_truth": 0}, {"key": "38587765", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06142403853220241, "ground_truth": 0}, {"key": "38587765", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940272768978744, "ground_truth": 0}, {"key": "38587765", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369627368081454, "ground_truth": 0}, {"key": "38587765", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.03676946402657216, "ground_truth": 0}, {"key": "41065582", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3998116681027844, "ground_truth": 0}, {"key": "41065582", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2227001504597503, "ground_truth": 0}, {"key": "41065582", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24798744245789942, "ground_truth": 0}, {"key": "41065582", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2436424396421402, "ground_truth": 0}, {"key": "41065582", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20181321996303847, "ground_truth": 0}, {"key": "34713891", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.047780068582386, "ground_truth": 0}, {"key": "34713891", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1175721384136794, "ground_truth": 0}, {"key": "34713891", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2056150367812559, "ground_truth": 0}, {"key": "34713891", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.187132684954865, "ground_truth": 0}, {"key": "34713891", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776334857213485, "ground_truth": 0}, {"key": "18913023", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2613309066247544, "ground_truth": 0}, {"key": "18913023", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5717666069039883, "ground_truth": 0}, {"key": "18913023", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5214711652959265, "ground_truth": 0}, {"key": "18913023", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561505025703966, "ground_truth": 0}, {"key": "18913023", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782567799472203, "ground_truth": 0}, {"key": "36884100", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594721192879254, "ground_truth": 0}, {"key": "36884100", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3684057052784698, "ground_truth": 0}, {"key": "36884100", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1530421563530205, "ground_truth": 0}, {"key": "36884100", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.055412794893203464, "ground_truth": 0}, {"key": "36884100", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159119602338013, "ground_truth": 0}, {"key": "39899913", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24220563128743905, "ground_truth": 0}, {"key": "39899913", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2942149880525074, "ground_truth": 0}, {"key": "39899913", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378235315191785, "ground_truth": 0}, {"key": "39899913", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2254166153334893, "ground_truth": 0}, {"key": "39899913", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689413945252368, "ground_truth": 0}, {"key": "30725366", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11279540275051084, "ground_truth": 0}, {"key": "30725366", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5945512633028128, "ground_truth": 0}, {"key": "30725366", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07531230956198191, "ground_truth": 0}, {"key": "30725366", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06903793018379545, "ground_truth": 0}, {"key": "30725366", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920292532785601, "ground_truth": 0}, {"key": "26133523", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24077456547840537, "ground_truth": 0}, {"key": "26133523", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19193278023691204, "ground_truth": 0}, {"key": "26133523", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22405542816479465, "ground_truth": 0}, {"key": "26133523", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359361015461384, "ground_truth": 0}, {"key": "26133523", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692420204962, "ground_truth": 0}, {"key": "29332665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37937840437212356, "ground_truth": 0}, {"key": "29332665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6893056069820716, "ground_truth": 0}, {"key": "29332665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629692233888745, "ground_truth": 0}, {"key": "29332665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2351083776132644, "ground_truth": 0}, {"key": "29332665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473437743606, "ground_truth": 0}, {"key": "37400481", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48047868872089744, "ground_truth": 0}, {"key": "37400481", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5983122065500414, "ground_truth": 0}, {"key": "37400481", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5039061716490553, "ground_truth": 0}, {"key": "37400481", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165214582876, "ground_truth": 0}, {"key": "37400481", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295424791559, "ground_truth": 0}, {"key": "38787241", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2974699543842328, "ground_truth": 0}, {"key": "38787241", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3684057029817688, "ground_truth": 0}, {"key": "38787241", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3398276146468921, "ground_truth": 0}, {"key": "38787241", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.232310147262137, "ground_truth": 0}, {"key": "38787241", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575394570054, "ground_truth": 0}, {"key": "38225963", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20946968521799728, "ground_truth": 0}, {"key": "38225963", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813030863039965, "ground_truth": 0}, {"key": "38225963", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2942149676967812, "ground_truth": 0}, {"key": "38225963", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197238451311, "ground_truth": 0}, {"key": "38225963", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28298813159793723, "ground_truth": 0}, {"key": "26072034", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1267851696507629, "ground_truth": 0}, {"key": "26072034", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541661297253157, "ground_truth": 0}, {"key": "26072034", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3415824878827312, "ground_truth": 0}, {"key": "26072034", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660840360093618, "ground_truth": 0}, {"key": "26072034", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09268777559084514, "ground_truth": 0}, {"key": "35690810", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22135069486118267, "ground_truth": 0}, {"key": "35690810", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32082130266565423, "ground_truth": 0}, {"key": "35690810", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3539863016672701, "ground_truth": 0}, {"key": "35690810", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055767325855056, "ground_truth": 0}, {"key": "35690810", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610258850849, "ground_truth": 0}, {"key": "36855665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9073122312376946, "ground_truth": 0}, {"key": "36855665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7759445574462762, "ground_truth": 0}, {"key": "36855665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7905303118731016, "ground_truth": 0}, {"key": "36855665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213511843625, "ground_truth": 0}, {"key": "36855665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688267140371, "ground_truth": 0}, {"key": "29757662", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39981163113780926, "ground_truth": 0}, {"key": "29757662", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37387581891327737, "ground_truth": 0}, {"key": "29757662", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.273574390076584, "ground_truth": 0}, {"key": "29757662", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651623516157202, "ground_truth": 0}, {"key": "29757662", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056010029283, "ground_truth": 0}, {"key": "19134339", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2450849986383633, "ground_truth": 0}, {"key": "19134339", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3522017837769552, "ground_truth": 0}, {"key": "19134339", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13568954217106927, "ground_truth": 0}, {"key": "19134339", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026603776177298, "ground_truth": 0}, {"key": "19134339", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314739335331627, "ground_truth": 0}, {"key": "35360732", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5660185266270006, "ground_truth": 0}, {"key": "35360732", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43974735068344484, "ground_truth": 0}, {"key": "35360732", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5428632714351028, "ground_truth": 0}, {"key": "35360732", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804318891362, "ground_truth": 0}, {"key": "35360732", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.624293528831079, "ground_truth": 0}, {"key": "37713629", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8976952937799687, "ground_truth": 0}, {"key": "37713629", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6113819777379957, "ground_truth": 0}, {"key": "37713629", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7648916161194764, "ground_truth": 0}, {"key": "37713629", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585472130593, "ground_truth": 0}, {"key": "37713629", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673078816672, "ground_truth": 0}, {"key": "33393394", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238002140061233, "ground_truth": 0}, {"key": "33393394", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11201595826073804, "ground_truth": 0}, {"key": "33393394", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1801066568411418, "ground_truth": 0}, {"key": "33393394", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279540185309404, "ground_truth": 0}, {"key": "33393394", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10447732052259281, "ground_truth": 0}, {"key": "32275837", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6842640245394971, "ground_truth": 0}, {"key": "32275837", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6619228791065564, "ground_truth": 0}, {"key": "32275837", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7490872281811627, "ground_truth": 0}, {"key": "32275837", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601380078257, "ground_truth": 0}, {"key": "32275837", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282906532594, "ground_truth": 0}, {"key": "21458094", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34158249879460684, "ground_truth": 0}, {"key": "21458094", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43014734633803786, "ground_truth": 0}, {"key": "21458094", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5679366317758032, "ground_truth": 0}, {"key": "21458094", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.658417490989514, "ground_truth": 0}, {"key": "21458094", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845760124555702, "ground_truth": 0}, {"key": "40975362", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168778696915536, "ground_truth": 0}, {"key": "40975362", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3775406791110594, "ground_truth": 0}, {"key": "40975362", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936414589316207, "ground_truth": 0}, {"key": "40975362", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116470863525113, "ground_truth": 0}, {"key": "40975362", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.270480218182264, "ground_truth": 0}, {"key": "35234201", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43398143115276694, "ground_truth": 0}, {"key": "35234201", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5525397103889965, "ground_truth": 0}, {"key": "35234201", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2643583531145269, "ground_truth": 0}, {"key": "35234201", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202455309936996, "ground_truth": 0}, {"key": "35234201", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014735109628, "ground_truth": 0}, {"key": "36037573", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4054487582296819, "ground_truth": 0}, {"key": "36037573", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3665897109120024, "ground_truth": 0}, {"key": "36037573", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43590152749310324, "ground_truth": 0}, {"key": "36037573", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121382286083, "ground_truth": 0}, {"key": "36037573", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37022539547452693, "ground_truth": 0}, {"key": "30861915", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25386098573691385, "ground_truth": 0}, {"key": "30861915", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40922081935669735, "ground_truth": 0}, {"key": "30861915", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23651625554769223, "ground_truth": 0}, {"key": "30861915", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668641510677, "ground_truth": 0}, {"key": "30861915", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925952801057421, "ground_truth": 0}, {"key": "40173012", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44167300551235145, "ground_truth": 0}, {"key": "40173012", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43782348519700004, "ground_truth": 0}, {"key": "40173012", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1613202457134843, "ground_truth": 0}, {"key": "40173012", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934934285540965, "ground_truth": 0}, {"key": "40173012", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2107662860192378, "ground_truth": 0}, {"key": "35100330", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10669059680107353, "ground_truth": 0}, {"key": "35100330", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21337716089649347, "ground_truth": 0}, {"key": "35100330", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1403362568416458, "ground_truth": 0}, {"key": "35100330", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369626968875835, "ground_truth": 0}, {"key": "35100330", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1943678214780266, "ground_truth": 0}, {"key": "37220221", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5292633998153372, "ground_truth": 0}, {"key": "37220221", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7549149690501372, "ground_truth": 0}, {"key": "37220221", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3830641619976809, "ground_truth": 0}, {"key": "37220221", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764920014187, "ground_truth": 0}, {"key": "37220221", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707365766523064, "ground_truth": 0}, {"key": "38815218", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7310585610977506, "ground_truth": 0}, {"key": "38815218", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6774740312666495, "ground_truth": 0}, {"key": "38815218", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7718435160260766, "ground_truth": 0}, {"key": "38815218", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419943529324, "ground_truth": 0}, {"key": "38815218", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.834406880430884, "ground_truth": 0}, {"key": "39379109", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2227001395422881, "ground_truth": 0}, {"key": "39379109", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.123365619211332, "ground_truth": 0}, {"key": "39379109", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952110134177652, "ground_truth": 0}, {"key": "39379109", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943837497443, "ground_truth": 0}, {"key": "39379109", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217184598140592, "ground_truth": 0}, {"key": "14576125", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.176671605971241, "ground_truth": 0}, {"key": "14576125", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25091278916617266, "ground_truth": 0}, {"key": "14576125", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11920291949772852, "ground_truth": 0}, {"key": "14576125", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623679904495, "ground_truth": 0}, {"key": "14576125", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222252247986, "ground_truth": 0}, {"key": "40814250", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5640984656900672, "ground_truth": 0}, {"key": "40814250", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7969253671041125, "ground_truth": 0}, {"key": "40814250", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6460137099936363, "ground_truth": 0}, {"key": "40814250", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413819690512, "ground_truth": 0}, {"key": "40814250", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919991669051, "ground_truth": 0}, {"key": "36334488", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2909808682753422, "ground_truth": 0}, {"key": "36334488", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4532618628923652, "ground_truth": 0}, {"key": "36334488", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823338719805704, "ground_truth": 0}, {"key": "36334488", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359802185443, "ground_truth": 0}, {"key": "36334488", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756753163168786, "ground_truth": 0}, {"key": "36888322", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36296919316222326, "ground_truth": 0}, {"key": "36888322", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3040416804434924, "ground_truth": 0}, {"key": "36888322", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798284944888113, "ground_truth": 0}, {"key": "36888322", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223188761163755, "ground_truth": 0}, {"key": "36888322", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222275826025, "ground_truth": 0}, {"key": "37318916", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7704648010320639, "ground_truth": 0}, {"key": "37318916", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7676898670248676, "ground_truth": 0}, {"key": "37318916", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9032942006866879, "ground_truth": 0}, {"key": "37318916", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760307994368, "ground_truth": 0}, {"key": "37318916", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036254947629, "ground_truth": 0}, {"key": "39308700", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3363310476790436, "ground_truth": 0}, {"key": "39308700", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35936412553634495, "ground_truth": 0}, {"key": "39308700", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32594952775455394, "ground_truth": 0}, {"key": "39308700", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357440082141216, "ground_truth": 0}, {"key": "39308700", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1655931167267378, "ground_truth": 0}, {"key": "31061543", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.331119773188056, "ground_truth": 0}, {"key": "31061543", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35936412030251, "ground_truth": 0}, {"key": "31061543", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15304216856676806, "ground_truth": 0}, {"key": "31061543", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456015961858, "ground_truth": 0}, {"key": "31061543", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061686539668, "ground_truth": 0}, {"key": "37380894", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.166675396002077, "ground_truth": 0}, {"key": "37380894", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.548673491018715, "ground_truth": 0}, {"key": "37380894", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35220177966861194, "ground_truth": 0}, {"key": "37380894", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667539708869528, "ground_truth": 0}, {"key": "37380894", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306417011730026, "ground_truth": 0}, {"key": "38410139", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08093670866883262, "ground_truth": 0}, {"key": "38410139", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.0809367154857746, "ground_truth": 0}, {"key": "38410139", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0815197557342615, "ground_truth": 0}, {"key": "38410139", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275895155524, "ground_truth": 0}, {"key": "38410139", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441197167848765, "ground_truth": 0}, {"key": "35953842", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34687309036538255, "ground_truth": 0}, {"key": "35953842", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.777299883489575, "ground_truth": 0}, {"key": "35953842", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5117165968296608, "ground_truth": 0}, {"key": "35953842", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990487352053, "ground_truth": 0}, {"key": "35953842", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381630809683, "ground_truth": 0}, {"key": "39815663", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.06465348726846262, "ground_truth": 0}, {"key": "39815663", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.048136770129427374, "ground_truth": 0}, {"key": "39815663", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.05834583779720935, "ground_truth": 0}, {"key": "39815663", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670904781365, "ground_truth": 0}, {"key": "39815663", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11516223340349326, "ground_truth": 0}, {"key": "35121432", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40356687401118596, "ground_truth": 0}, {"key": "35121432", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46879061836321373, "ground_truth": 0}, {"key": "35121432", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688211176207, "ground_truth": 0}, {"key": "35121432", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398142860719324, "ground_truth": 0}, {"key": "35121432", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544110144186, "ground_truth": 0}, {"key": "21712310", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08819004455713206, "ground_truth": 0}, {"key": "21712310", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13028542765862136, "ground_truth": 0}, {"key": "21712310", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07055960042256706, "ground_truth": 0}, {"key": "21712310", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10521054065478187, "ground_truth": 0}, {"key": "21712310", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1666754035381909, "ground_truth": 0}, {"key": "37952914", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4785288140269155, "ground_truth": 0}, {"key": "37952914", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2553436470242517, "ground_truth": 0}, {"key": "37952914", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3468730665854504, "ground_truth": 0}, {"key": "37952914", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804719257368662, "ground_truth": 0}, {"key": "37952914", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121955364125254, "ground_truth": 0}, {"key": "38956779", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48633151020189075, "ground_truth": 0}, {"key": "38956779", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643785473674, "ground_truth": 0}, {"key": "38956779", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45132649556665744, "ground_truth": 0}, {"key": "38956779", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2658804779524153, "ground_truth": 0}, {"key": "38956779", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121956217443576, "ground_truth": 0}, {"key": "36101833", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49218813066510847, "ground_truth": 0}, {"key": "36101833", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3415825229424805, "ground_truth": 0}, {"key": "36101833", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30569730781620824, "ground_truth": 0}, {"key": "36101833", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586218298646, "ground_truth": 0}, {"key": "36101833", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051957940313, "ground_truth": 0}, {"key": "35544662", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1001722228331798, "ground_truth": 0}, {"key": "35544662", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20689405286312748, "ground_truth": 0}, {"key": "35544662", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13028542138029292, "ground_truth": 0}, {"key": "35544662", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586201435791, "ground_truth": 0}, {"key": "35544662", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610244983878, "ground_truth": 0}, {"key": "39759044", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3665897495988434, "ground_truth": 0}, {"key": "39759044", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32082129282679994, "ground_truth": 0}, {"key": "39759044", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782567989850812, "ground_truth": 0}, {"key": "39759044", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720528882364, "ground_truth": 0}, {"key": "39759044", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817893102784296, "ground_truth": 0}, {"key": "39433018", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7106282983961834, "ground_truth": 0}, {"key": "39433018", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7264256055058554, "ground_truth": 0}, {"key": "39433018", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7041601490751095, "ground_truth": 0}, {"key": "39433018", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250461245006177, "ground_truth": 0}, {"key": "39433018", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531037973296, "ground_truth": 0}, {"key": "22111959", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.744656348775238, "ground_truth": 0}, {"key": "22111959", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25091278608645357, "ground_truth": 0}, {"key": "22111959", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3242354041150446, "ground_truth": 0}, {"key": "22111959", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414089902516845, "ground_truth": 0}, {"key": "22111959", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.496093854393993, "ground_truth": 0}, {"key": "38210094", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22135067635254627, "ground_truth": 0}, {"key": "38210094", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29746992413662376, "ground_truth": 0}, {"key": "38210094", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13117322665528455, "ground_truth": 0}, {"key": "38210094", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14511537652190967, "ground_truth": 0}, {"key": "38210094", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11436852423079052, "ground_truth": 0}, {"key": "37675935", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31069439116726394, "ground_truth": 0}, {"key": "37675935", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7461389807482938, "ground_truth": 0}, {"key": "37675935", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49804686957725924, "ground_truth": 0}, {"key": "37675935", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241843791334, "ground_truth": 0}, {"key": "37675935", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730175622412, "ground_truth": 0}, {"key": "35732604", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12002562458890191, "ground_truth": 0}, {"key": "35732604", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541661249023545, "ground_truth": 0}, {"key": "35732604", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13296424575118018, "ground_truth": 0}, {"key": "35732604", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08210662486865376, "ground_truth": 0}, {"key": "35732604", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776334415799735, "ground_truth": 0}, {"key": "27453212", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934933836034214, "ground_truth": 0}, {"key": "27453212", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735743963613461, "ground_truth": 0}, {"key": "27453212", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31069438673209043, "ground_truth": 0}, {"key": "27453212", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510527016928694, "ground_truth": 0}, {"key": "27453212", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660839277487896, "ground_truth": 0}, {"key": "39910047", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10087862409448439, "ground_truth": 0}, {"key": "39910047", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3106943789640089, "ground_truth": 0}, {"key": "39910047", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1320661587196736, "ground_truth": 0}, {"key": "39910047", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033625669822722, "ground_truth": 0}, {"key": "39910047", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208213072324844, "ground_truth": 0}, {"key": "40054265", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1431877159014285, "ground_truth": 0}, {"key": "40054265", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19806417981796673, "ground_truth": 0}, {"key": "40054265", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12168575568463011, "ground_truth": 0}, {"key": "40054265", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1550784722454107, "ground_truth": 0}, {"key": "40054265", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765261952298498, "ground_truth": 0}, {"key": "19984615", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37204880043601796, "ground_truth": 0}, {"key": "19984615", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5331544003139467, "ground_truth": 0}, {"key": "19984615", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3960681936225558, "ground_truth": 0}, {"key": "19984615", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1801066603088566, "ground_truth": 0}, {"key": "19984615", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28140561161140837, "ground_truth": 0}, {"key": "16490806", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21733750880824354, "ground_truth": 0}, {"key": "16490806", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18594721191330324, "ground_truth": 0}, {"key": "16490806", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19682618808373692, "ground_truth": 0}, {"key": "16490806", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314738809676274, "ground_truth": 0}, {"key": "16490806", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490509987102, "ground_truth": 0}, {"key": "36396237", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8278281492401505, "ground_truth": 0}, {"key": "36396237", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6959583360598083, "ground_truth": 0}, {"key": "36396237", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7185944143296872, "ground_truth": 0}, {"key": "36396237", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165305784379, "ground_truth": 0}, {"key": "36396237", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737310046736, "ground_truth": 0}, {"key": "40726444", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4359015218149127, "ground_truth": 0}, {"key": "40726444", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8766343822120971, "ground_truth": 0}, {"key": "40726444", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7090191276231107, "ground_truth": 0}, {"key": "40726444", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256364073001, "ground_truth": 0}, {"key": "40726444", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245682881505, "ground_truth": 0}, {"key": "37314826", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24220563770091327, "ground_truth": 0}, {"key": "37314826", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398989047805, "ground_truth": 0}, {"key": "37314826", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13568954461836888, "ground_truth": 0}, {"key": "37314826", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223536920632, "ground_truth": 0}, {"key": "37314826", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510840032766755, "ground_truth": 0}, {"key": "38506971", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3557748915297993, "ground_truth": 0}, {"key": "38506971", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37937838207427377, "ground_truth": 0}, {"key": "38506971", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825680067409875, "ground_truth": 0}, {"key": "38506971", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15817435612260544, "ground_truth": 0}, {"key": "38506971", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660839263428776, "ground_truth": 0}, {"key": "40699312", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35577489538099555, "ground_truth": 0}, {"key": "40699312", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.433981462932066, "ground_truth": 0}, {"key": "40699312", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135069978851155, "ground_truth": 0}, {"key": "40699312", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237000990520314, "ground_truth": 0}, {"key": "40699312", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.433981482091998, "ground_truth": 0}, {"key": "34695474", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21866937993540783, "ground_truth": 0}, {"key": "34695474", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1789558870960883, "ground_truth": 0}, {"key": "34695474", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12852513806188828, "ground_truth": 0}, {"key": "34695474", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073548174724161, "ground_truth": 0}, {"key": "34695474", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10894504671855605, "ground_truth": 0}, {"key": "36281498", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.509764378215268, "ground_truth": 0}, {"key": "36281498", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6460137035830175, "ground_truth": 0}, {"key": "36281498", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688318312408, "ground_truth": 0}, {"key": "36281498", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.554470461008606, "ground_truth": 0}, {"key": "36281498", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681892208415, "ground_truth": 0}, {"key": "39558652", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13846179676959766, "ground_truth": 0}, {"key": "39558652", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15405756177757965, "ground_truth": 0}, {"key": "39558652", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40922079835402153, "ground_truth": 0}, {"key": "39558652", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912141066397565, "ground_truth": 0}, {"key": "39558652", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017792152728, "ground_truth": 0}, {"key": "37330579", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18242552700125253, "ground_truth": 0}, {"key": "37330579", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3433417424851154, "ground_truth": 0}, {"key": "37330579", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18010665948656968, "ground_truth": 0}, {"key": "37330579", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252322211767334, "ground_truth": 0}, {"key": "37330579", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434190359889076, "ground_truth": 0}, {"key": "40547658", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934933703145436, "ground_truth": 0}, {"key": "40547658", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1766716017722518, "ground_truth": 0}, {"key": "40547658", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14804718191459135, "ground_truth": 0}, {"key": "40547658", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048023144178046, "ground_truth": 0}, {"key": "40547658", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436426426868, "ground_truth": 0}, {"key": "37119340", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2005576755716359, "ground_truth": 0}, {"key": "37119340", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12592275813227335, "ground_truth": 0}, {"key": "37119340", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2107663111225131, "ground_truth": 0}, {"key": "37119340", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1688569535365762, "ground_truth": 0}, {"key": "37119340", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846178862013164, "ground_truth": 0}, {"key": "35301627", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3738758240150517, "ground_truth": 0}, {"key": "35301627", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3191213867754618, "ground_truth": 0}, {"key": "35301627", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35398629937632115, "ground_truth": 0}, {"key": "35301627", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2407745940966561, "ground_truth": 0}, {"key": "35301627", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463119274116605, "ground_truth": 0}, {"key": "34037168", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15002883078791346, "ground_truth": 0}, {"key": "34037168", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2538610214800701, "ground_truth": 0}, {"key": "34037168", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19193277740169642, "ground_truth": 0}, {"key": "34037168", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1592174099043543, "ground_truth": 0}, {"key": "34037168", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337717473306467, "ground_truth": 0}, {"key": "39703862", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6959583279031586, "ground_truth": 0}, {"key": "39703862", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40168779872814986, "ground_truth": 0}, {"key": "39703862", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7025300581604272, "ground_truth": 0}, {"key": "39703862", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.633410259845714, "ground_truth": 0}, {"key": "39703862", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004097600918, "ground_truth": 0}, {"key": "16554814", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4902356140655294, "ground_truth": 0}, {"key": "16554814", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9294404005971122, "ground_truth": 0}, {"key": "16554814", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5428632745652132, "ground_truth": 0}, {"key": "16554814", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984991122825, "ground_truth": 0}, {"key": "16554814", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606815961733377, "ground_truth": 0}, {"key": "32983099", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1338674851022392, "ground_truth": 0}, {"key": "32983099", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07751765520401188, "ground_truth": 0}, {"key": "32983099", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15405755603883556, "ground_truth": 0}, {"key": "32983099", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09807932033474338, "ground_truth": 0}, {"key": "32983099", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1550784785087327, "ground_truth": 0}, {"key": "41072994", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1895210862137275, "ground_truth": 0}, {"key": "41072994", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27357440713234527, "ground_truth": 0}, {"key": "41072994", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46101676457210944, "ground_truth": 0}, {"key": "41072994", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009527243732, "ground_truth": 0}, {"key": "41072994", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569735624296446, "ground_truth": 0}, {"key": "38396247", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4092207861761604, "ground_truth": 0}, {"key": "38396247", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3593641412987271, "ground_truth": 0}, {"key": "38396247", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7577943496659925, "ground_truth": 0}, {"key": "38396247", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239943365353, "ground_truth": 0}, {"key": "38396247", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014081218313, "ground_truth": 0}, {"key": "37507998", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4301473568491938, "ground_truth": 0}, {"key": "37507998", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41111087876655134, "ground_truth": 0}, {"key": "37507998", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5370413944210399, "ground_truth": 0}, {"key": "37507998", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490157412709787, "ground_truth": 0}, {"key": "37507998", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245188373175, "ground_truth": 0}, {"key": "32593929", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14511535849784155, "ground_truth": 0}, {"key": "32593929", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2782567944364264, "ground_truth": 0}, {"key": "32593929", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2509127873304801, "ground_truth": 0}, {"key": "32593929", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561505248846532, "ground_truth": 0}, {"key": "32593929", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2120688139120492, "ground_truth": 0}, {"key": "36056449", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14223190133314528, "ground_truth": 0}, {"key": "36056449", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18126321090028108, "ground_truth": 0}, {"key": "36056449", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19193280399674514, "ground_truth": 0}, {"key": "36056449", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751722596403, "ground_truth": 0}, {"key": "36056449", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407745716730638, "ground_truth": 0}, {"key": "21986185", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.256832002043367, "ground_truth": 0}, {"key": "21986185", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3647775651175255, "ground_truth": 0}, {"key": "21986185", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29583987394107464, "ground_truth": 0}, {"key": "21986185", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1613202437922155, "ground_truth": 0}, {"key": "21986185", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678110404758, "ground_truth": 0}, {"key": "40757465", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934933577309012, "ground_truth": 0}, {"key": "40757465", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10158944761405111, "ground_truth": 0}, {"key": "40757465", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0850990449645712, "ground_truth": 0}, {"key": "40757465", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1120159548041685, "ground_truth": 0}, {"key": "40757465", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14318770731099717, "ground_truth": 0}, {"key": "35198313", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5039061716274932, "ground_truth": 0}, {"key": "35198313", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3775406498700444, "ground_truth": 0}, {"key": "35198313", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27669052854804616, "ground_truth": 0}, {"key": "35198313", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678516670926993, "ground_truth": 0}, {"key": "35198313", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3157359972677596, "ground_truth": 0}, {"key": "30604618", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3611647050127117, "ground_truth": 0}, {"key": "30604618", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40356684978313806, "ground_truth": 0}, {"key": "30604618", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35042138476501367, "ground_truth": 0}, {"key": "30604618", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309138861441, "ground_truth": 0}, {"key": "30604618", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766716117387512, "ground_truth": 0}, {"key": "35779006", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3757064768104202, "ground_truth": 0}, {"key": "35779006", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.396068175688915, "ground_truth": 0}, {"key": "35779006", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2751297318994382, "ground_truth": 0}, {"key": "35779006", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921740755020727, "ground_truth": 0}, {"key": "35779006", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213586982823, "ground_truth": 0}, {"key": "33858956", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.435901508066892, "ground_truth": 0}, {"key": "33858956", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441197286128746, "ground_truth": 0}, {"key": "33858956", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523181221843, "ground_truth": 0}, {"key": "33858956", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.366589764746802, "ground_truth": 0}, {"key": "33858956", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910518338962894, "ground_truth": 0}, {"key": "38633880", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12506538476525755, "ground_truth": 0}, {"key": "38633880", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12765262199717511, "ground_truth": 0}, {"key": "38633880", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.06656918409360349, "ground_truth": 0}, {"key": "38633880", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09467770576782598, "ground_truth": 0}, {"key": "38633880", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06233104169466526, "ground_truth": 0}, {"key": "36654905", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8198933376714627, "ground_truth": 0}, {"key": "36654905", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9099070085900379, "ground_truth": 0}, {"key": "36654905", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8732148231173734, "ground_truth": 0}, {"key": "36654905", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047209076111, "ground_truth": 0}, {"key": "36654905", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307896428299, "ground_truth": 0}, {"key": "26547482", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08449275910078213, "ground_truth": 0}, {"key": "26547482", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1089450452468202, "ground_truth": 0}, {"key": "26547482", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14318771265896596, "ground_truth": 0}, {"key": "26547482", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07107366275684127, "ground_truth": 0}, {"key": "26547482", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12085323293980324, "ground_truth": 0}, {"key": "36439068", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28457600424280494, "ground_truth": 0}, {"key": "36439068", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10594828545703666, "ground_truth": 0}, {"key": "36439068", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15921740763940745, "ground_truth": 0}, {"key": "36439068", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.04707417868403868, "ground_truth": 0}, {"key": "36439068", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.040237943476934726, "ground_truth": 0}, {"key": "30501258", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2422056203297412, "ground_truth": 0}, {"key": "30501258", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31069438728753107, "ground_truth": 0}, {"key": "30501258", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2893716992029807, "ground_truth": 0}, {"key": "30501258", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242552827598266, "ground_truth": 0}, {"key": "30501258", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127871713547, "ground_truth": 0}, {"key": "37560941", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14903530102026405, "ground_truth": 0}, {"key": "37560941", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27512972158154597, "ground_truth": 0}, {"key": "37560941", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33285231643153207, "ground_truth": 0}, {"key": "37560941", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10594828004674396, "ground_truth": 0}, {"key": "37560941", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11124121607731907, "ground_truth": 0}, {"key": "36801665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4707366153610206, "ground_truth": 0}, {"key": "36801665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.569852649053832, "ground_truth": 0}, {"key": "36801665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40544871875207306, "ground_truth": 0}, {"key": "36801665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966392818758, "ground_truth": 0}, {"key": "36801665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364244552373288, "ground_truth": 0}, {"key": "34954610", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21076630861634255, "ground_truth": 0}, {"key": "34954610", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47657965059539287, "ground_truth": 0}, {"key": "34954610", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.239349348761024, "ground_truth": 0}, {"key": "34954610", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239109339686354, "ground_truth": 0}, {"key": "34954610", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793842968341514, "ground_truth": 0}, {"key": "37020510", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4016878090733176, "ground_truth": 0}, {"key": "37020510", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3056973228588287, "ground_truth": 0}, {"key": "37020510", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37570646324625245, "ground_truth": 0}, {"key": "37020510", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758110098855, "ground_truth": 0}, {"key": "37020510", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004126090421, "ground_truth": 0}, {"key": "38064637", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28776781840824367, "ground_truth": 0}, {"key": "38064637", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2798284875422357, "ground_truth": 0}, {"key": "38064637", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17781087121320516, "ground_truth": 0}, {"key": "38064637", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975961325698, "ground_truth": 0}, {"key": "38064637", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740648005725, "ground_truth": 0}, {"key": "40886108", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486735043778744, "ground_truth": 0}, {"key": "40886108", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7431680288655075, "ground_truth": 0}, {"key": "40886108", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7994423380818209, "ground_truth": 0}, {"key": "40886108", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647737155708, "ground_truth": 0}, {"key": "40886108", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918392543478, "ground_truth": 0}, {"key": "38554603", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3123699925632529, "ground_truth": 0}, {"key": "38554603", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45326182136218496, "ground_truth": 0}, {"key": "38554603", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2436424170150466, "ground_truth": 0}, {"key": "38554603", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758192981977, "ground_truth": 0}, {"key": "38554603", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557749053904889, "ground_truth": 0}, {"key": "39115586", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37937838250716216, "ground_truth": 0}, {"key": "39115586", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2974699568864545, "ground_truth": 0}, {"key": "39115586", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2958398663167029, "ground_truth": 0}, {"key": "39115586", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347661489383, "ground_truth": 0}, {"key": "39115586", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766831406458813, "ground_truth": 0}, {"key": "38786314", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28776781486513014, "ground_truth": 0}, {"key": "38786314", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12852514158463857, "ground_truth": 0}, {"key": "38786314", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2877678056567786, "ground_truth": 0}, {"key": "38786314", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447731267388655, "ground_truth": 0}, {"key": "38786314", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561503915095075, "ground_truth": 0}, {"key": "38721078", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47268346493840646, "ground_truth": 0}, {"key": "38721078", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41111086017989273, "ground_truth": 0}, {"key": "38721078", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6057990604973068, "ground_truth": 0}, {"key": "38721078", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593405910648, "ground_truth": 0}, {"key": "38721078", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102810313044, "ground_truth": 0}, {"key": "39475467", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27669053793818205, "ground_truth": 0}, {"key": "39475467", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4186969027191311, "ground_truth": 0}, {"key": "39475467", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5195213432561012, "ground_truth": 0}, {"key": "39475467", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687308517650656, "ground_truth": 0}, {"key": "39475467", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074556683071313, "ground_truth": 0}, {"key": "35691234", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.42250463121819803, "ground_truth": 0}, {"key": "35691234", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1847675197696057, "ground_truth": 0}, {"key": "35691234", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825679997346636, "ground_truth": 0}, {"key": "35691234", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238404175646856, "ground_truth": 0}, {"key": "35691234", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2018132248170019, "ground_truth": 0}, {"key": "36871390", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.355774890963464, "ground_truth": 0}, {"key": "36871390", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643690617512, "ground_truth": 0}, {"key": "36871390", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4629586332811938, "ground_truth": 0}, {"key": "36871390", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.531209371631698, "ground_truth": 0}, {"key": "36871390", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643718963475, "ground_truth": 0}, {"key": "31730844", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5467381372137226, "ground_truth": 0}, {"key": "31730844", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2120688019906382, "ground_truth": 0}, {"key": "31730844", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4921881208278566, "ground_truth": 0}, {"key": "31730844", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45326185467800895, "ground_truth": 0}, {"key": "31730844", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864515135672275, "ground_truth": 0}, {"key": "30810940", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09877258576747941, "ground_truth": 0}, {"key": "30810940", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15002882164708092, "ground_truth": 0}, {"key": "30810940", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20817891631605365, "ground_truth": 0}, {"key": "30810940", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470084105595, "ground_truth": 0}, {"key": "30810940", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10521054233650501, "ground_truth": 0}, {"key": "39352003", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3738758145975408, "ground_truth": 0}, {"key": "39352003", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36658972945886115, "ground_truth": 0}, {"key": "39352003", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35398631007440823, "ground_truth": 0}, {"key": "39352003", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975271903206, "ground_truth": 0}, {"key": "39352003", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944725560550707, "ground_truth": 0}, {"key": "40118123", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3539863046018235, "ground_truth": 0}, {"key": "40118123", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16995623270126153, "ground_truth": 0}, {"key": "40118123", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26894142365926865, "ground_truth": 0}, {"key": "40118123", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559311326391113, "ground_truth": 0}, {"key": "40118123", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1943678148575598, "ground_truth": 0}, {"key": "37114191", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15921740221626432, "ground_truth": 0}, {"key": "37114191", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12168574949348272, "ground_truth": 0}, {"key": "37114191", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2030746246615073, "ground_truth": 0}, {"key": "37114191", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562319155315, "ground_truth": 0}, {"key": "37114191", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06512754621173461, "ground_truth": 0}, {"key": "39268203", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43206340094944923, "ground_truth": 0}, {"key": "39268203", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23370636468234685, "ground_truth": 0}, {"key": "39268203", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3311197358745544, "ground_truth": 0}, {"key": "39268203", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526579272245, "ground_truth": 0}, {"key": "39268203", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981165003315283, "ground_truth": 0}, {"key": "37950968", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4551985684162558, "ground_truth": 0}, {"key": "37950968", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3007455947486383, "ground_truth": 0}, {"key": "37950968", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34158250647058824, "ground_truth": 0}, {"key": "37950968", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052646846617, "ground_truth": 0}, {"key": "37950968", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127980360774, "ground_truth": 0}, {"key": "34959807", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7279754246487807, "ground_truth": 0}, {"key": "34959807", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5273165207916949, "ground_truth": 0}, {"key": "34959807", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.482429144262436, "ground_truth": 0}, {"key": "34959807", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.627951218777457, "ground_truth": 0}, {"key": "34959807", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300833564075, "ground_truth": 0}, {"key": "35631314", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5964331394073841, "ground_truth": 0}, {"key": "35631314", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41679664810393124, "ground_truth": 0}, {"key": "35631314", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6959583179035687, "ground_truth": 0}, {"key": "35631314", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159683203747, "ground_truth": 0}, {"key": "35631314", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754067201138863, "ground_truth": 0}, {"key": "38082365", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6001883556522492, "ground_truth": 0}, {"key": "38082365", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.605799034838566, "ground_truth": 0}, {"key": "38082365", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6636689284503944, "ground_truth": 0}, {"key": "38082365", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.482429098207691, "ground_truth": 0}, {"key": "38082365", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352826859116, "ground_truth": 0}, {"key": "37242829", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44939261216247767, "ground_truth": 0}, {"key": "37242829", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4687906438787799, "ground_truth": 0}, {"key": "37242829", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5136684489003788, "ground_truth": 0}, {"key": "37242829", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984781416014, "ground_truth": 0}, {"key": "37242829", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702254024896566, "ground_truth": 0}, {"key": "38556068", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23231015383182735, "ground_truth": 0}, {"key": "38556068", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23091974934787757, "ground_truth": 0}, {"key": "38556068", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3684056886285867, "ground_truth": 0}, {"key": "38556068", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1931474003993845, "ground_truth": 0}, {"key": "38556068", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245400707614, "ground_truth": 0}, {"key": "32969336", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758599172406, "ground_truth": 0}, {"key": "32969336", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5117165939047952, "ground_truth": 0}, {"key": "32969336", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5039061760955559, "ground_truth": 0}, {"key": "32969336", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035649714303, "ground_truth": 0}, {"key": "32969336", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834112573859, "ground_truth": 0}, {"key": "36825153", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5331543877933616, "ground_truth": 0}, {"key": "36825153", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29746995739186777, "ground_truth": 0}, {"key": "36825153", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.217337510157029, "ground_truth": 0}, {"key": "36825153", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203225498156567, "ground_truth": 0}, {"key": "36825153", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678156738872, "ground_truth": 0}, {"key": "41050146", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758422653048, "ground_truth": 0}, {"key": "41050146", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29746992655217513, "ground_truth": 0}, {"key": "41050146", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3380771167405265, "ground_truth": 0}, {"key": "41050146", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580267460949, "ground_truth": 0}, {"key": "41050146", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295354597698, "ground_truth": 0}, {"key": "27865037", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3225259773518531, "ground_truth": 0}, {"key": "27865037", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2583259887423863, "ground_truth": 0}, {"key": "27865037", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21337718342364256, "ground_truth": 0}, {"key": "27865037", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689403971073853, "ground_truth": 0}, {"key": "27865037", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588046828591716, "ground_truth": 0}, {"key": "39868565", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16559311541365734, "ground_truth": 0}, {"key": "39868565", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23231014910314288, "ground_truth": 0}, {"key": "39868565", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2568320049253313, "ground_truth": 0}, {"key": "39868565", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903530721658373, "ground_truth": 0}, {"key": "39868565", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091279346067635, "ground_truth": 0}, {"key": "37761968", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2583259756435307, "ground_truth": 0}, {"key": "37761968", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2494472181529881, "ground_truth": 0}, {"key": "37761968", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46684561308407724, "ground_truth": 0}, {"key": "37761968", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109917323956, "ground_truth": 0}, {"key": "37761968", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3140505607761009, "ground_truth": 0}, {"key": "16326139", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3123700048131604, "ground_truth": 0}, {"key": "16326139", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6076631730560104, "ground_truth": 0}, {"key": "16326139", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6825737083752184, "ground_truth": 0}, {"key": "16326139", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29421498640677474, "ground_truth": 0}, {"key": "16326139", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405546629327341, "ground_truth": 0}, {"key": "36568381", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23231013177657636, "ground_truth": 0}, {"key": "36568381", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3486451278298711, "ground_truth": 0}, {"key": "36568381", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23651623937363578, "ground_truth": 0}, {"key": "36568381", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082130574079554, "ground_truth": 0}, {"key": "36568381", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.247987431335746, "ground_truth": 0}, {"key": "39855613", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6132365267465995, "ground_truth": 0}, {"key": "39855613", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7057850191590102, "ground_truth": 0}, {"key": "39855613", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8766343659839836, "ground_truth": 0}, {"key": "39855613", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026617435204, "ground_truth": 0}, {"key": "39855613", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445442223031, "ground_truth": 0}, {"key": "29856302", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3923368154918464, "ground_truth": 0}, {"key": "29856302", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31405052453959337, "ground_truth": 0}, {"key": "29856302", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3106943934501694, "ground_truth": 0}, {"key": "29856302", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44939265450768523, "ground_truth": 0}, {"key": "29856302", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491215125519335, "ground_truth": 0}, {"key": "35641106", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44360042927330384, "ground_truth": 0}, {"key": "35641106", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389831901229425, "ground_truth": 0}, {"key": "35641106", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4493926402994425, "ground_truth": 0}, {"key": "35641106", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014735246893004, "ground_truth": 0}, {"key": "35641106", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568319848594201, "ground_truth": 0}, {"key": "39474558", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.046378209830661626, "ground_truth": 0}, {"key": "39474558", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06512754942258876, "ground_truth": 0}, {"key": "39474558", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.06418264465055952, "ground_truth": 0}, {"key": "39474558", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.053799641533513125, "ground_truth": 0}, {"key": "39474558", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0596469434780848, "ground_truth": 0}, {"key": "34338135", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.607663154988159, "ground_truth": 0}, {"key": "34338135", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7008947948020494, "ground_truth": 0}, {"key": "34338135", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7662936592117643, "ground_truth": 0}, {"key": "34338135", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254149907328, "ground_truth": 0}, {"key": "34338135", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056139008463, "ground_truth": 0}, {"key": "35870330", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35936414856420207, "ground_truth": 0}, {"key": "35870330", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45907613697951544, "ground_truth": 0}, {"key": "35870330", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4863315287659755, "ground_truth": 0}, {"key": "35870330", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064562962555, "ground_truth": 0}, {"key": "35870330", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233684582898515, "ground_truth": 0}, {"key": "24478245", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30239110286774007, "ground_truth": 0}, {"key": "24478245", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817892761912052, "ground_truth": 0}, {"key": "24478245", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4282334103743526, "ground_truth": 0}, {"key": "24478245", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2146914215768702, "ground_truth": 0}, {"key": "24478245", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974733405826566, "ground_truth": 0}, {"key": "38485946", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18126320793079626, "ground_truth": 0}, {"key": "38485946", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1859471795011391, "ground_truth": 0}, {"key": "38485946", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135067618202198, "ground_truth": 0}, {"key": "38485946", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922076368853666, "ground_truth": 0}, {"key": "38485946", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34510526984162776, "ground_truth": 0}, {"key": "32509613", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5058591189176088, "ground_truth": 0}, {"key": "32509613", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7041601203043281, "ground_truth": 0}, {"key": "32509613", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823339625389806, "ground_truth": 0}, {"key": "32509613", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1859472024129699, "ground_truth": 0}, {"key": "32509613", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937168565230376, "ground_truth": 0}, {"key": "34078819", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26588046455310116, "ground_truth": 0}, {"key": "34078819", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3486451120786768, "ground_truth": 0}, {"key": "34078819", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3942009557267437, "ground_truth": 0}, {"key": "34078819", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195695479716, "ground_truth": 0}, {"key": "34078819", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358786669443, "ground_truth": 0}, {"key": "39523865", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20181322688569334, "ground_truth": 0}, {"key": "39523865", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4359015194062576, "ground_truth": 0}, {"key": "39523865", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48633152737758817, "ground_truth": 0}, {"key": "39523865", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917087892099, "ground_truth": 0}, {"key": "39523865", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942866799402, "ground_truth": 0}, {"key": "33146158", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40733338360481836, "ground_truth": 0}, {"key": "33146158", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2365162367044844, "ground_truth": 0}, {"key": "33146158", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09947021181301426, "ground_truth": 0}, {"key": "33146158", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347117013278, "ground_truth": 0}, {"key": "33146158", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1520322464492356, "ground_truth": 0}, {"key": "32083974", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3593641385190061, "ground_truth": 0}, {"key": "32083974", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21337716729496284, "ground_truth": 0}, {"key": "32083974", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5389832233532971, "ground_truth": 0}, {"key": "32083974", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692498729601, "ground_truth": 0}, {"key": "32083974", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828339025783823, "ground_truth": 0}, {"key": "34378482", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4843800874208727, "ground_truth": 0}, {"key": "34378482", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47657963697664, "ground_truth": 0}, {"key": "34378482", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5350984130973655, "ground_truth": 0}, {"key": "34378482", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704386146521, "ground_truth": 0}, {"key": "34378482", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647405513845, "ground_truth": 0}, {"key": "38080102", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3191213819921208, "ground_truth": 0}, {"key": "38080102", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202456168626127, "ground_truth": 0}, {"key": "38080102", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3539862937985573, "ground_truth": 0}, {"key": "38080102", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387580110497237, "ground_truth": 0}, {"key": "38080102", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730907172577, "ground_truth": 0}, {"key": "40244537", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2281565090781724, "ground_truth": 0}, {"key": "40244537", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28457599265751454, "ground_truth": 0}, {"key": "40244537", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21076631339463653, "ground_truth": 0}, {"key": "40244537", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2422056374088074, "ground_truth": 0}, {"key": "40244537", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713683685857857, "ground_truth": 0}, {"key": "33497789", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5640984823638598, "ground_truth": 0}, {"key": "33497789", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5983122077069631, "ground_truth": 0}, {"key": "33497789", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.247987434146706, "ground_truth": 0}, {"key": "33497789", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807711978091043, "ground_truth": 0}, {"key": "33497789", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684560882724957, "ground_truth": 0}, {"key": "28816889", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5331543882071924, "ground_truth": 0}, {"key": "28816889", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3451052794007366, "ground_truth": 0}, {"key": "28816889", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5907792081641312, "ground_truth": 0}, {"key": "28816889", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573598008564085, "ground_truth": 0}, {"key": "28816889", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508500675057263, "ground_truth": 0}, {"key": "38157127", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17781087279564387, "ground_truth": 0}, {"key": "38157127", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24364244307771268, "ground_truth": 0}, {"key": "38157127", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19072401719036594, "ground_truth": 0}, {"key": "38157127", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817892969808685, "ground_truth": 0}, {"key": "38157127", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.286169270027517, "ground_truth": 0}, {"key": "36183569", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19072402020786544, "ground_truth": 0}, {"key": "36183569", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1812632172985294, "ground_truth": 0}, {"key": "36183569", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782567818721296, "ground_truth": 0}, {"key": "36183569", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.300745593721708, "ground_truth": 0}, {"key": "36183569", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149690303573, "ground_truth": 0}, {"key": "36012016", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2643583473447695, "ground_truth": 0}, {"key": "36012016", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2751297196864935, "ground_truth": 0}, {"key": "36012016", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782568041636069, "ground_truth": 0}, {"key": "36012016", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912139401498135, "ground_truth": 0}, {"key": "36012016", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458942704618755, "ground_truth": 0}, {"key": "34571973", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23651623606408703, "ground_truth": 0}, {"key": "34571973", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2509127822363072, "ground_truth": 0}, {"key": "34571973", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21733750688105943, "ground_truth": 0}, {"key": "34571973", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158945110091118, "ground_truth": 0}, {"key": "34571973", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846178730909808, "ground_truth": 0}, {"key": "38707498", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7325918448148004, "ground_truth": 0}, {"key": "38707498", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531003364376, "ground_truth": 0}, {"key": "38707498", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6187804385415083, "ground_truth": 0}, {"key": "38707498", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011640266588, "ground_truth": 0}, {"key": "38707498", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168781414965854, "ground_truth": 0}, {"key": "35459082", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8489721923698625, "ground_truth": 0}, {"key": "35459082", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.749087226828717, "ground_truth": 0}, {"key": "35459082", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7563575511972179, "ground_truth": 0}, {"key": "35459082", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.863391617172093, "ground_truth": 0}, {"key": "35459082", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337088052946, "ground_truth": 0}, {"key": "39464041", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8300437770459955, "ground_truth": 0}, {"key": "39464041", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.717011894455554, "ground_truth": 0}, {"key": "39464041", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9178933698831121, "ground_truth": 0}, {"key": "39464041", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445344374354, "ground_truth": 0}, {"key": "39464041", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632899831566, "ground_truth": 0}, {"key": "23782052", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44746030132026343, "ground_truth": 0}, {"key": "23782052", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25386101764992763, "ground_truth": 0}, {"key": "23782052", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5660185329858618, "ground_truth": 0}, {"key": "23782052", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269965431259, "ground_truth": 0}, {"key": "23782052", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802560643308, "ground_truth": 0}, {"key": "36568455", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4073333942361249, "ground_truth": 0}, {"key": "36568455", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48633154171784176, "ground_truth": 0}, {"key": "36568455", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4167966274076176, "ground_truth": 0}, {"key": "36568455", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618545113865, "ground_truth": 0}, {"key": "36568455", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081514562998, "ground_truth": 0}, {"key": "38469552", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6959583333203221, "ground_truth": 0}, {"key": "38469552", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5292633865738665, "ground_truth": 0}, {"key": "38469552", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45519861387147925, "ground_truth": 0}, {"key": "38469552", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792218167728, "ground_truth": 0}, {"key": "38469552", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526211902208, "ground_truth": 0}, {"key": "35922277", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5813030888086097, "ground_truth": 0}, {"key": "35922277", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6442251104768449, "ground_truth": 0}, {"key": "35922277", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4941409048690774, "ground_truth": 0}, {"key": "35922277", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.54867351720321, "ground_truth": 0}, {"key": "35922277", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.59455127339371, "ground_truth": 0}, {"key": "32744293", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.411110870823332, "ground_truth": 0}, {"key": "32744293", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4629586196863981, "ground_truth": 0}, {"key": "32744293", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5698526574512904, "ground_truth": 0}, {"key": "32744293", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746029048377123, "ground_truth": 0}, {"key": "32744293", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618289824731, "ground_truth": 0}, {"key": "30972362", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6057990313311298, "ground_truth": 0}, {"key": "30972362", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990317629, "ground_truth": 0}, {"key": "30972362", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6671476564659901, "ground_truth": 0}, {"key": "30972362", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238798387405, "ground_truth": 0}, {"key": "30972362", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119929379689, "ground_truth": 0}, {"key": "36380943", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27048022460057, "ground_truth": 0}, {"key": "36380943", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5117166116195699, "ground_truth": 0}, {"key": "36380943", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798284740302612, "ground_truth": 0}, {"key": "36380943", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36840570615163304, "ground_truth": 0}, {"key": "36380943", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239109219737687, "ground_truth": 0}, {"key": "36929355", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2909808463449572, "ground_truth": 0}, {"key": "36929355", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33458944642866634, "ground_truth": 0}, {"key": "36929355", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22000708912664727, "ground_truth": 0}, {"key": "36929355", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939171345426266, "ground_truth": 0}, {"key": "36929355", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944723550994718, "ground_truth": 0}, {"key": "39127206", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6095241446901082, "ground_truth": 0}, {"key": "39127206", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16885695229801773, "ground_truth": 0}, {"key": "39127206", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22270012486935808, "ground_truth": 0}, {"key": "39127206", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802762470639, "ground_truth": 0}, {"key": "39127206", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632949353079, "ground_truth": 0}, {"key": "36128318", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29583986841623466, "ground_truth": 0}, {"key": "36128318", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5602526572242186, "ground_truth": 0}, {"key": "36128318", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24077458744575242, "ground_truth": 0}, {"key": "36128318", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203401202843, "ground_truth": 0}, {"key": "36128318", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473573015402, "ground_truth": 0}, {"key": "39863480", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5195213204301019, "ground_truth": 0}, {"key": "39863480", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5621764856908636, "ground_truth": 0}, {"key": "39863480", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.712232167377425, "ground_truth": 0}, {"key": "39863480", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671477047795438, "ground_truth": 0}, {"key": "39863480", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984718903841, "ground_truth": 0}, {"key": "38634057", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.247987406327685, "ground_truth": 0}, {"key": "38634057", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2295352101530311, "ground_truth": 0}, {"key": "38634057", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4687906152162291, "ground_truth": 0}, {"key": "38634057", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434190821077597, "ground_truth": 0}, {"key": "38634057", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128141721585966, "ground_truth": 0}, {"key": "33131935", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35756751297072414, "ground_truth": 0}, {"key": "33131935", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389832342847322, "ground_truth": 0}, {"key": "33131935", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41300356427321905, "ground_truth": 0}, {"key": "33131935", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436003988264616, "ground_truth": 0}, {"key": "33131935", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981165900740323, "ground_truth": 0}, {"key": "39021319", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21337716873061585, "ground_truth": 0}, {"key": "39021319", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12592277037438632, "ground_truth": 0}, {"key": "39021319", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20817892843578314, "ground_truth": 0}, {"key": "39021319", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121621437941, "ground_truth": 0}, {"key": "39021319", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09138210287938578, "ground_truth": 0}, {"key": "40644571", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2107663066742749, "ground_truth": 0}, {"key": "40644571", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1192029225453029, "ground_truth": 0}, {"key": "40644571", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13846178710890691, "ground_truth": 0}, {"key": "40644571", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11920292301990983, "ground_truth": 0}, {"key": "40644571", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952107925224057, "ground_truth": 0}, {"key": "14681877", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28298808677513404, "ground_truth": 0}, {"key": "14681877", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202454173055235, "ground_truth": 0}, {"key": "14681877", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3557748976497479, "ground_truth": 0}, {"key": "14681877", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573596497882667, "ground_truth": 0}, {"key": "14681877", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132023652607777, "ground_truth": 0}, {"key": "36570890", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33807710993402773, "ground_truth": 0}, {"key": "36570890", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6688802542929473, "ground_truth": 0}, {"key": "36570890", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4824291141808046, "ground_truth": 0}, {"key": "36570890", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023563755719185, "ground_truth": 0}, {"key": "36570890", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668599707643, "ground_truth": 0}, {"key": "30452755", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6531269085525625, "ground_truth": 0}, {"key": "30452755", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5983121822130868, "ground_truth": 0}, {"key": "30452755", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5195213360238988, "ground_truth": 0}, {"key": "30452755", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943150457158, "ground_truth": 0}, {"key": "30452755", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938237587249, "ground_truth": 0}, {"key": "37347053", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24944723854997491, "ground_truth": 0}, {"key": "37347053", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21866938025803284, "ground_truth": 0}, {"key": "37347053", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2379298991589262, "ground_truth": 0}, {"key": "37347053", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808911161556, "ground_truth": 0}, {"key": "37347053", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594720817428118, "ground_truth": 0}, {"key": "38890979", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17781086747575958, "ground_truth": 0}, {"key": "38890979", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21601153960347902, "ground_truth": 0}, {"key": "38890979", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21733752545195215, "ground_truth": 0}, {"key": "38890979", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921741629861827, "ground_truth": 0}, {"key": "38890979", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1655931093903649, "ground_truth": 0}, {"key": "32974694", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15610490346857994, "ground_truth": 0}, {"key": "32974694", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3451052892425735, "ground_truth": 0}, {"key": "32974694", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18010665212427157, "ground_truth": 0}, {"key": "32974694", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2751297093789206, "ground_truth": 0}, {"key": "32974694", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776335215163155, "ground_truth": 0}, {"key": "38519940", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6187804264785993, "ground_truth": 0}, {"key": "38519940", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47657968239222637, "ground_truth": 0}, {"key": "38519940", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38676344501820914, "ground_truth": 0}, {"key": "38519940", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318295176026, "ground_truth": 0}, {"key": "38519940", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036222718817, "ground_truth": 0}, {"key": "38870104", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5679366051393363, "ground_truth": 0}, {"key": "38870104", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40356685292146904, "ground_truth": 0}, {"key": "38870104", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3738758096992093, "ground_truth": 0}, {"key": "38870104", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966336727848, "ground_truth": 0}, {"key": "38870104", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116437957654, "ground_truth": 0}, {"key": "34283161", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19193279552131584, "ground_truth": 0}, {"key": "34283161", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3451052852117862, "ground_truth": 0}, {"key": "34283161", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12506537813659718, "ground_truth": 0}, {"key": "34283161", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610119904096, "ground_truth": 0}, {"key": "34283161", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668462463376, "ground_truth": 0}, {"key": "31650463", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26588045721163717, "ground_truth": 0}, {"key": "31650463", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47268347690261847, "ground_truth": 0}, {"key": "31650463", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3775406622577389, "ground_truth": 0}, {"key": "31650463", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3793783854068032, "ground_truth": 0}, {"key": "31650463", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917163830545, "ground_truth": 0}, {"key": "35589432", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6654105695229824, "ground_truth": 0}, {"key": "35589432", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4863315342726, "ground_truth": 0}, {"key": "35589432", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736783846355922, "ground_truth": 0}, {"key": "35589432", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381467847294, "ground_truth": 0}, {"key": "35589432", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022231042695, "ground_truth": 0}, {"key": "14412752", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39233681774182444, "ground_truth": 0}, {"key": "14412752", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43590152666172577, "ground_truth": 0}, {"key": "14412752", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37387579733469684, "ground_truth": 0}, {"key": "14412752", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775390658416, "ground_truth": 0}, {"key": "14412752", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199383851744, "ground_truth": 0}, {"key": "37271183", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6671476782326868, "ground_truth": 0}, {"key": "37271183", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6893056076977228, "ground_truth": 0}, {"key": "37271183", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8509647110908145, "ground_truth": 0}, {"key": "37271183", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358397637235, "ground_truth": 0}, {"key": "37271183", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916163000913, "ground_truth": 0}, {"key": "35588153", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7154239702951534, "ground_truth": 0}, {"key": "35588153", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8044059250672858, "ground_truth": 0}, {"key": "35588153", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6206216065855433, "ground_truth": 0}, {"key": "35588153", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.810478932139871, "ground_truth": 0}, {"key": "35588153", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300761888815, "ground_truth": 0}, {"key": "39876692", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3242354195638759, "ground_truth": 0}, {"key": "39876692", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36477753460745477, "ground_truth": 0}, {"key": "39876692", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42059963345738216, "ground_truth": 0}, {"key": "39876692", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353918524764, "ground_truth": 0}, {"key": "39876692", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568320070461029, "ground_truth": 0}, {"key": "38992323", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3830641547947068, "ground_truth": 0}, {"key": "38992323", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3575675206672922, "ground_truth": 0}, {"key": "38992323", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4416730131204518, "ground_truth": 0}, {"key": "38992323", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632728375083, "ground_truth": 0}, {"key": "38992323", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633960081993, "ground_truth": 0}, {"key": "37556002", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1801066732360539, "ground_truth": 0}, {"key": "37556002", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1602660333910273, "ground_truth": 0}, {"key": "37556002", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20561504712602838, "ground_truth": 0}, {"key": "37556002", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512971850072804, "ground_truth": 0}, {"key": "37556002", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20181322652700426, "ground_truth": 0}, {"key": "39875801", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6859494860326951, "ground_truth": 0}, {"key": "39875801", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35577487524998036, "ground_truth": 0}, {"key": "39875801", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6671476785468726, "ground_truth": 0}, {"key": "39875801", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203455890071, "ground_truth": 0}, {"key": "39875801", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428633023660681, "ground_truth": 0}, {"key": "39272285", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798285070062842, "ground_truth": 0}, {"key": "39272285", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12421301144273023, "ground_truth": 0}, {"key": "39272285", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2450850196267846, "ground_truth": 0}, {"key": "39272285", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910662158591, "ground_truth": 0}, {"key": "39272285", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754066411172427, "ground_truth": 0}, {"key": "39629714", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3140505313803193, "ground_truth": 0}, {"key": "39629714", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.09073548540047333, "ground_truth": 0}, {"key": "39629714", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2309197442503413, "ground_truth": 0}, {"key": "39629714", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08882029176881193, "ground_truth": 0}, {"key": "39629714", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568320004726967, "ground_truth": 0}, {"key": "34043257", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5428632772166424, "ground_truth": 0}, {"key": "34043257", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4474602853099383, "ground_truth": 0}, {"key": "34043257", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5370413812457971, "ground_truth": 0}, {"key": "34043257", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804310949072, "ground_truth": 0}, {"key": "34043257", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631920678583, "ground_truth": 0}, {"key": "33995240", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817892873114582, "ground_truth": 0}, {"key": "33995240", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5331543906879788, "ground_truth": 0}, {"key": "33995240", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39233682289313027, "ground_truth": 0}, {"key": "33995240", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217184920957684, "ground_truth": 0}, {"key": "33995240", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641555972855, "ground_truth": 0}, {"key": "39399948", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49023563717913937, "ground_truth": 0}, {"key": "39399948", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982180625294, "ground_truth": 0}, {"key": "39399948", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32082130552000376, "ground_truth": 0}, {"key": "39399948", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666591472751, "ground_truth": 0}, {"key": "39399948", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941409156237261, "ground_truth": 0}, {"key": "33185890", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5602526594522369, "ground_truth": 0}, {"key": "33185890", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6261241780530227, "ground_truth": 0}, {"key": "33185890", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6224593250062632, "ground_truth": 0}, {"key": "33185890", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.51757085728728, "ground_truth": 0}, {"key": "33185890", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.476579657448531, "ground_truth": 0}, {"key": "35280425", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1592174041170662, "ground_truth": 0}, {"key": "35280425", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28298809645074463, "ground_truth": 0}, {"key": "35280425", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20055768563429832, "ground_truth": 0}, {"key": "35280425", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.115960719792498, "ground_truth": 0}, {"key": "35280425", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14318771483981182, "ground_truth": 0}, {"key": "16365170", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5926666019402229, "ground_truth": 0}, {"key": "16365170", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7853086062957284, "ground_truth": 0}, {"key": "16365170", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7431680157949079, "ground_truth": 0}, {"key": "16365170", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735217042322, "ground_truth": 0}, {"key": "16365170", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804339474766, "ground_truth": 0}, {"key": "24388238", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23091977457549653, "ground_truth": 0}, {"key": "24388238", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2766905371399599, "ground_truth": 0}, {"key": "24388238", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19559405730302326, "ground_truth": 0}, {"key": "24388238", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2254166051315041, "ground_truth": 0}, {"key": "24388238", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1871326983179741, "ground_truth": 0}, {"key": "35024827", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17217185391042064, "ground_truth": 0}, {"key": "35024827", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17667160966632878, "ground_truth": 0}, {"key": "35024827", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13753245624799829, "ground_truth": 0}, {"key": "35024827", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2081789307367406, "ground_truth": 0}, {"key": "35024827", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09670578843511721, "ground_truth": 0}, {"key": "38624944", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48633148535711374, "ground_truth": 0}, {"key": "38624944", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4359015234621625, "ground_truth": 0}, {"key": "38624944", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5945512886055025, "ground_truth": 0}, {"key": "38624944", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519860872510454, "ground_truth": 0}, {"key": "38624944", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754386179322, "ground_truth": 0}, {"key": "34719830", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3611647332017532, "ground_truth": 0}, {"key": "34719830", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47852883614035463, "ground_truth": 0}, {"key": "34719830", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5389831964043391, "ground_truth": 0}, {"key": "34719830", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476988187159, "ground_truth": 0}, {"key": "34719830", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474603036679675, "ground_truth": 0}, {"key": "38995225", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17328820813995446, "ground_truth": 0}, {"key": "38995225", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3123700079886899, "ground_truth": 0}, {"key": "38995225", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14223189026917255, "ground_truth": 0}, {"key": "38995225", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895589837364256, "ground_truth": 0}, {"key": "38995225", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242552308912255, "ground_truth": 0}, {"key": "34242311", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16559310023818935, "ground_truth": 0}, {"key": "34242311", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37022538369758023, "ground_truth": 0}, {"key": "34242311", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07696083473984003, "ground_truth": 0}, {"key": "34242311", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516222868880971, "ground_truth": 0}, {"key": "34242311", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193280291303116, "ground_truth": 0}, {"key": "39253748", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6636689390174889, "ground_truth": 0}, {"key": "39253748", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6495786215551755, "ground_truth": 0}, {"key": "39253748", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4726834545243279, "ground_truth": 0}, {"key": "39253748", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526667858956, "ground_truth": 0}, {"key": "39253748", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185319379989, "ground_truth": 0}, {"key": "37131104", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9674102568250071, "ground_truth": 0}, {"key": "37131104", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9224823430648412, "ground_truth": 0}, {"key": "37131104", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9190632946332181, "ground_truth": 0}, {"key": "37131104", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9658995752609664, "ground_truth": 0}, {"key": "37131104", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9790357586334376, "ground_truth": 0}, {"key": "38490554", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6548947458513237, "ground_truth": 0}, {"key": "38490554", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5448013875606043, "ground_truth": 0}, {"key": "38490554", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.750552762852997, "ground_truth": 0}, {"key": "38490554", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512676009167, "ground_truth": 0}, {"key": "38490554", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.682573717107273, "ground_truth": 0}, {"key": "29009500", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28616926329607273, "ground_truth": 0}, {"key": "29009500", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5602526723512928, "ground_truth": 0}, {"key": "29009500", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38491215329156875, "ground_truth": 0}, {"key": "29009500", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245597239153, "ground_truth": 0}, {"key": "29009500", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284185761557094, "ground_truth": 0}, {"key": "36703057", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "36703057", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17781086630888496, "ground_truth": 0}, {"key": "36703057", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22541660953419795, "ground_truth": 0}, {"key": "36703057", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270013362648947, "ground_truth": 0}, {"key": "36703057", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.190724015042248, "ground_truth": 0}, {"key": "34876987", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7745833957751733, "ground_truth": 0}, {"key": "34876987", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033733354468, "ground_truth": 0}, {"key": "34876987", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058590975574837, "ground_truth": 0}, {"key": "34876987", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111087109579747, "ground_truth": 0}, {"key": "34876987", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726835102611686, "ground_truth": 0}, {"key": "36209258", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34510527925651924, "ground_truth": 0}, {"key": "36209258", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5544704735311622, "ground_truth": 0}, {"key": "36209258", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1801066733472, "ground_truth": 0}, {"key": "36209258", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881239197045, "ground_truth": 0}, {"key": "36209258", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234997202286, "ground_truth": 0}, {"key": "36854437", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13939638818335737, "ground_truth": 0}, {"key": "36854437", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2958398410961475, "ground_truth": 0}, {"key": "36854437", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1097057728486533, "ground_truth": 0}, {"key": "36854437", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13296425214394098, "ground_truth": 0}, {"key": "36854437", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676401010318777, "ground_truth": 0}, {"key": "38047723", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13477592088466622, "ground_truth": 0}, {"key": "38047723", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19072402195613836, "ground_truth": 0}, {"key": "38047723", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08035746827657315, "ground_truth": 0}, {"key": "38047723", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224222634731, "ground_truth": 0}, {"key": "38047723", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.175538063126137, "ground_truth": 0}, {"key": "34287816", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21601153609079543, "ground_truth": 0}, {"key": "34287816", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28298811331933077, "ground_truth": 0}, {"key": "34287816", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3904758414031302, "ground_truth": 0}, {"key": "34287816", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.346873078657286, "ground_truth": 0}, {"key": "34287816", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168779843477975, "ground_truth": 0}, {"key": "33235855", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.855851147917174, "ground_truth": 0}, {"key": "33235855", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6406358530157942, "ground_truth": 0}, {"key": "33235855", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5907792054091047, "ground_truth": 0}, {"key": "33235855", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228905134005, "ground_truth": 0}, {"key": "33235855", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416508786281, "ground_truth": 0}, {"key": "34381016", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2814055886770127, "ground_truth": 0}, {"key": "34381016", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37387583656695306, "ground_truth": 0}, {"key": "34381016", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37204876693823047, "ground_truth": 0}, {"key": "34381016", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468731114759827, "ground_truth": 0}, {"key": "34381016", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326183775162787, "ground_truth": 0}, {"key": "28064995", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798285095928334, "ground_truth": 0}, {"key": "28064995", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3738758158954002, "ground_truth": 0}, {"key": "28064995", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18126321718191513, "ground_truth": 0}, {"key": "28064995", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002696467374, "ground_truth": 0}, {"key": "28064995", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594720853636518, "ground_truth": 0}, {"key": "37576197", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114485057295, "ground_truth": 0}, {"key": "37576197", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.04849600372793591, "ground_truth": 0}, {"key": "37576197", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.059646942398612256, "ground_truth": 0}, {"key": "37576197", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002563098436908, "ground_truth": 0}, {"key": "37576197", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252321375634612, "ground_truth": 0}, {"key": "34454741", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20434190358578214, "ground_truth": 0}, {"key": "34454741", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1338674893320062, "ground_truth": 0}, {"key": "34454741", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845759862170318, "ground_truth": 0}, {"key": "34454741", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405756572262044, "ground_truth": 0}, {"key": "34454741", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436780327301978, "ground_truth": 0}, {"key": "34766970", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2829881276142346, "ground_truth": 0}, {"key": "34766970", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36840570504119347, "ground_truth": 0}, {"key": "34766970", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31405054284596684, "ground_truth": 0}, {"key": "34766970", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38491215337416135, "ground_truth": 0}, {"key": "34766970", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237072060781, "ground_truth": 0}, {"key": "35574186", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "35574186", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23934933156152755, "ground_truth": 0}, {"key": "35574186", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3345894336776384, "ground_truth": 0}, {"key": "35574186", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204880358961334, "ground_truth": 0}, {"key": "35574186", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.626124178994349, "ground_truth": 0}, {"key": "35486470", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893444492183, "ground_truth": 0}, {"key": "35486470", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2365162382890991, "ground_truth": 0}, {"key": "35486470", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1744102744445796, "ground_truth": 0}, {"key": "35486470", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213928015268, "ground_truth": 0}, {"key": "35486470", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596071429868592, "ground_truth": 0}, {"key": "40977702", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08389038932011549, "ground_truth": 0}, {"key": "40977702", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07263670829275598, "ground_truth": 0}, {"key": "40977702", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14511535378268733, "ground_truth": 0}, {"key": "40977702", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06418264194381494, "ground_truth": 0}, {"key": "40977702", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.04603389819029459, "ground_truth": 0}, {"key": "35336618", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4921881308008825, "ground_truth": 0}, {"key": "35336618", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43590151375429864, "ground_truth": 0}, {"key": "35336618", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5234203640250652, "ground_truth": 0}, {"key": "35336618", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014734418788436, "ground_truth": 0}, {"key": "35336618", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591091397389, "ground_truth": 0}, {"key": "33024679", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.320821314195063, "ground_truth": 0}, {"key": "33024679", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3539863064777219, "ground_truth": 0}, {"key": "33024679", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4649015768654377, "ground_truth": 0}, {"key": "33024679", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307859011614, "ground_truth": 0}, {"key": "33024679", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059959433790994, "ground_truth": 0}, {"key": "37451334", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25982561355640466, "ground_truth": 0}, {"key": "37451334", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17328820604467488, "ground_truth": 0}, {"key": "37451334", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32252598059564436, "ground_truth": 0}, {"key": "37451334", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1666753934168933, "ground_truth": 0}, {"key": "37451334", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245270603585, "ground_truth": 0}, {"key": "33354824", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2658804813741809, "ground_truth": 0}, {"key": "33354824", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23934933819103515, "ground_truth": 0}, {"key": "33354824", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20434188306236425, "ground_truth": 0}, {"key": "33354824", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002562397271115, "ground_truth": 0}, {"key": "33354824", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902370742075974, "ground_truth": 0}, {"key": "34688538", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2200071056013304, "ground_truth": 0}, {"key": "34688538", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12765262321131468, "ground_truth": 0}, {"key": "34688538", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1259227701677646, "ground_truth": 0}, {"key": "34688538", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242552601724, "ground_truth": 0}, {"key": "34688538", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434191035994534, "ground_truth": 0}, {"key": "33646276", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20689406029705168, "ground_truth": 0}, {"key": "33646276", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22270014506521615, "ground_truth": 0}, {"key": "33646276", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3208213127155314, "ground_truth": 0}, {"key": "33646276", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1089450468348434, "ground_truth": 0}, {"key": "33646276", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735007230678, "ground_truth": 0}, {"key": "40322608", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47852884272854196, "ground_truth": 0}, {"key": "40322608", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2538610188069613, "ground_truth": 0}, {"key": "40322608", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43014731141607004, "ground_truth": 0}, {"key": "40322608", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.476579666227972, "ground_truth": 0}, {"key": "40322608", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786205697046, "ground_truth": 0}, {"key": "39565762", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36658972736159684, "ground_truth": 0}, {"key": "39565762", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3504213853751003, "ground_truth": 0}, {"key": "39565762", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24798743574503337, "ground_truth": 0}, {"key": "39565762", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015223200207, "ground_truth": 0}, {"key": "39565762", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938388343948, "ground_truth": 0}, {"key": "30534259", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19682620522004918, "ground_truth": 0}, {"key": "30534259", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5175709061761063, "ground_truth": 0}, {"key": "30534259", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.443600417716334, "ground_truth": 0}, {"key": "30534259", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.381219560584771, "ground_truth": 0}, {"key": "30534259", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814400770282, "ground_truth": 0}, {"key": "39644242", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165106971038, "ground_truth": 0}, {"key": "39644242", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4960938396557985, "ground_truth": 0}, {"key": "39644242", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5467381544985204, "ground_truth": 0}, {"key": "39644242", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296922027091444, "ground_truth": 0}, {"key": "39644242", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.513668454741092, "ground_truth": 0}, {"key": "19853740", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.029535338006079864, "ground_truth": 0}, {"key": "19853740", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07055959798110684, "ground_truth": 0}, {"key": "19853740", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11838510155295537, "ground_truth": 0}, {"key": "19853740", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.048496001492953696, "ground_truth": 0}, {"key": "19853740", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.084492759162562, "ground_truth": 0}, {"key": "33023078", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39981163910096407, "ground_truth": 0}, {"key": "33023078", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4824290953883609, "ground_truth": 0}, {"key": "33023078", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46101673850051955, "ground_truth": 0}, {"key": "33023078", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966677611683, "ground_truth": 0}, {"key": "33023078", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804787000901779, "ground_truth": 0}, {"key": "38329806", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08819004604647483, "ground_truth": 0}, {"key": "38329806", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10970577261277703, "ground_truth": 0}, {"key": "38329806", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30239108454460023, "ground_truth": 0}, {"key": "38329806", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06278920686597467, "ground_truth": 0}, {"key": "38329806", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09009299211309085, "ground_truth": 0}, {"key": "38761942", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2227001394327513, "ground_truth": 0}, {"key": "38761942", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.556399569496632, "ground_truth": 0}, {"key": "38761942", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42441200060764467, "ground_truth": 0}, {"key": "38761942", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413837903539, "ground_truth": 0}, {"key": "38761942", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995668027845, "ground_truth": 0}, {"key": "33773576", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15817435611588024, "ground_truth": 0}, {"key": "33773576", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5370414025039835, "ground_truth": 0}, {"key": "33773576", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3849121633720608, "ground_truth": 0}, {"key": "33773576", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.272024537974308, "ground_truth": 0}, {"key": "33773576", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.609524183950863, "ground_truth": 0}, {"key": "37642631", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2613309377624447, "ground_truth": 0}, {"key": "37642631", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1871326822642871, "ground_truth": 0}, {"key": "37642631", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135069029078155, "ground_truth": 0}, {"key": "37642631", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804719293818105, "ground_truth": 0}, {"key": "37642631", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416825196723, "ground_truth": 0}, {"key": "36609836", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39981166173564797, "ground_truth": 0}, {"key": "36609836", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4436004341421763, "ground_truth": 0}, {"key": "36609836", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5717665836524396, "ground_truth": 0}, {"key": "36609836", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786310397624, "ground_truth": 0}, {"key": "36609836", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491213669181223, "ground_truth": 0}, {"key": "41035610", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14804719869767372, "ground_truth": 0}, {"key": "41035610", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3208212885528992, "ground_truth": 0}, {"key": "41035610", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22678362508776617, "ground_truth": 0}, {"key": "41035610", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743849746932, "ground_truth": 0}, {"key": "41035610", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2974699733644825, "ground_truth": 0}, {"key": "37592684", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13660838604717823, "ground_truth": 0}, {"key": "37592684", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6261241766920791, "ground_truth": 0}, {"key": "37592684", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47073663877693084, "ground_truth": 0}, {"key": "37592684", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324551185786, "ground_truth": 0}, {"key": "37592684", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748716473004, "ground_truth": 0}, {"key": "38951040", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559409334177658, "ground_truth": 0}, {"key": "38951040", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14608724121987976, "ground_truth": 0}, {"key": "38951040", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14223188987402852, "ground_truth": 0}, {"key": "38951040", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256438951437, "ground_truth": 0}, {"key": "38951040", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667540345391627, "ground_truth": 0}, {"key": "40774469", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24077459737662724, "ground_truth": 0}, {"key": "40774469", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.055823140505002616, "ground_truth": 0}, {"key": "40774469", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1581743582839694, "ground_truth": 0}, {"key": "40774469", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17328820738526282, "ground_truth": 0}, {"key": "40774469", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238404510672835, "ground_truth": 0}, {"key": "40876288", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262549328358, "ground_truth": 0}, {"key": "40876288", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4205995771666, "ground_truth": 0}, {"key": "40876288", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20181322393936957, "ground_truth": 0}, {"key": "40876288", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047115029434468, "ground_truth": 0}, {"key": "40876288", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344543900946357, "ground_truth": 0}, {"key": "40340131", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34158250002839413, "ground_truth": 0}, {"key": "40340131", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5506073545856425, "ground_truth": 0}, {"key": "40340131", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48438011084852267, "ground_truth": 0}, {"key": "40340131", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586449656312, "ground_truth": 0}, {"key": "40340131", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398145582008946, "ground_truth": 0}, {"key": "30121591", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5389832200602946, "ground_truth": 0}, {"key": "30121591", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5253688288172841, "ground_truth": 0}, {"key": "30121591", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310512537187, "ground_truth": 0}, {"key": "30121591", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981162568604695, "ground_truth": 0}, {"key": "30121591", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893717012976369, "ground_truth": 0}, {"key": "35623366", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.538983250503951, "ground_truth": 0}, {"key": "35623366", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11436852347649619, "ground_truth": 0}, {"key": "35623366", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.544801379021935, "ground_truth": 0}, {"key": "35623366", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398149516418, "ground_truth": 0}, {"key": "35623366", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953008987439, "ground_truth": 0}, {"key": "41014093", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891340098066, "ground_truth": 0}, {"key": "41014093", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39047585830689596, "ground_truth": 0}, {"key": "41014093", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7648915990088244, "ground_truth": 0}, {"key": "41014093", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791939684698, "ground_truth": 0}, {"key": "41014093", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786217339713, "ground_truth": 0}, {"key": "11387984", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3867634449208691, "ground_truth": 0}, {"key": "11387984", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15921741371070325, "ground_truth": 0}, {"key": "11387984", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3575675483287331, "ground_truth": 0}, {"key": "11387984", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384403237834, "ground_truth": 0}, {"key": "11387984", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682620684437122, "ground_truth": 0}, {"key": "39508312", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3775406829905013, "ground_truth": 0}, {"key": "39508312", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3557748785786396, "ground_truth": 0}, {"key": "39508312", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3398276437148272, "ground_truth": 0}, {"key": "39508312", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270013903388963, "ground_truth": 0}, {"key": "39508312", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2479874576092124, "ground_truth": 0}, {"key": "35815369", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26284184566269686, "ground_truth": 0}, {"key": "35815369", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42632159353723936, "ground_truth": 0}, {"key": "35815369", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6334102569049347, "ground_truth": 0}, {"key": "35815369", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310505508809, "ground_truth": 0}, {"key": "35815369", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894514900873, "ground_truth": 0}, {"key": "35802823", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5717666211043346, "ground_truth": 0}, {"key": "35802823", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4687906338223396, "ground_truth": 0}, {"key": "35802823", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7371581856388265, "ground_truth": 0}, {"key": "35802823", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942940615037, "ground_truth": 0}, {"key": "35802823", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125961015849, "ground_truth": 0}, {"key": "38499968", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5292634120753726, "ground_truth": 0}, {"key": "38499968", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19072402339290245, "ground_truth": 0}, {"key": "38499968", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310516899936, "ground_truth": 0}, {"key": "38499968", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586057281469, "ground_truth": 0}, {"key": "38499968", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254058327707, "ground_truth": 0}, {"key": "36926726", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3575675266511217, "ground_truth": 0}, {"key": "36926726", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5888891126235264, "ground_truth": 0}, {"key": "36926726", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4668455938766628, "ground_truth": 0}, {"key": "36926726", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688286183169, "ground_truth": 0}, {"key": "36926726", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758364241807, "ground_truth": 0}, {"key": "40903712", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49414086792490913, "ground_truth": 0}, {"key": "40903712", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5350984485632665, "ground_truth": 0}, {"key": "40903712", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629691853138551, "ground_truth": 0}, {"key": "40903712", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.372048761792407, "ground_truth": 0}, {"key": "40903712", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570645374098594, "ground_truth": 0}, {"key": "19614862", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6187804399432392, "ground_truth": 0}, {"key": "19614862", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.346873073976661, "ground_truth": 0}, {"key": "19614862", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.558326998754999, "ground_truth": 0}, {"key": "19614862", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.556399581685994, "ground_truth": 0}, {"key": "19614862", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111085506841194, "ground_truth": 0}, {"key": "38861704", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32939172183097054, "ground_truth": 0}, {"key": "38861704", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.289371701362927, "ground_truth": 0}, {"key": "38861704", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238773746905, "ground_truth": 0}, {"key": "38861704", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069441192783026, "ground_truth": 0}, {"key": "38861704", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149776034034, "ground_truth": 0}, {"key": "34349607", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238002804522367, "ground_truth": 0}, {"key": "34349607", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2991051847063943, "ground_truth": 0}, {"key": "34349607", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21076629271269054, "ground_truth": 0}, {"key": "34349607", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2407745928370637, "ground_truth": 0}, {"key": "34349607", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06465349039568939, "ground_truth": 0}, {"key": "20773800", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1311732275176822, "ground_truth": 0}, {"key": "20773800", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24364245416433114, "ground_truth": 0}, {"key": "20773800", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07978201729992675, "ground_truth": 0}, {"key": "20773800", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670579461378166, "ground_truth": 0}, {"key": "20773800", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06656918744556188, "ground_truth": 0}, {"key": "35545608", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7106282858717875, "ground_truth": 0}, {"key": "35545608", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30902370263774565, "ground_truth": 0}, {"key": "35545608", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18594720563035155, "ground_truth": 0}, {"key": "35545608", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022538240313757, "ground_truth": 0}, {"key": "35545608", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441027562746256, "ground_truth": 0}, {"key": "37258984", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19806417377457225, "ground_truth": 0}, {"key": "37258984", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38676342541406644, "ground_truth": 0}, {"key": "37258984", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132023527519954, "ground_truth": 0}, {"key": "37258984", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641549239381, "ground_truth": 0}, {"key": "37258984", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238403694474376, "ground_truth": 0}, {"key": "37274562", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1883239666804033, "ground_truth": 0}, {"key": "37274562", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3904758295877609, "ground_truth": 0}, {"key": "37274562", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5117166185556332, "ground_truth": 0}, {"key": "37274562", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213951818985, "ground_truth": 0}, {"key": "37274562", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633965837136, "ground_truth": 0}, {"key": "40828068", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6187804217643962, "ground_truth": 0}, {"key": "40828068", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7074047065990259, "ground_truth": 0}, {"key": "40828068", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6876300152671497, "ground_truth": 0}, {"key": "40828068", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593535896792, "ground_truth": 0}, {"key": "40828068", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.596433164613617, "ground_truth": 0}, {"key": "37807180", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1710611850131858, "ground_truth": 0}, {"key": "37807180", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4073334332433017, "ground_truth": 0}, {"key": "37807180", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1143685238598757, "ground_truth": 0}, {"key": "37807180", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193280078651043, "ground_truth": 0}, {"key": "37807180", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2643583350421349, "ground_truth": 0}, {"key": "40748607", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6976089078932483, "ground_truth": 0}, {"key": "40748607", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7416740066264019, "ground_truth": 0}, {"key": "40748607", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.649578637421897, "ground_truth": 0}, {"key": "40748607", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.581303079571842, "ground_truth": 0}, {"key": "40748607", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046847443457, "ground_truth": 0}, {"key": "40123819", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5907791925641112, "ground_truth": 0}, {"key": "40123819", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38861803174598264, "ground_truth": 0}, {"key": "40123819", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7620701041658589, "ground_truth": 0}, {"key": "40123819", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922077589733125, "ground_truth": 0}, {"key": "40123819", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310354656035, "ground_truth": 0}, {"key": "38453867", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20946968131639887, "ground_truth": 0}, {"key": "38453867", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4148988528716658, "ground_truth": 0}, {"key": "38453867", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16776334893405612, "ground_truth": 0}, {"key": "38453867", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937171674348283, "ground_truth": 0}, {"key": "38453867", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29098084049357037, "ground_truth": 0}, {"key": "38944856", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27982849513033076, "ground_truth": 0}, {"key": "38944856", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28140561355050736, "ground_truth": 0}, {"key": "38944856", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39047579587067016, "ground_truth": 0}, {"key": "38944856", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881215619408, "ground_truth": 0}, {"key": "38944856", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633104238945166, "ground_truth": 0}, {"key": "35778898", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5234203356844076, "ground_truth": 0}, {"key": "35778898", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4397473260847217, "ground_truth": 0}, {"key": "35778898", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3960681555360282, "ground_truth": 0}, {"key": "35778898", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878541182908, "ground_truth": 0}, {"key": "35778898", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175082363053, "ground_truth": 0}, {"key": "32530125", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21076629280843462, "ground_truth": 0}, {"key": "32530125", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4016877994126606, "ground_truth": 0}, {"key": "32530125", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22270013942762246, "ground_truth": 0}, {"key": "32530125", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562298296524, "ground_truth": 0}, {"key": "32530125", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405056113640895, "ground_truth": 0}, {"key": "35010363", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2094696843630069, "ground_truth": 0}, {"key": "35010363", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22678363537816448, "ground_truth": 0}, {"key": "35010363", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2379298931712804, "ground_truth": 0}, {"key": "35010363", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026604016198995, "ground_truth": 0}, {"key": "35010363", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973077006466, "ground_truth": 0}, {"key": "27514800", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5389832107819896, "ground_truth": 0}, {"key": "27514800", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39420094148953244, "ground_truth": 0}, {"key": "27514800", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8278281478475651, "ground_truth": 0}, {"key": "27514800", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632682243125, "ground_truth": 0}, {"key": "27514800", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998418381408, "ground_truth": 0}, {"key": "25725840", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735743771098314, "ground_truth": 0}, {"key": "25725840", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25386101284195056, "ground_truth": 0}, {"key": "25725840", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23231015352564122, "ground_truth": 0}, {"key": "25725840", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792989734286624, "ground_truth": 0}, {"key": "25725840", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1835936244605252, "ground_truth": 0}, {"key": "38327225", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5331544072915807, "ground_truth": 0}, {"key": "38327225", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7279754441322718, "ground_truth": 0}, {"key": "38327225", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.284576007608206, "ground_truth": 0}, {"key": "38327225", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1520322509150406, "ground_truth": 0}, {"key": "38327225", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017854286889, "ground_truth": 0}, {"key": "11991724", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4436003897709531, "ground_truth": 0}, {"key": "11991724", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5717666402870512, "ground_truth": 0}, {"key": "11991724", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4668455984454951, "ground_truth": 0}, {"key": "11991724", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711592290373, "ground_truth": 0}, {"key": "11991724", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684558586425606, "ground_truth": 0}, {"key": "32217545", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3311197162830239, "ground_truth": 0}, {"key": "32217545", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3276683265608474, "ground_truth": 0}, {"key": "32217545", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7563575593336691, "ground_truth": 0}, {"key": "32217545", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910750113385, "ground_truth": 0}, {"key": "32217545", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3242353931822959, "ground_truth": 0}, {"key": "12731847", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23091975630249234, "ground_truth": 0}, {"key": "12731847", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26740817966042707, "ground_truth": 0}, {"key": "12731847", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1520322509172062, "ground_truth": 0}, {"key": "12731847", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678517080369947, "ground_truth": 0}, {"key": "12731847", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1500288111807054, "ground_truth": 0}, {"key": "36827234", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21866936593087666, "ground_truth": 0}, {"key": "36827234", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5273164996809262, "ground_truth": 0}, {"key": "36827234", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6791786837672387, "ground_truth": 0}, {"key": "36827234", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017905372585, "ground_truth": 0}, {"key": "36827234", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360040872205775, "ground_truth": 0}, {"key": "29111539", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1666754048942046, "ground_truth": 0}, {"key": "29111539", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2436424436835759, "ground_truth": 0}, {"key": "29111539", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3090237068013872, "ground_truth": 0}, {"key": "29111539", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2583260001599965, "ground_truth": 0}, {"key": "29111539", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754069784639793, "ground_truth": 0}, {"key": "37763052", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2240554530914153, "ground_truth": 0}, {"key": "37763052", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28140560615119425, "ground_truth": 0}, {"key": "37763052", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5698526327821312, "ground_truth": 0}, {"key": "37763052", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07316471657648031, "ground_truth": 0}, {"key": "37763052", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894448303143, "ground_truth": 0}, {"key": "30682335", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.04707417782874377, "ground_truth": 0}, {"key": "30682335", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1366084026774152, "ground_truth": 0}, {"key": "30682335", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19436781130843336, "ground_truth": 0}, {"key": "30682335", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06512754532352938, "ground_truth": 0}, {"key": "30682335", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.051845467267383406, "ground_truth": 0}, {"key": "12261276", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2958398756412289, "ground_truth": 0}, {"key": "12261276", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28937169717395395, "ground_truth": 0}, {"key": "12261276", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34510528670213053, "ground_truth": 0}, {"key": "12261276", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2494472362945146, "ground_truth": 0}, {"key": "12261276", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118829602967, "ground_truth": 0}, {"key": "36912979", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29910519499873894, "ground_truth": 0}, {"key": "36912979", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6113819420658567, "ground_truth": 0}, {"key": "36912979", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24220563210999732, "ground_truth": 0}, {"key": "36912979", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667540370424747, "ground_truth": 0}, {"key": "36912979", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808663046671, "ground_truth": 0}, {"key": "30205259", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5019531095276663, "ground_truth": 0}, {"key": "30205259", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953691968573, "ground_truth": 0}, {"key": "30205259", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6261241447617062, "ground_truth": 0}, {"key": "30205259", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643803378111, "ground_truth": 0}, {"key": "30205259", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843801103692743, "ground_truth": 0}, {"key": "39458032", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.874934621350573, "ground_truth": 0}, {"key": "39458032", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8539127518832322, "ground_truth": 0}, {"key": "39458032", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6406358491120421, "ground_truth": 0}, {"key": "39458032", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494868220231, "ground_truth": 0}, {"key": "39458032", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544125111462, "ground_truth": 0}, {"key": "35116452", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238002220309708, "ground_truth": 0}, {"key": "35116452", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07751766020811279, "ground_truth": 0}, {"key": "35116452", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10374862827193293, "ground_truth": 0}, {"key": "35116452", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.057071398684099654, "ground_truth": 0}, {"key": "35116452", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12506538549623672, "ground_truth": 0}, {"key": "40107476", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3157359676623502, "ground_truth": 0}, {"key": "40107476", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6039318385970366, "ground_truth": 0}, {"key": "40107476", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629692074628323, "ground_truth": 0}, {"key": "40107476", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074559416071406, "ground_truth": 0}, {"key": "40107476", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905237710246, "ground_truth": 0}, {"key": "39501049", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45326183175862106, "ground_truth": 0}, {"key": "39501049", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5660185607396235, "ground_truth": 0}, {"key": "39501049", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7122321896329069, "ground_truth": 0}, {"key": "39501049", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666068942765, "ground_truth": 0}, {"key": "39501049", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786408180614, "ground_truth": 0}, {"key": "39642178", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35398630435296274, "ground_truth": 0}, {"key": "39642178", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2254166209759564, "ground_truth": 0}, {"key": "39642178", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0907354815409993, "ground_truth": 0}, {"key": "39642178", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168574727912192, "ground_truth": 0}, {"key": "39642178", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1789559048747593, "ground_truth": 0}, {"key": "38024796", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3090237071973969, "ground_truth": 0}, {"key": "38024796", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46295862717695213, "ground_truth": 0}, {"key": "38024796", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825680559924265, "ground_truth": 0}, {"key": "38024796", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237084970342, "ground_truth": 0}, {"key": "38024796", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2240554566687644, "ground_truth": 0}, {"key": "36652079", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22953520402276997, "ground_truth": 0}, {"key": "36652079", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3923368314840342, "ground_truth": 0}, {"key": "36652079", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38676345583731225, "ground_truth": 0}, {"key": "36652079", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1666754073334341, "ground_truth": 0}, {"key": "36652079", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245603627953, "ground_truth": 0}, {"key": "32193402", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5214711561863863, "ground_truth": 0}, {"key": "32193402", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4649015811427657, "ground_truth": 0}, {"key": "32193402", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4416729931079021, "ground_truth": 0}, {"key": "32193402", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455889523578, "ground_truth": 0}, {"key": "32193402", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526567269234, "ground_truth": 0}, {"key": "32589706", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2146913995441671, "ground_truth": 0}, {"key": "32589706", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3504213630128942, "ground_truth": 0}, {"key": "32589706", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2553436609886908, "ground_truth": 0}, {"key": "32589706", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2365162481582308, "ground_truth": 0}, {"key": "32589706", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678363851208258, "ground_truth": 0}, {"key": "38590589", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38861802115008925, "ground_truth": 0}, {"key": "38590589", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6943026802148864, "ground_truth": 0}, {"key": "38590589", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20434190730231652, "ground_truth": 0}, {"key": "38590589", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203294849691, "ground_truth": 0}, {"key": "38590589", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035767816888, "ground_truth": 0}, {"key": "37045414", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.930962069282353, "ground_truth": 0}, {"key": "37045414", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9207896833732845, "ground_truth": 0}, {"key": "37045414", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9339146289428301, "ground_truth": 0}, {"key": "37045414", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.950041474543562, "ground_truth": 0}, {"key": "37045414", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510406745087, "ground_truth": 0}, {"key": "33310095", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5832033585358393, "ground_truth": 0}, {"key": "33310095", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25832596756687043, "ground_truth": 0}, {"key": "33310095", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2200070947776335, "ground_truth": 0}, {"key": "33310095", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284088002990444, "ground_truth": 0}, {"key": "33310095", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783849419006, "ground_truth": 0}, {"key": "37934604", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24364245707072424, "ground_truth": 0}, {"key": "37934604", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5234203505253842, "ground_truth": 0}, {"key": "37934604", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5292633830961265, "ground_truth": 0}, {"key": "37934604", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687309953704154, "ground_truth": 0}, {"key": "37934604", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29098085461530826, "ground_truth": 0}, {"key": "39012181", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9697854116215687, "ground_truth": 0}, {"key": "39012181", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.954984466150359, "ground_truth": 0}, {"key": "39012181", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9441768608646179, "ground_truth": 0}, {"key": "39012181", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.936749478401965, "ground_truth": 0}, {"key": "39012181", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9788748079745406, "ground_truth": 0}, {"key": "40221674", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6297746112132001, "ground_truth": 0}, {"key": "40221674", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7577943659093546, "ground_truth": 0}, {"key": "40221674", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8365545666505609, "ground_truth": 0}, {"key": "40221674", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.432063391026198, "ground_truth": 0}, {"key": "40221674", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740080855233, "ground_truth": 0}, {"key": "36884862", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4804786740684649, "ground_truth": 0}, {"key": "36884862", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.529263381294053, "ground_truth": 0}, {"key": "36884862", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5312093799870774, "ground_truth": 0}, {"key": "36884862", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688236484331, "ground_truth": 0}, {"key": "36884862", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988410539001, "ground_truth": 0}, {"key": "39054429", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25091277724427935, "ground_truth": 0}, {"key": "39054429", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46101679297197473, "ground_truth": 0}, {"key": "39054429", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2829881264463877, "ground_truth": 0}, {"key": "39054429", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2309197626640269, "ground_truth": 0}, {"key": "39054429", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197405328237, "ground_truth": 0}, {"key": "36753964", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798284944623085, "ground_truth": 0}, {"key": "36753964", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20055768084759795, "ground_truth": 0}, {"key": "36753964", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2704802258575382, "ground_truth": 0}, {"key": "36753964", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441027822404723, "ground_truth": 0}, {"key": "36753964", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337717286967856, "ground_truth": 0}, {"key": "37612459", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26133091402086217, "ground_truth": 0}, {"key": "37612459", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5117165957497152, "ground_truth": 0}, {"key": "37612459", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2267836198722229, "ground_truth": 0}, {"key": "37612459", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2393493436701046, "ground_truth": 0}, {"key": "37612459", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126320603729093, "ground_truth": 0}, {"key": "36805789", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6150878755449039, "ground_truth": 0}, {"key": "36805789", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5428632781507469, "ground_truth": 0}, {"key": "36805789", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5813030915665279, "ground_truth": 0}, {"key": "36805789", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715071959424, "ground_truth": 0}, {"key": "36805789", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684848395423, "ground_truth": 0}, {"key": "12757394", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33458945219628955, "ground_truth": 0}, {"key": "12757394", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.451326477376215, "ground_truth": 0}, {"key": "12757394", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4035668689350965, "ground_truth": 0}, {"key": "12757394", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541659916800308, "ground_truth": 0}, {"key": "12757394", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076628930012947, "ground_truth": 0}, {"key": "32192542", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6531269089350505, "ground_truth": 0}, {"key": "32192542", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7170118777944309, "ground_truth": 0}, {"key": "32192542", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7662936466398089, "ground_truth": 0}, {"key": "32192542", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136949693461, "ground_truth": 0}, {"key": "32192542", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185825805322, "ground_truth": 0}, {"key": "34856060", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13477591517468868, "ground_truth": 0}, {"key": "34856060", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07423136375640063, "ground_truth": 0}, {"key": "34856060", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08210662460078576, "ground_truth": 0}, {"key": "34856060", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1645164687178429, "ground_truth": 0}, {"key": "34856060", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1613202407719548, "ground_truth": 0}, {"key": "36083416", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13568954109569292, "ground_truth": 0}, {"key": "36083416", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3647775924345207, "ground_truth": 0}, {"key": "36083416", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2365162159564436, "ground_truth": 0}, {"key": "36083416", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1744102731277919, "ground_truth": 0}, {"key": "36083416", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233683207686143, "ground_truth": 0}, {"key": "33839050", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1393963865873357, "ground_truth": 0}, {"key": "33839050", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18952109754219806, "ground_truth": 0}, {"key": "33839050", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16995623884266875, "ground_truth": 0}, {"key": "33839050", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561503740364612, "ground_truth": 0}, {"key": "33839050", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.08570927429610489, "ground_truth": 0}, {"key": "18464690", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1470645283650301, "ground_truth": 0}, {"key": "18464690", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2465333453718455, "ground_truth": 0}, {"key": "18464690", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17441026650738753, "ground_truth": 0}, {"key": "18464690", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08329192178297469, "ground_truth": 0}, {"key": "18464690", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1233656125700684, "ground_truth": 0}, {"key": "39212665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3468730754950625, "ground_truth": 0}, {"key": "39212665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37204878642036154, "ground_truth": 0}, {"key": "39212665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19806417073766802, "ground_truth": 0}, {"key": "39212665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359785833799, "ground_truth": 0}, {"key": "39212665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730113950302, "ground_truth": 0}, {"key": "40094011", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5679366114179148, "ground_truth": 0}, {"key": "40094011", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49804691006338686, "ground_truth": 0}, {"key": "40094011", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7057850312307298, "ground_truth": 0}, {"key": "40094011", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191372353598, "ground_truth": 0}, {"key": "40094011", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689455179774, "ground_truth": 0}, {"key": "36036272", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.622459303986606, "ground_truth": 0}, {"key": "36036272", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5851011401281103, "ground_truth": 0}, {"key": "36036272", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37937838465403667, "ground_truth": 0}, {"key": "36036272", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994422955406578, "ground_truth": 0}, {"key": "36036272", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174807425116, "ground_truth": 0}, {"key": "30681904", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19436783242885722, "ground_truth": 0}, {"key": "30681904", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17781087294054393, "ground_truth": 0}, {"key": "30681904", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20055767955489015, "ground_truth": 0}, {"key": "30681904", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441026758464195, "ground_truth": 0}, {"key": "30681904", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845759971297395, "ground_truth": 0}, {"key": "27834240", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238003185325087, "ground_truth": 0}, {"key": "27834240", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5312093636173189, "ground_truth": 0}, {"key": "27834240", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27048021760957086, "ground_truth": 0}, {"key": "27834240", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1907240204380894, "ground_truth": 0}, {"key": "27834240", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366316361407, "ground_truth": 0}, {"key": "35025075", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559406937122478, "ground_truth": 0}, {"key": "35025075", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35936412921549143, "ground_truth": 0}, {"key": "35025075", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19559407494414383, "ground_truth": 0}, {"key": "35025075", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.355774881324831, "ground_truth": 0}, {"key": "35025075", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1847675156141547, "ground_truth": 0}, {"key": "33316985", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18832398678023696, "ground_truth": 0}, {"key": "33316985", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2379298953476512, "ground_truth": 0}, {"key": "33316985", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23792989318287952, "ground_truth": 0}, {"key": "33316985", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405755967121623, "ground_truth": 0}, {"key": "33316985", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1347759032080516, "ground_truth": 0}, {"key": "17037056", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.04501553186502277, "ground_truth": 0}, {"key": "17037056", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.036769466644048086, "ground_truth": 0}, {"key": "17037056", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0338440329679961, "ground_truth": 0}, {"key": "17037056", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.03308597551572865, "ground_truth": 0}, {"key": "17037056", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.02843603170560301, "ground_truth": 0}, {"key": "34050457", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5156199324592758, "ground_truth": 0}, {"key": "34050457", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6150878720785973, "ground_truth": 0}, {"key": "34050457", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238780185589, "ground_truth": 0}, {"key": "34050457", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922082110635827, "ground_truth": 0}, {"key": "34050457", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869690924441966, "ground_truth": 0}, {"key": "34713745", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735743919500099, "ground_truth": 0}, {"key": "34713745", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2523840349048868, "ground_truth": 0}, {"key": "34713745", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3123700192527005, "ground_truth": 0}, {"key": "34713745", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685455074222, "ground_truth": 0}, {"key": "34713745", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490073348382, "ground_truth": 0}, {"key": "40856210", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047115019894041, "ground_truth": 0}, {"key": "40856210", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28140561364599753, "ground_truth": 0}, {"key": "40856210", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.06656918929275474, "ground_truth": 0}, {"key": "40856210", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678516487722388, "ground_truth": 0}, {"key": "40856210", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09670579313175995, "ground_truth": 0}, {"key": "40848302", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41869692459686, "ground_truth": 0}, {"key": "40848302", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40168782055821095, "ground_truth": 0}, {"key": "40848302", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.769080223749883, "ground_truth": 0}, {"key": "40848302", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098085577602356, "ground_truth": 0}, {"key": "40848302", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185471043546, "ground_truth": 0}, {"key": "40636168", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31573599076551206, "ground_truth": 0}, {"key": "40636168", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28776781972927074, "ground_truth": 0}, {"key": "40636168", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2958398748537749, "ground_truth": 0}, {"key": "40636168", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510838199449344, "ground_truth": 0}, {"key": "40636168", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881217164842, "ground_truth": 0}, {"key": "34423311", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07211219512413256, "ground_truth": 0}, {"key": "34423311", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2030746261547487, "ground_truth": 0}, {"key": "34423311", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2005576868901886, "ground_truth": 0}, {"key": "34423311", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1710611867640167, "ground_truth": 0}, {"key": "34423311", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451646435231598, "ground_truth": 0}, {"key": "34833945", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6566582478352425, "ground_truth": 0}, {"key": "34833945", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6791786808903547, "ground_truth": 0}, {"key": "34833945", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7759445601975762, "ground_truth": 0}, {"key": "34833945", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063776507915, "ground_truth": 0}, {"key": "34833945", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837620411896, "ground_truth": 0}, {"key": "21272328", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07263670433224134, "ground_truth": 0}, {"key": "21272328", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510839400378836, "ground_truth": 0}, {"key": "21272328", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.03435868853930208, "ground_truth": 0}, {"key": "21272328", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06097518318072838, "ground_truth": 0}, {"key": "21272328", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06187599040824929, "ground_truth": 0}, {"key": "38648957", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114319138752, "ground_truth": 0}, {"key": "38648957", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.05921025211420874, "ground_truth": 0}, {"key": "38648957", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16344543858035718, "ground_truth": 0}, {"key": "38648957", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.060529386877071024, "ground_truth": 0}, {"key": "38648957", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.05146276902426518, "ground_truth": 0}, {"key": "24942981", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2436424665832334, "ground_truth": 0}, {"key": "24942981", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3259495344699932, "ground_truth": 0}, {"key": "24942981", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23231015186773804, "ground_truth": 0}, {"key": "24942981", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1955940746223891, "ground_truth": 0}, {"key": "24942981", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667160113939268, "ground_truth": 0}, {"key": "35882366", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26894144954060645, "ground_truth": 0}, {"key": "35882366", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14511536580925125, "ground_truth": 0}, {"key": "35882366", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15921740178662286, "ground_truth": 0}, {"key": "35882366", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10302442400589015, "ground_truth": 0}, {"key": "35882366", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.06325052448040441, "ground_truth": 0}, {"key": "40559523", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3040416773484098, "ground_truth": 0}, {"key": "40559523", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38306415528027754, "ground_truth": 0}, {"key": "40559523", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25091277570578374, "ground_truth": 0}, {"key": "40559523", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364243324176288, "ground_truth": 0}, {"key": "40559523", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523508635948, "ground_truth": 0}, {"key": "24632722", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.137532473997191, "ground_truth": 0}, {"key": "24632722", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2613309181474992, "ground_truth": 0}, {"key": "24632722", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08449275366694514, "ground_truth": 0}, {"key": "24632722", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832600084010643, "ground_truth": 0}, {"key": "24632722", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193278602243258, "ground_truth": 0}, {"key": "36002759", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1571368578973164, "ground_truth": 0}, {"key": "36002759", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925953076742392, "ground_truth": 0}, {"key": "36002759", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3174262835848375, "ground_truth": 0}, {"key": "36002759", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19682621082062696, "ground_truth": 0}, {"key": "36002759", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421497314379114, "ground_truth": 0}, {"key": "29508534", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4765796392309581, "ground_truth": 0}, {"key": "29508534", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4263215686919616, "ground_truth": 0}, {"key": "29508534", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2583260040365507, "ground_truth": 0}, {"key": "29508534", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384179791187, "ground_truth": 0}, {"key": "29508534", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458945187634714, "ground_truth": 0}, {"key": "15631612", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40544872683093913, "ground_truth": 0}, {"key": "15631612", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389832580648103, "ground_truth": 0}, {"key": "15631612", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4167966343836464, "ground_truth": 0}, {"key": "15631612", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793841203505687, "ground_truth": 0}, {"key": "15631612", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.445529554415958, "ground_truth": 0}, {"key": "40731892", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12085323034930988, "ground_truth": 0}, {"key": "40731892", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1634454375434934, "ground_truth": 0}, {"key": "40731892", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2704802078457014, "ground_truth": 0}, {"key": "40731892", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237000124057684, "ground_truth": 0}, {"key": "40731892", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207750051709, "ground_truth": 0}, {"key": "35971910", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6893056172488817, "ground_truth": 0}, {"key": "35971910", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7248702792827436, "ground_truth": 0}, {"key": "35971910", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4804786588873771, "ground_truth": 0}, {"key": "35971910", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601357208869, "ground_truth": 0}, {"key": "35971910", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477756857511484, "ground_truth": 0}, {"key": "34428424", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6297745843531376, "ground_truth": 0}, {"key": "34428424", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6406358747975139, "ground_truth": 0}, {"key": "34428424", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6791787074974316, "ground_truth": 0}, {"key": "34428424", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224446506527, "ground_truth": 0}, {"key": "34428424", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073419874224, "ground_truth": 0}, {"key": "36971005", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7759445557026193, "ground_truth": 0}, {"key": "36971005", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7592254083080092, "ground_truth": 0}, {"key": "36971005", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4282333847811545, "ground_truth": 0}, {"key": "36971005", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723799729076, "ground_truth": 0}, {"key": "36971005", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684650629241, "ground_truth": 0}, {"key": "34649067", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.381219572400372, "ground_truth": 0}, {"key": "34649067", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24508502270547722, "ground_truth": 0}, {"key": "34649067", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206338062147454, "ground_truth": 0}, {"key": "34649067", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2689414385280759, "ground_truth": 0}, {"key": "34649067", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1835936371608012, "ground_truth": 0}, {"key": "37355154", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15610490203696029, "ground_truth": 0}, {"key": "37355154", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5660185612723436, "ground_truth": 0}, {"key": "37355154", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5156199309195671, "ground_truth": 0}, {"key": "37355154", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495155630028, "ground_truth": 0}, {"key": "37355154", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641744538114, "ground_truth": 0}, {"key": "38674697", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19806418082111046, "ground_truth": 0}, {"key": "38674697", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19806417711789334, "ground_truth": 0}, {"key": "38674697", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20946969676132224, "ground_truth": 0}, {"key": "38674697", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1250653843059561, "ground_truth": 0}, {"key": "38674697", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594721215143128, "ground_truth": 0}, {"key": "40525767", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9678992915479594, "ground_truth": 0}, {"key": "40525767", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9202179881016413, "ground_truth": 0}, {"key": "40525767", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9079671318129371, "ground_truth": 0}, {"key": "40525767", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087952306416, "ground_truth": 0}, {"key": "40525767", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869847357993, "ground_truth": 0}, {"key": "27165110", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07369627413880506, "ground_truth": 0}, {"key": "27165110", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.136608398385429, "ground_truth": 0}, {"key": "27165110", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07864237748906323, "ground_truth": 0}, {"key": "27165110", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470342116833, "ground_truth": 0}, {"key": "27165110", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0857092779264242, "ground_truth": 0}, {"key": "35497491", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3486451366083031, "ground_truth": 0}, {"key": "35497491", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16995623921441314, "ground_truth": 0}, {"key": "35497491", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08035746560509618, "ground_truth": 0}, {"key": "35497491", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270014221551016, "ground_truth": 0}, {"key": "35497491", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091975216238497, "ground_truth": 0}, {"key": "40690716", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3415824917661835, "ground_truth": 0}, {"key": "40690716", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953261979474, "ground_truth": 0}, {"key": "40690716", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4707366022596097, "ground_truth": 0}, {"key": "40690716", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891440569625, "ground_truth": 0}, {"key": "40690716", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.579400424281993, "ground_truth": 0}, {"key": "34835193", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8910549556725296, "ground_truth": 0}, {"key": "34835193", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9073122217955212, "ground_truth": 0}, {"key": "34835193", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8933094046296673, "ground_truth": 0}, {"key": "34835193", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359934338276, "ground_truth": 0}, {"key": "34835193", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.882427861344692, "ground_truth": 0}, {"key": "39471712", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31069435094362796, "ground_truth": 0}, {"key": "39471712", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14804718229218222, "ground_truth": 0}, {"key": "39471712", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606816571007375, "ground_truth": 0}, {"key": "39471712", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1422318887997919, "ground_truth": 0}, {"key": "39471712", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2309197542239268, "ground_truth": 0}, {"key": "39115192", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7956580907815411, "ground_truth": 0}, {"key": "39115192", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36477756190437965, "ground_truth": 0}, {"key": "39115192", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5312093777449933, "ground_truth": 0}, {"key": "39115192", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436782290667862, "ground_truth": 0}, {"key": "39115192", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551986137407995, "ground_truth": 0}, {"key": "23520673", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11676400983315424, "ground_truth": 0}, {"key": "23520673", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29098086793361666, "ground_truth": 0}, {"key": "23520673", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5563995519639908, "ground_truth": 0}, {"key": "23520673", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141927062424, "ground_truth": 0}, {"key": "23520673", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878017036047, "ground_truth": 0}, {"key": "35764233", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19314738362681877, "ground_truth": 0}, {"key": "35764233", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21206880871602513, "ground_truth": 0}, {"key": "35764233", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20946969504372573, "ground_truth": 0}, {"key": "35764233", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10521052944918954, "ground_truth": 0}, {"key": "35764233", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072402397120083, "ground_truth": 0}, {"key": "35228910", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09602549532951575, "ground_truth": 0}, {"key": "35228910", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.314050561472081, "ground_truth": 0}, {"key": "35228910", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4921881405160822, "ground_truth": 0}, {"key": "35228910", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1721718411406039, "ground_truth": 0}, {"key": "35228910", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1500288308605504, "ground_truth": 0}, {"key": "36795599", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8322366541541832, "ground_truth": 0}, {"key": "36795599", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6757645989232923, "ground_truth": 0}, {"key": "36795599", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8344068892605987, "ground_truth": 0}, {"key": "36795599", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897281416671, "ground_truth": 0}, {"key": "36795599", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916072623753, "ground_truth": 0}, {"key": "38641949", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6095241461627726, "ground_truth": 0}, {"key": "38641949", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061541016722, "ground_truth": 0}, {"key": "38641949", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782568121219668, "ground_truth": 0}, {"key": "38641949", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761155165765, "ground_truth": 0}, {"key": "38641949", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015238527699, "ground_truth": 0}, {"key": "29968443", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7563575738699001, "ground_truth": 0}, {"key": "29968443", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7534666724564851, "ground_truth": 0}, {"key": "29968443", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7772998651203772, "ground_truth": 0}, {"key": "29968443", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917157480601, "ground_truth": 0}, {"key": "29968443", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324894238015, "ground_truth": 0}, {"key": "21268042", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24508502873715912, "ground_truth": 0}, {"key": "21268042", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3433417285723093, "ground_truth": 0}, {"key": "21268042", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2465333391856698, "ground_truth": 0}, {"key": "21268042", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678112708052, "ground_truth": 0}, {"key": "21268042", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052742186197, "ground_truth": 0}, {"key": "26808572", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49218812187172023, "ground_truth": 0}, {"key": "26808572", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3998116294637935, "ground_truth": 0}, {"key": "26808572", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2958398548285497, "ground_truth": 0}, {"key": "26808572", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668760993842, "ground_truth": 0}, {"key": "26808572", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708859850766, "ground_truth": 0}, {"key": "37829390", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41300357031442336, "ground_truth": 0}, {"key": "37829390", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.503906180386236, "ground_truth": 0}, {"key": "37829390", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6636689675085792, "ground_truth": 0}, {"key": "37829390", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684491248716, "ground_truth": 0}, {"key": "37829390", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238813743741, "ground_truth": 0}, {"key": "35716045", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758475539173, "ground_truth": 0}, {"key": "35716045", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49804687988544377, "ground_truth": 0}, {"key": "35716045", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4765796532260267, "ground_truth": 0}, {"key": "35716045", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.268941447572459, "ground_truth": 0}, {"key": "35716045", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544311628471, "ground_truth": 0}, {"key": "34367070", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6370308070534474, "ground_truth": 0}, {"key": "34367070", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6926419923568767, "ground_truth": 0}, {"key": "34367070", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5448014120577257, "ground_truth": 0}, {"key": "34367070", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253888623371, "ground_truth": 0}, {"key": "34367070", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849598624976, "ground_truth": 0}, {"key": "35239748", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594720432534217, "ground_truth": 0}, {"key": "35239748", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1200256303542899, "ground_truth": 0}, {"key": "35239748", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10743747540218573, "ground_truth": 0}, {"key": "35239748", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739039953712504, "ground_truth": 0}, {"key": "35239748", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217185198346824, "ground_truth": 0}, {"key": "40421370", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.06325052528539311, "ground_truth": 0}, {"key": "40421370", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13206616508569405, "ground_truth": 0}, {"key": "40421370", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24653334405780028, "ground_truth": 0}, {"key": "40421370", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776335645693297, "ground_truth": 0}, {"key": "40421370", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.05300977102953815, "ground_truth": 0}, {"key": "37288396", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5409238663217417, "ground_truth": 0}, {"key": "37288396", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3793783955030663, "ground_truth": 0}, {"key": "37288396", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7520125575862858, "ground_truth": 0}, {"key": "37288396", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414087908160276, "ground_truth": 0}, {"key": "37288396", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360041839997516, "ground_truth": 0}, {"key": "38903688", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5078118634885638, "ground_truth": 0}, {"key": "38903688", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5640984463977746, "ground_truth": 0}, {"key": "38903688", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7008948212914132, "ground_truth": 0}, {"key": "38903688", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519859995640694, "ground_truth": 0}, {"key": "38903688", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242909109003795, "ground_truth": 0}, {"key": "28071228", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6723317324805571, "ground_truth": 0}, {"key": "28071228", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6150878565840052, "ground_truth": 0}, {"key": "28071228", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6187804397690538, "ground_truth": 0}, {"key": "28071228", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113820108834211, "ground_truth": 0}, {"key": "28071228", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643566435003, "ground_truth": 0}, {"key": "36855834", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.146087240265575, "ground_truth": 0}, {"key": "36855834", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.152032251369881, "ground_truth": 0}, {"key": "36855834", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14903528726041976, "ground_truth": 0}, {"key": "36855834", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685643053077, "ground_truth": 0}, {"key": "36855834", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1613202376752896, "ground_truth": 0}, {"key": "40548717", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09268777826624265, "ground_truth": 0}, {"key": "40548717", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10669059331822427, "ground_truth": 0}, {"key": "40548717", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26133091786964696, "ground_truth": 0}, {"key": "40548717", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06325052897825562, "ground_truth": 0}, {"key": "40548717", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.03904829016128494, "ground_truth": 0}, {"key": "37051175", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4493926194957465, "ground_truth": 0}, {"key": "37051175", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33285232331271325, "ground_truth": 0}, {"key": "37051175", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5717666198235393, "ground_truth": 0}, {"key": "37051175", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.289371704057832, "ground_truth": 0}, {"key": "37051175", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414009294139, "ground_truth": 0}, {"key": "38882119", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6279512181711551, "ground_truth": 0}, {"key": "38882119", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3468730764718985, "ground_truth": 0}, {"key": "38882119", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5019531265243292, "ground_truth": 0}, {"key": "38882119", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494632983125, "ground_truth": 0}, {"key": "38882119", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.501953100700813, "ground_truth": 0}, {"key": "19485402", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.292595288769578, "ground_truth": 0}, {"key": "19485402", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36477756762676855, "ground_truth": 0}, {"key": "19485402", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3276683022741136, "ground_truth": 0}, {"key": "19485402", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238003413571409, "ground_truth": 0}, {"key": "19485402", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866938673628245, "ground_truth": 0}, {"key": "36060907", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15921738992563936, "ground_truth": 0}, {"key": "36060907", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510837585587857, "ground_truth": 0}, {"key": "36060907", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20946969867110327, "ground_truth": 0}, {"key": "36060907", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1200256340212753, "ground_truth": 0}, {"key": "36060907", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601154496741148, "ground_truth": 0}, {"key": "24037309", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21469141502417902, "ground_truth": 0}, {"key": "24037309", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26133093519655637, "ground_truth": 0}, {"key": "24037309", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2583259730977614, "ground_truth": 0}, {"key": "24037309", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073659818585445, "ground_truth": 0}, {"key": "24037309", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591014129163, "ground_truth": 0}, {"key": "35605805", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33458944341148683, "ground_truth": 0}, {"key": "35605805", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4282334160942392, "ground_truth": 0}, {"key": "35605805", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2436424392443969, "ground_truth": 0}, {"key": "35605805", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180264231488, "ground_truth": 0}, {"key": "35605805", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973281615187, "ground_truth": 0}, {"key": "17706248", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13117322154158828, "ground_truth": 0}, {"key": "17706248", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5370413787569628, "ground_truth": 0}, {"key": "17706248", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22405545568008606, "ground_truth": 0}, {"key": "17706248", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713672709731124, "ground_truth": 0}, {"key": "17706248", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2393493355330508, "ground_truth": 0}, {"key": "36883559", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31742626703167887, "ground_truth": 0}, {"key": "36883559", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30735799815931114, "ground_truth": 0}, {"key": "36883559", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22541661680877045, "ground_truth": 0}, {"key": "36883559", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953520454981993, "ground_truth": 0}, {"key": "36883559", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802238096745, "ground_truth": 0}, {"key": "32799471", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32252600419648575, "ground_truth": 0}, {"key": "32799471", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2613309222859701, "ground_truth": 0}, {"key": "32799471", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1699562325993277, "ground_truth": 0}, {"key": "32799471", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180293841768, "ground_truth": 0}, {"key": "32799471", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845759845336161, "ground_truth": 0}, {"key": "34797243", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10521053349374888, "ground_truth": 0}, {"key": "34797243", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13117322310046148, "ground_truth": 0}, {"key": "34797243", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.136608401544777, "ground_truth": 0}, {"key": "34797243", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.034880888744748456, "ground_truth": 0}, {"key": "34797243", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.04115288700880763, "ground_truth": 0}, {"key": "32154876", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24798744875352172, "ground_truth": 0}, {"key": "32154876", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510839875070574, "ground_truth": 0}, {"key": "32154876", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2227001382393025, "ground_truth": 0}, {"key": "32154876", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026604532361602, "ground_truth": 0}, {"key": "32154876", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561505280894707, "ground_truth": 0}, {"key": "37962274", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3056973156501665, "ground_truth": 0}, {"key": "37962274", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26588046764156187, "ground_truth": 0}, {"key": "37962274", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14608725041112605, "ground_truth": 0}, {"key": "37962274", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047114685756054, "ground_truth": 0}, {"key": "37962274", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208212728779999, "ground_truth": 0}, {"key": "35574030", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5869964190975233, "ground_truth": 0}, {"key": "35574030", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3575674941537362, "ground_truth": 0}, {"key": "35574030", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6619228891078002, "ground_truth": 0}, {"key": "35574030", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.424411995503181, "ground_truth": 0}, {"key": "35574030", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615951966672, "ground_truth": 0}, {"key": "39105949", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44360042481959605, "ground_truth": 0}, {"key": "39105949", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4668455753385706, "ground_truth": 0}, {"key": "39105949", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4687905948826378, "ground_truth": 0}, {"key": "39105949", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059957870399095, "ground_truth": 0}, {"key": "39105949", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702254184475414, "ground_truth": 0}, {"key": "41064322", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7279754362952111, "ground_truth": 0}, {"key": "41064322", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.767689866445949, "ground_truth": 0}, {"key": "41064322", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7431680138991961, "ground_truth": 0}, {"key": "41064322", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306191415953, "ground_truth": 0}, {"key": "41064322", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585698818617, "ground_truth": 0}, {"key": "28105101", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3830641861096072, "ground_truth": 0}, {"key": "28105101", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42059958961341154, "ground_truth": 0}, {"key": "28105101", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21733750907517357, "ground_truth": 0}, {"key": "28105101", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204879315214634, "ground_truth": 0}, {"key": "28105101", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.451326483917178, "ground_truth": 0}, {"key": "36036068", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.42250463018804474, "ground_truth": 0}, {"key": "36036068", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5136684490274119, "ground_truth": 0}, {"key": "36036068", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798285133468847, "ground_truth": 0}, {"key": "36036068", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220176217978344, "ground_truth": 0}, {"key": "36036068", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416688485923, "ground_truth": 0}, {"key": "37991460", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2782568076142212, "ground_truth": 0}, {"key": "37991460", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953858410989, "ground_truth": 0}, {"key": "37991460", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.222700147988955, "ground_truth": 0}, {"key": "37991460", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1403362518182791, "ground_truth": 0}, {"key": "37991460", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852885006187706, "ground_truth": 0}, {"key": "38437830", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15817435705379693, "ground_truth": 0}, {"key": "38437830", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541661689121942, "ground_truth": 0}, {"key": "38437830", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3960681552881715, "ground_truth": 0}, {"key": "38437830", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633104468502184, "ground_truth": 0}, {"key": "38437830", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730231991354, "ground_truth": 0}, {"key": "36507138", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17441026942705706, "ground_truth": 0}, {"key": "36507138", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26133092568105537, "ground_truth": 0}, {"key": "36507138", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310309987858, "ground_truth": 0}, {"key": "36507138", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3157359520558103, "ground_truth": 0}, {"key": "36507138", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477754787230904, "ground_truth": 0}, {"key": "37824866", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074559221812075, "ground_truth": 0}, {"key": "37824866", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44939262780677247, "ground_truth": 0}, {"key": "37824866", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42441201119996835, "ground_truth": 0}, {"key": "37824866", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708753156185, "ground_truth": 0}, {"key": "37824866", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.352201781129662, "ground_truth": 0}, {"key": "25088134", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074557995189666, "ground_truth": 0}, {"key": "25088134", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3276682754348708, "ground_truth": 0}, {"key": "25088134", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2674081891296318, "ground_truth": 0}, {"key": "25088134", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508502443661614, "ground_truth": 0}, {"key": "25088134", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15507847557893958, "ground_truth": 0}, {"key": "40172531", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5563995784634962, "ground_truth": 0}, {"key": "40172531", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45713670124995215, "ground_truth": 0}, {"key": "40172531", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688144390206, "ground_truth": 0}, {"key": "40172531", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953520432724184, "ground_truth": 0}, {"key": "40172531", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683199698550324, "ground_truth": 0}, {"key": "37035874", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.289371706651489, "ground_truth": 0}, {"key": "37035874", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38491216788784083, "ground_truth": 0}, {"key": "37035874", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4225046299983552, "ground_truth": 0}, {"key": "37035874", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244120001015744, "ground_truth": 0}, {"key": "37035874", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616926196581877, "ground_truth": 0}, {"key": "36404465", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8044059154344156, "ground_truth": 0}, {"key": "36404465", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8116760092094539, "ground_truth": 0}, {"key": "36404465", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7826624827601747, "ground_truth": 0}, {"key": "36404465", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059113787211, "ground_truth": 0}, {"key": "36404465", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281480339857, "ground_truth": 0}, {"key": "39602052", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28298812647794797, "ground_truth": 0}, {"key": "39602052", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5234203447397218, "ground_truth": 0}, {"key": "39602052", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5039061503001183, "ground_truth": 0}, {"key": "39602052", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331531992957, "ground_truth": 0}, {"key": "39602052", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073660220890123, "ground_truth": 0}, {"key": "33792789", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13028542597734616, "ground_truth": 0}, {"key": "33792789", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06853749058907015, "ground_truth": 0}, {"key": "33792789", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22953520336020852, "ground_truth": 0}, {"key": "33792789", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168574851929538, "ground_truth": 0}, {"key": "33792789", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510838411618254, "ground_truth": 0}, {"key": "32776626", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13386749120155184, "ground_truth": 0}, {"key": "32776626", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37754069478947033, "ground_truth": 0}, {"key": "32776626", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20561504219815738, "ground_truth": 0}, {"key": "32776626", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653333778778058, "ground_truth": 0}, {"key": "32776626", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407745937111424, "ground_truth": 0}, {"key": "37195090", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32939172907864234, "ground_truth": 0}, {"key": "37195090", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38306417061790937, "ground_truth": 0}, {"key": "37195090", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47852882734855534, "ground_truth": 0}, {"key": "37195090", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064708797499, "ground_truth": 0}, {"key": "37195090", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306415812566885, "ground_truth": 0}, {"key": "33981824", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2407745961813231, "ground_truth": 0}, {"key": "33981824", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.235108383232864, "ground_truth": 0}, {"key": "33981824", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1052105401476263, "ground_truth": 0}, {"key": "33981824", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451646013734195, "ground_truth": 0}, {"key": "33981824", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.05921025454578735, "ground_truth": 0}, {"key": "39569142", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1490352994309755, "ground_truth": 0}, {"key": "39569142", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25534366116318336, "ground_truth": 0}, {"key": "39569142", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.183593632759904, "ground_truth": 0}, {"key": "39569142", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279539914912208, "ground_truth": 0}, {"key": "39569142", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594721218361515, "ground_truth": 0}, {"key": "40268210", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17781085413738976, "ground_truth": 0}, {"key": "40268210", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1460872499025162, "ground_truth": 0}, {"key": "40268210", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35398628559713263, "ground_truth": 0}, {"key": "40268210", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25091277996188144, "ground_truth": 0}, {"key": "40268210", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436657179508, "ground_truth": 0}, {"key": "34925159", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2704802226781844, "ground_truth": 0}, {"key": "34925159", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17667158786564716, "ground_truth": 0}, {"key": "34925159", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3311197356824418, "ground_truth": 0}, {"key": "34925159", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897095814369, "ground_truth": 0}, {"key": "34925159", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035888581578, "ground_truth": 0}, {"key": "36181903", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3191213680369076, "ground_truth": 0}, {"key": "36181903", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41679663206625345, "ground_truth": 0}, {"key": "36181903", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35577489854642363, "ground_truth": 0}, {"key": "36181903", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24220562565658652, "ground_truth": 0}, {"key": "36181903", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042138312832055, "ground_truth": 0}, {"key": "38620559", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3830641687441353, "ground_truth": 0}, {"key": "38620559", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5253688240330296, "ground_truth": 0}, {"key": "38620559", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.459076118523539, "ground_truth": 0}, {"key": "38620559", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213813245974, "ground_truth": 0}, {"key": "38620559", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879060983181514, "ground_truth": 0}, {"key": "32719657", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0764076792370154, "ground_truth": 0}, {"key": "32719657", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41111084913113216, "ground_truth": 0}, {"key": "32719657", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940272642616524, "ground_truth": 0}, {"key": "32719657", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903529565995927, "ground_truth": 0}, {"key": "32719657", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.055823141589026445, "ground_truth": 0}, {"key": "37530914", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12168575347142604, "ground_truth": 0}, {"key": "37530914", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398107041118, "ground_truth": 0}, {"key": "37530914", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25091277208519697, "ground_truth": 0}, {"key": "37530914", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398628728869574, "ground_truth": 0}, {"key": "37530914", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337718632456715, "ground_truth": 0}, {"key": "33306933", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45713671574658893, "ground_truth": 0}, {"key": "33306933", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5563995848265194, "ground_truth": 0}, {"key": "33306933", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6774740313035816, "ground_truth": 0}, {"key": "33306933", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907615886811354, "ground_truth": 0}, {"key": "33306933", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180362316605, "ground_truth": 0}, {"key": "33837212", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09138210141228317, "ground_truth": 0}, {"key": "33837212", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.09877258836948488, "ground_truth": 0}, {"key": "33837212", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1931473737061487, "ground_truth": 0}, {"key": "33837212", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06418264367896427, "ground_truth": 0}, {"key": "33837212", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743747519158968, "ground_truth": 0}, {"key": "40945179", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5409238588193825, "ground_truth": 0}, {"key": "40945179", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5851011328419302, "ground_truth": 0}, {"key": "40945179", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5907792082387032, "ground_truth": 0}, {"key": "40945179", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269221821787, "ground_truth": 0}, {"key": "40945179", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365401710284, "ground_truth": 0}, {"key": "34152358", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735744054213877, "ground_truth": 0}, {"key": "34152358", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21469141494672872, "ground_truth": 0}, {"key": "34152358", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3345894600870735, "ground_truth": 0}, {"key": "34152358", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359363644988594, "ground_truth": 0}, {"key": "34152358", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922078610009516, "ground_truth": 0}, {"key": "34136541", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6057990405139866, "ground_truth": 0}, {"key": "34136541", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46101675228417976, "ground_truth": 0}, {"key": "34136541", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5774953871780132, "ground_truth": 0}, {"key": "34136541", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512285161564, "ground_truth": 0}, {"key": "34136541", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052878817227, "ground_truth": 0}, {"key": "37469603", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4282334059678475, "ground_truth": 0}, {"key": "37469603", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.52731653042988, "ground_truth": 0}, {"key": "37469603", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6224593311242097, "ground_truth": 0}, {"key": "37469603", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051950993002, "ground_truth": 0}, {"key": "37469603", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982762455631627, "ground_truth": 0}, {"key": "37353611", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6757646061135573, "ground_truth": 0}, {"key": "37353611", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5679366009829591, "ground_truth": 0}, {"key": "37353611", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4804786984431575, "ground_truth": 0}, {"key": "37353611", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488801140095, "ground_truth": 0}, {"key": "37353611", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4513265145416824, "ground_truth": 0}, {"key": "37211649", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168781419163235, "ground_truth": 0}, {"key": "37211649", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.62245932850266, "ground_truth": 0}, {"key": "37211649", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.299105201282538, "ground_truth": 0}, {"key": "37211649", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925953004708565, "ground_truth": 0}, {"key": "37211649", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684558578245033, "ground_truth": 0}, {"key": "37320976", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1968262090522091, "ground_truth": 0}, {"key": "37320976", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19930799611574523, "ground_truth": 0}, {"key": "37320976", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15002882312343843, "ground_truth": 0}, {"key": "37320976", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1384617857422588, "ground_truth": 0}, {"key": "37320976", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573600381372074, "ground_truth": 0}, {"key": "34492412", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7994423194812936, "ground_truth": 0}, {"key": "34492412", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47073661765651664, "ground_truth": 0}, {"key": "34492412", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8140528093874363, "ground_truth": 0}, {"key": "34492412", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616925440675006, "ground_truth": 0}, {"key": "34492412", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964173398416, "ground_truth": 0}, {"key": "36655016", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4130035741206273, "ground_truth": 0}, {"key": "36655016", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6442251210557357, "ground_truth": 0}, {"key": "36655016", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058591248091121, "ground_truth": 0}, {"key": "36655016", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288327601762, "ground_truth": 0}, {"key": "36655016", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458941755953253, "ground_truth": 0}, {"key": "35220773", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19806418732085346, "ground_truth": 0}, {"key": "35220773", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26435835529680635, "ground_truth": 0}, {"key": "35220773", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21601154436110948, "ground_truth": 0}, {"key": "35220773", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683130266854, "ground_truth": 0}, {"key": "35220773", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641721656792, "ground_truth": 0}, {"key": "31569808", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2200071102303434, "ground_truth": 0}, {"key": "31569808", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12252320952286268, "ground_truth": 0}, {"key": "31569808", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17328820518079724, "ground_truth": 0}, {"key": "31569808", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.125922774559257, "ground_truth": 0}, {"key": "31569808", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.127652620099016, "ground_truth": 0}, {"key": "37696256", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1688569529990098, "ground_truth": 0}, {"key": "37696256", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3157359721461582, "ground_truth": 0}, {"key": "37696256", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1993080094367878, "ground_truth": 0}, {"key": "37696256", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132024487052576, "ground_truth": 0}, {"key": "37696256", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575286302302, "ground_truth": 0}, {"key": "36874328", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32082131791910606, "ground_truth": 0}, {"key": "36874328", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30735801489588266, "ground_truth": 0}, {"key": "36874328", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832596702078636, "ground_truth": 0}, {"key": "36874328", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937168832953597, "ground_truth": 0}, {"key": "36874328", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512972471711145, "ground_truth": 0}, {"key": "24532377", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.350421388222688, "ground_truth": 0}, {"key": "24532377", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.616935805945652, "ground_truth": 0}, {"key": "24532377", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3593641341503153, "ground_truth": 0}, {"key": "24532377", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526689411046, "ground_truth": 0}, {"key": "24532377", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165179155425, "ground_truth": 0}, {"key": "39560618", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3522017900148173, "ground_truth": 0}, {"key": "39560618", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3106944085223796, "ground_truth": 0}, {"key": "39560618", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1812632045076387, "ground_truth": 0}, {"key": "39560618", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19072401888206214, "ground_truth": 0}, {"key": "39560618", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1276526134489055, "ground_truth": 0}, {"key": "34922693", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15405755709258256, "ground_truth": 0}, {"key": "34922693", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22270014535660476, "ground_truth": 0}, {"key": "34922693", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11676401739770506, "ground_truth": 0}, {"key": "34922693", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0670562872504082, "ground_truth": 0}, {"key": "34922693", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0894546063679493, "ground_truth": 0}, {"key": "33629577", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22541660778327216, "ground_truth": 0}, {"key": "33629577", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14903530727924524, "ground_truth": 0}, {"key": "33629577", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3090237036246847, "ground_truth": 0}, {"key": "33629577", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946969686910166, "ground_truth": 0}, {"key": "33629577", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781088305723355, "ground_truth": 0}, {"key": "32284359", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3276682904190223, "ground_truth": 0}, {"key": "32284359", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3398276311704265, "ground_truth": 0}, {"key": "32284359", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30404169091426975, "ground_truth": 0}, {"key": "32284359", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398631450090057, "ground_truth": 0}, {"key": "32284359", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477757609431716, "ground_truth": 0}, {"key": "28082962", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3830641939296749, "ground_truth": 0}, {"key": "28082962", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.535098435201781, "ground_truth": 0}, {"key": "28082962", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3225260047820947, "ground_truth": 0}, {"key": "28082962", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224450462116, "ground_truth": 0}, {"key": "28082962", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766830069254943, "ground_truth": 0}, {"key": "24796803", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8116760243570511, "ground_truth": 0}, {"key": "24796803", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8910549598261235, "ground_truth": 0}, {"key": "24796803", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8469578462151609, "ground_truth": 0}, {"key": "24796803", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.789233679026927, "ground_truth": 0}, {"key": "24796803", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714971700844, "ground_truth": 0}, {"key": "35466150", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.603931802954789, "ground_truth": 0}, {"key": "35466150", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531348011275, "ground_truth": 0}, {"key": "35466150", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6150878693646397, "ground_truth": 0}, {"key": "35466150", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.672331696122449, "ground_truth": 0}, {"key": "35466150", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241904136411, "ground_truth": 0}, {"key": "35754289", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7431680242840157, "ground_truth": 0}, {"key": "35754289", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6020615657072763, "ground_truth": 0}, {"key": "35754289", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7371581603267826, "ground_truth": 0}, {"key": "35754289", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094716622182, "ground_truth": 0}, {"key": "35754289", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.757794356070688, "ground_truth": 0}, {"key": "36678662", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6113819932595358, "ground_truth": 0}, {"key": "36678662", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.684264014659854, "ground_truth": 0}, {"key": "36678662", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5717665996238047, "ground_truth": 0}, {"key": "36678662", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.484380081065018, "ground_truth": 0}, {"key": "36678662", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358390311564, "ground_truth": 0}, {"key": "35399671", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39233682363744526, "ground_truth": 0}, {"key": "35399671", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24077458512862426, "ground_truth": 0}, {"key": "35399671", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49609380446872847, "ground_truth": 0}, {"key": "35399671", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657963591687863, "ground_truth": 0}, {"key": "35399671", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34334174164372894, "ground_truth": 0}, {"key": "36888180", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27982850150414185, "ground_truth": 0}, {"key": "36888180", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30239106278884886, "ground_truth": 0}, {"key": "36888180", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31573597392274383, "ground_truth": 0}, {"key": "36888180", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2030746344720696, "ground_truth": 0}, {"key": "36888180", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2043419147348686, "ground_truth": 0}, {"key": "28061069", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5832033654771956, "ground_truth": 0}, {"key": "28061069", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3415824937846973, "ground_truth": 0}, {"key": "28061069", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4726834462336405, "ground_truth": 0}, {"key": "28061069", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684723992003, "ground_truth": 0}, {"key": "28061069", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242912479404915, "ground_truth": 0}, {"key": "22259982", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4339814815982049, "ground_truth": 0}, {"key": "22259982", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5945512707337612, "ground_truth": 0}, {"key": "22259982", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6095241646559633, "ground_truth": 0}, {"key": "22259982", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942804666709, "ground_truth": 0}, {"key": "22259982", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111087471183455, "ground_truth": 0}, {"key": "34026805", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4073334250830663, "ground_truth": 0}, {"key": "34026805", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48242910070474543, "ground_truth": 0}, {"key": "34026805", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34510527201332464, "ground_truth": 0}, {"key": "34026805", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974733581283865, "ground_truth": 0}, {"key": "34026805", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333818599972, "ground_truth": 0}, {"key": "36713809", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5926665944521434, "ground_truth": 0}, {"key": "36713809", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42059959927644286, "ground_truth": 0}, {"key": "36713809", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8056321739990102, "ground_truth": 0}, {"key": "36713809", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881312449054, "ground_truth": 0}, {"key": "36713809", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365486744127, "ground_truth": 0}, {"key": "39726411", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1666754047415968, "ground_truth": 0}, {"key": "39726411", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19682621514247878, "ground_truth": 0}, {"key": "39726411", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1550784701702908, "ground_truth": 0}, {"key": "39726411", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666398004338, "ground_truth": 0}, {"key": "39726411", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307463527775632, "ground_truth": 0}, {"key": "37069841", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36116472711806547, "ground_truth": 0}, {"key": "37069841", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3140505483802485, "ground_truth": 0}, {"key": "37069841", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3647775536213483, "ground_truth": 0}, {"key": "37069841", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634043229097, "ground_truth": 0}, {"key": "37069841", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939263633855037, "ground_truth": 0}, {"key": "38894693", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31405054866030546, "ground_truth": 0}, {"key": "38894693", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3157359783211975, "ground_truth": 0}, {"key": "38894693", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39793842319170764, "ground_truth": 0}, {"key": "38894693", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825677079836997, "ground_truth": 0}, {"key": "38894693", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405543915091572, "ground_truth": 0}, {"key": "33946032", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8244619300143418, "ground_truth": 0}, {"key": "33946032", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7325918393785109, "ground_truth": 0}, {"key": "33946032", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8407825844599646, "ground_truth": 0}, {"key": "33946032", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786339487959, "ground_truth": 0}, {"key": "33946032", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743602948, "ground_truth": 0}, {"key": "39035311", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46490156991306997, "ground_truth": 0}, {"key": "39035311", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3174262725348414, "ground_truth": 0}, {"key": "39035311", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5851011557015384, "ground_truth": 0}, {"key": "39035311", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132650612051656, "ground_truth": 0}, {"key": "39035311", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633923942454, "ground_truth": 0}, {"key": "27680038", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21601153342333212, "ground_truth": 0}, {"key": "27680038", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2465333473772727, "ground_truth": 0}, {"key": "27680038", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2553436404990981, "ground_truth": 0}, {"key": "27680038", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824997483216, "ground_truth": 0}, {"key": "27680038", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328820806843734, "ground_truth": 0}, {"key": "36901907", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3557748928839707, "ground_truth": 0}, {"key": "36901907", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3647775373376417, "ground_truth": 0}, {"key": "36901907", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.332852308694677, "ground_truth": 0}, {"key": "36901907", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350038306156, "ground_truth": 0}, {"key": "36901907", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238404320012986, "ground_truth": 0}, {"key": "21530542", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19314738507240056, "ground_truth": 0}, {"key": "21530542", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1919327957409895, "ground_truth": 0}, {"key": "21530542", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17217185985105687, "ground_truth": 0}, {"key": "21530542", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687309491270707, "ground_truth": 0}, {"key": "21530542", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455599933255, "ground_truth": 0}, {"key": "38192532", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.464901570473666, "ground_truth": 0}, {"key": "38192532", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4941409078412111, "ground_truth": 0}, {"key": "38192532", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2538610055627122, "ground_truth": 0}, {"key": "38192532", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881204526752, "ground_truth": 0}, {"key": "38192532", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295861971352525, "ground_truth": 0}, {"key": "34102400", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20689406085990045, "ground_truth": 0}, {"key": "34102400", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08035746715308387, "ground_truth": 0}, {"key": "34102400", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20689405723882917, "ground_truth": 0}, {"key": "34102400", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223188735485087, "ground_truth": 0}, {"key": "34102400", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222710756736, "ground_truth": 0}, {"key": "36133399", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2877677842867541, "ground_truth": 0}, {"key": "36133399", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31237000779911445, "ground_truth": 0}, {"key": "36133399", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33633105652155537, "ground_truth": 0}, {"key": "36133399", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011710947245, "ground_truth": 0}, {"key": "36133399", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416706444426, "ground_truth": 0}, {"key": "34314544", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2909808691470432, "ground_truth": 0}, {"key": "34314544", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953706273519, "ground_truth": 0}, {"key": "34314544", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34334175953250723, "ground_truth": 0}, {"key": "34314544", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743755605487, "ground_truth": 0}, {"key": "34314544", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3225259804883912, "ground_truth": 0}, {"key": "33460074", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7233094962651354, "ground_truth": 0}, {"key": "33460074", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48242907202678564, "ground_truth": 0}, {"key": "33460074", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3140505540786111, "ground_truth": 0}, {"key": "33460074", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490160294182215, "ground_truth": 0}, {"key": "33460074", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082806264609, "ground_truth": 0}, {"key": "36191495", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1451153628906992, "ground_truth": 0}, {"key": "36191495", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16667540044892487, "ground_truth": 0}, {"key": "36191495", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09009299402750684, "ground_truth": 0}, {"key": "36191495", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2450850105271025, "ground_truth": 0}, {"key": "36191495", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168574628715748, "ground_truth": 0}, {"key": "39532668", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6352224409134487, "ground_truth": 0}, {"key": "39532668", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6654105406872313, "ground_truth": 0}, {"key": "39532668", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6566582514425799, "ground_truth": 0}, {"key": "39532668", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238957027387, "ground_truth": 0}, {"key": "39532668", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.503906180103525, "ground_truth": 0}, {"key": "20328247", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19193278730628718, "ground_truth": 0}, {"key": "20328247", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23091976708022902, "ground_truth": 0}, {"key": "20328247", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2643583637475845, "ground_truth": 0}, {"key": "20328247", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035752671301, "ground_truth": 0}, {"key": "20328247", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802361086807, "ground_truth": 0}, {"key": "39112675", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22000708538775388, "ground_truth": 0}, {"key": "39112675", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.178955896281693, "ground_truth": 0}, {"key": "39112675", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37022536680437557, "ground_truth": 0}, {"key": "39112675", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256458946149, "ground_truth": 0}, {"key": "39112675", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541660841832173, "ground_truth": 0}, {"key": "31620300", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.338077121210662, "ground_truth": 0}, {"key": "31620300", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19314737581331246, "ground_truth": 0}, {"key": "31620300", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21337719598312996, "ground_truth": 0}, {"key": "31620300", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748830247832, "ground_truth": 0}, {"key": "31620300", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953521610913105, "ground_truth": 0}, {"key": "37518509", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27048022655083975, "ground_truth": 0}, {"key": "37518509", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1302854234852157, "ground_truth": 0}, {"key": "37518509", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3575675460301791, "ground_truth": 0}, {"key": "37518509", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878470994084, "ground_truth": 0}, {"key": "37518509", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416691322539, "ground_truth": 0}, {"key": "35454095", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27357439871716704, "ground_truth": 0}, {"key": "35454095", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990616436149, "ground_truth": 0}, {"key": "35454095", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26588048143296705, "ground_truth": 0}, {"key": "35454095", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895588254054945, "ground_truth": 0}, {"key": "35454095", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678516790401306, "ground_truth": 0}, {"key": "38542788", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5851011513238807, "ground_truth": 0}, {"key": "38542788", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5331544065723627, "ground_truth": 0}, {"key": "38542788", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7892337067901959, "ground_truth": 0}, {"key": "38542788", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898447517028, "ground_truth": 0}, {"key": "38542788", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774739944658353, "ground_truth": 0}, {"key": "23944937", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34864513626534266, "ground_truth": 0}, {"key": "23944937", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3849121563970813, "ground_truth": 0}, {"key": "23944937", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25982564343964987, "ground_truth": 0}, {"key": "23944937", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073334116911905, "ground_truth": 0}, {"key": "23944937", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510837191730877, "ground_truth": 0}, {"key": "31753944", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12852513590354936, "ground_truth": 0}, {"key": "31753944", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541662753201214, "ground_truth": 0}, {"key": "31753944", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13477592363747443, "ground_truth": 0}, {"key": "31753944", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776335334357526, "ground_truth": 0}, {"key": "31753944", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10230470968351354, "ground_truth": 0}, {"key": "35527214", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08819004127566829, "ground_truth": 0}, {"key": "35527214", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11516222709888166, "ground_truth": 0}, {"key": "35527214", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13660839882622342, "ground_truth": 0}, {"key": "35527214", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958181822808, "ground_truth": 0}, {"key": "35527214", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469143339932775, "ground_truth": 0}, {"key": "40400404", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7981867659562764, "ground_truth": 0}, {"key": "40400404", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8577680943789405, "ground_truth": 0}, {"key": "40400404", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6959583348026556, "ground_truth": 0}, {"key": "40400404", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059589996753, "ground_truth": 0}, {"key": "40400404", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880286490906, "ground_truth": 0}, {"key": "21713119", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38861802460307565, "ground_truth": 0}, {"key": "21713119", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25091278428829505, "ground_truth": 0}, {"key": "21713119", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21601153295014477, "ground_truth": 0}, {"key": "21713119", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048020588025273, "ground_truth": 0}, {"key": "21713119", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193279166015234, "ground_truth": 0}, {"key": "28730678", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3775406656151904, "ground_truth": 0}, {"key": "28730678", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4941409252335865, "ground_truth": 0}, {"key": "28730678", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20307462491290698, "ground_truth": 0}, {"key": "28730678", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059960647422373, "ground_truth": 0}, {"key": "28730678", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015194760906, "ground_truth": 0}, {"key": "36823733", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.392336827703583, "ground_truth": 0}, {"key": "36823733", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4205995995972285, "ground_truth": 0}, {"key": "36823733", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5467381455677032, "ground_truth": 0}, {"key": "36823733", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220176969537936, "ground_truth": 0}, {"key": "36823733", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491215321799976, "ground_truth": 0}, {"key": "35988862", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12592277278556788, "ground_truth": 0}, {"key": "35988862", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13660839879125652, "ground_truth": 0}, {"key": "35988862", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17895590215265175, "ground_truth": 0}, {"key": "35988862", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806417710709356, "ground_truth": 0}, {"key": "35988862", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.052230850702420575, "ground_truth": 0}, {"key": "40499665", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5660185199301525, "ground_truth": 0}, {"key": "40499665", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43974737331046454, "ground_truth": 0}, {"key": "40499665", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4843800907481638, "ground_truth": 0}, {"key": "40499665", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629585942275309, "ground_truth": 0}, {"key": "40499665", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819849969707, "ground_truth": 0}, {"key": "32829820", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3593641497313724, "ground_truth": 0}, {"key": "32829820", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.09947021317111557, "ground_truth": 0}, {"key": "32829820", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33982761490834096, "ground_truth": 0}, {"key": "32829820", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4378235148001202, "ground_truth": 0}, {"key": "32829820", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641512470708, "ground_truth": 0}, {"key": "20583553", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1520322503800053, "ground_truth": 0}, {"key": "20583553", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10447732024209712, "ground_truth": 0}, {"key": "20583553", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07585817695930049, "ground_truth": 0}, {"key": "20583553", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713269362904955, "ground_truth": 0}, {"key": "20583553", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1302854234710725, "ground_truth": 0}, {"key": "30501550", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7648916130871779, "ground_truth": 0}, {"key": "30501550", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6601723825949114, "ground_truth": 0}, {"key": "30501550", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7839884643076551, "ground_truth": 0}, {"key": "30501550", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321925258089, "ground_truth": 0}, {"key": "30501550", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476678600855, "ground_truth": 0}, {"key": "38755897", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11838509713495497, "ground_truth": 0}, {"key": "38755897", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23091975379694965, "ground_truth": 0}, {"key": "38755897", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5698526474381655, "ground_truth": 0}, {"key": "38755897", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473271398324, "ground_truth": 0}, {"key": "38755897", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894365323474, "ground_truth": 0}, {"key": "35507201", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5563995742578579, "ground_truth": 0}, {"key": "35507201", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5136684834043165, "ground_truth": 0}, {"key": "35507201", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3886180400137778, "ground_truth": 0}, {"key": "35507201", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185516035311, "ground_truth": 0}, {"key": "35507201", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995896186321, "ground_truth": 0}, {"key": "36453511", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5175709036400638, "ground_truth": 0}, {"key": "36453511", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6039318308651404, "ground_truth": 0}, {"key": "36453511", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39793839047334023, "ground_truth": 0}, {"key": "36453511", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026800329422, "ground_truth": 0}, {"key": "36453511", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982107797172, "ground_truth": 0}, {"key": "38066835", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30239109554662796, "ground_truth": 0}, {"key": "38066835", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.09268778229775633, "ground_truth": 0}, {"key": "38066835", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25091278937067024, "ground_truth": 0}, {"key": "38066835", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1422318873632455, "ground_truth": 0}, {"key": "38066835", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1732882022976149, "ground_truth": 0}, {"key": "39697181", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.362969225498622, "ground_truth": 0}, {"key": "39697181", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3960681649057988, "ground_truth": 0}, {"key": "39697181", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19559407899771836, "ground_truth": 0}, {"key": "39697181", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2281565132682698, "ground_truth": 0}, {"key": "39697181", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834709941497, "ground_truth": 0}, {"key": "21820893", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2658804809688068, "ground_truth": 0}, {"key": "21820893", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43590153741126436, "ground_truth": 0}, {"key": "21820893", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18832397427889305, "ground_truth": 0}, {"key": "21820893", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541661192349002, "ground_truth": 0}, {"key": "21820893", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416729976830815, "ground_truth": 0}, {"key": "40519933", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6352224367653369, "ground_truth": 0}, {"key": "40519933", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5717666109426476, "ground_truth": 0}, {"key": "40519933", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4532618154444635, "ground_truth": 0}, {"key": "40519933", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583986283206803, "ground_truth": 0}, {"key": "40519933", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269483741987, "ground_truth": 0}, {"key": "30446033", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667158230133037, "ground_truth": 0}, {"key": "30446033", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.490235608590574, "ground_truth": 0}, {"key": "30446033", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798284717146604, "ground_truth": 0}, {"key": "30446033", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417401258557, "ground_truth": 0}, {"key": "30446033", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520277409709, "ground_truth": 0}, {"key": "40216291", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6242935460189983, "ground_truth": 0}, {"key": "40216291", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.653126915627066, "ground_truth": 0}, {"key": "40216291", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736783985820431, "ground_truth": 0}, {"key": "40216291", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137088368322, "ground_truth": 0}, {"key": "40216291", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185944035613855, "ground_truth": 0}, {"key": "33479118", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3611647122697972, "ground_truth": 0}, {"key": "33479118", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38121956937807083, "ground_truth": 0}, {"key": "33479118", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629692223287444, "ground_truth": 0}, {"key": "33479118", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573597864601494, "ground_truth": 0}, {"key": "33479118", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451462870525, "ground_truth": 0}, {"key": "22297373", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09467769854995671, "ground_truth": 0}, {"key": "22297373", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12336562095346966, "ground_truth": 0}, {"key": "22297373", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12336562134751745, "ground_truth": 0}, {"key": "22297373", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217185535720272, "ground_truth": 0}, {"key": "22297373", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469142159429214, "ground_truth": 0}, {"key": "36463668", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19930801181495436, "ground_truth": 0}, {"key": "36463668", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22815649498350776, "ground_truth": 0}, {"key": "36463668", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3486451475521357, "ground_truth": 0}, {"key": "36463668", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740817354021285, "ground_truth": 0}, {"key": "36463668", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1276526194688063, "ground_truth": 0}, {"key": "35264615", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.205615034722159, "ground_truth": 0}, {"key": "35264615", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643808173898, "ground_truth": 0}, {"key": "35264615", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2909808947109359, "ground_truth": 0}, {"key": "35264615", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253882973046, "ground_truth": 0}, {"key": "35264615", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213841900009, "ground_truth": 0}, {"key": "39898482", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3684056975503727, "ground_truth": 0}, {"key": "39898482", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38861805179706893, "ground_truth": 0}, {"key": "39898482", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7416740130190118, "ground_truth": 0}, {"key": "39898482", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185466686095, "ground_truth": 0}, {"key": "39898482", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004129182852, "ground_truth": 0}, {"key": "37228721", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3056973422112963, "ground_truth": 0}, {"key": "37228721", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4726834613052716, "ground_truth": 0}, {"key": "37228721", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19314738547941399, "ground_truth": 0}, {"key": "37228721", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864512301017586, "ground_truth": 0}, {"key": "37228721", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568319850824213, "ground_truth": 0}, {"key": "24535799", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8832359916322418, "ground_truth": 0}, {"key": "24535799", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.929951037379524, "ground_truth": 0}, {"key": "24535799", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6959583288358349, "ground_truth": 0}, {"key": "24535799", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.814052794639736, "ground_truth": 0}, {"key": "24535799", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256177095735, "ground_truth": 0}, {"key": "35177759", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5428632665018095, "ground_truth": 0}, {"key": "35177759", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3923368282344023, "ground_truth": 0}, {"key": "35177759", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6513548680773692, "ground_truth": 0}, {"key": "35177759", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544259883155, "ground_truth": 0}, {"key": "35177759", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132651926662426, "ground_truth": 0}, {"key": "34364829", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46490156877770616, "ground_truth": 0}, {"key": "34364829", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019530937043049, "ground_truth": 0}, {"key": "34364829", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3040416593946398, "ground_truth": 0}, {"key": "34364829", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288329497088, "ground_truth": 0}, {"key": "34364829", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508502984930772, "ground_truth": 0}, {"key": "38090732", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834690923713, "ground_truth": 0}, {"key": "38090732", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441198412474784, "ground_truth": 0}, {"key": "38090732", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798284804719443, "ground_truth": 0}, {"key": "38090732", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586281814989, "ground_truth": 0}, {"key": "38090732", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117166031811449, "ground_truth": 0}, {"key": "30651479", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262814548809, "ground_truth": 0}, {"key": "30651479", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7577943775286391, "ground_truth": 0}, {"key": "30651479", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18713267821846022, "ground_truth": 0}, {"key": "30651479", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23370634743838017, "ground_truth": 0}, {"key": "30651479", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952107956545708, "ground_truth": 0}, {"key": "39380921", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2658804715948356, "ground_truth": 0}, {"key": "39380921", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17328821616641504, "ground_truth": 0}, {"key": "39380921", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1778108722129859, "ground_truth": 0}, {"key": "39380921", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817893198053522, "ground_truth": 0}, {"key": "39380921", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069444619968, "ground_truth": 0}, {"key": "39037490", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13117322701012196, "ground_truth": 0}, {"key": "39037490", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12002563588572268, "ground_truth": 0}, {"key": "39037490", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.06233104011405238, "ground_truth": 0}, {"key": "39037490", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055768728980164, "ground_truth": 0}, {"key": "39037490", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081609623293, "ground_truth": 0}, {"key": "35917499", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5851011698229008, "ground_truth": 0}, {"key": "35917499", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6671476719637661, "ground_truth": 0}, {"key": "35917499", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5525397179546965, "ground_truth": 0}, {"key": "35917499", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593464848065, "ground_truth": 0}, {"key": "35917499", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582754559804, "ground_truth": 0}, {"key": "34908073", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5214711544963667, "ground_truth": 0}, {"key": "34908073", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4493926177301759, "ground_truth": 0}, {"key": "34908073", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27048023957737566, "ground_truth": 0}, {"key": "34908073", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761370117413, "ground_truth": 0}, {"key": "34908073", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563996243322228, "ground_truth": 0}, {"key": "36344759", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6334102564109819, "ground_truth": 0}, {"key": "36344759", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5448013685139588, "ground_truth": 0}, {"key": "36344759", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5156199293266596, "ground_truth": 0}, {"key": "36344759", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308092870537, "ground_truth": 0}, {"key": "36344759", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185441111969, "ground_truth": 0}, {"key": "39984637", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19072403607069358, "ground_truth": 0}, {"key": "39984637", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18359362009135177, "ground_truth": 0}, {"key": "39984637", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09268778076500246, "ground_truth": 0}, {"key": "39984637", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275405929678, "ground_truth": 0}, {"key": "39984637", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168574904995791, "ground_truth": 0}, {"key": "17917326", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4590761341815334, "ground_truth": 0}, {"key": "17917326", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20689405333746927, "ground_truth": 0}, {"key": "17917326", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27048023333176513, "ground_truth": 0}, {"key": "17917326", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314738254015812, "ground_truth": 0}, {"key": "17917326", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126321208946528, "ground_truth": 0}, {"key": "32193638", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32082130406303794, "ground_truth": 0}, {"key": "32193638", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40922079298936226, "ground_truth": 0}, {"key": "32193638", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3123700040797198, "ground_truth": 0}, {"key": "32193638", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2030746360101, "ground_truth": 0}, {"key": "32193638", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042140670152006, "ground_truth": 0}, {"key": "34564692", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6388352814254266, "ground_truth": 0}, {"key": "34564692", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7041601439520349, "ground_truth": 0}, {"key": "34564692", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6584175065611968, "ground_truth": 0}, {"key": "34564692", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416739958214058, "ground_truth": 0}, {"key": "34564692", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121860438816, "ground_truth": 0}, {"key": "39329284", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9353465086092095, "ground_truth": 0}, {"key": "39329284", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9324533042966603, "ground_truth": 0}, {"key": "39329284", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6531269119233531, "ground_truth": 0}, {"key": "39329284", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142446192534, "ground_truth": 0}, {"key": "39329284", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068813255671, "ground_truth": 0}, {"key": "37438541", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34687308202953937, "ground_truth": 0}, {"key": "37438541", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3242353998188813, "ground_truth": 0}, {"key": "37438541", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29098088661192095, "ground_truth": 0}, {"key": "37438541", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667539898326109, "ground_truth": 0}, {"key": "37438541", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405544902557673, "ground_truth": 0}, {"key": "34652757", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.538983224086955, "ground_truth": 0}, {"key": "34652757", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4882834000063815, "ground_truth": 0}, {"key": "34652757", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4746311930790942, "ground_truth": 0}, {"key": "34652757", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828341146105037, "ground_truth": 0}, {"key": "34652757", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882833965098323, "ground_truth": 0}, {"key": "31361004", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2337063541635763, "ground_truth": 0}, {"key": "31361004", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43398144913530506, "ground_truth": 0}, {"key": "31361004", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4843800813828776, "ground_truth": 0}, {"key": "31361004", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953514509846, "ground_truth": 0}, {"key": "31361004", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121627214706, "ground_truth": 0}, {"key": "26150727", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27048023037352104, "ground_truth": 0}, {"key": "26150727", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441199019586917, "ground_truth": 0}, {"key": "26150727", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2281565022165959, "ground_truth": 0}, {"key": "26150727", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269733863898775, "ground_truth": 0}, {"key": "26150727", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458944280148967, "ground_truth": 0}, {"key": "36997402", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5755880073422351, "ground_truth": 0}, {"key": "36997402", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7371581735883322, "ground_truth": 0}, {"key": "36997402", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523158737875, "ground_truth": 0}, {"key": "36997402", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358466959847, "ground_truth": 0}, {"key": "36997402", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.569852650138729, "ground_truth": 0}, {"key": "37430643", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1919327947834115, "ground_truth": 0}, {"key": "37430643", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2523840373240439, "ground_truth": 0}, {"key": "37430643", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.372048788148122, "ground_truth": 0}, {"key": "37430643", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938432311598, "ground_truth": 0}, {"key": "37430643", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017600098375, "ground_truth": 0}, {"key": "36964631", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.319121381210337, "ground_truth": 0}, {"key": "36964631", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42059958444642326, "ground_truth": 0}, {"key": "36964631", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34158249950145175, "ground_truth": 0}, {"key": "36964631", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204876948479787, "ground_truth": 0}, {"key": "36964631", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370635589599636, "ground_truth": 0}, {"key": "35502013", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12085323765712652, "ground_truth": 0}, {"key": "35502013", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07585818245946345, "ground_truth": 0}, {"key": "35502013", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1250653813386913, "ground_truth": 0}, {"key": "35502013", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06512754818542153, "ground_truth": 0}, {"key": "35502013", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13477591399407177, "ground_truth": 0}, {"key": "33987664", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15002881602983628, "ground_truth": 0}, {"key": "33987664", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917238697888, "ground_truth": 0}, {"key": "33987664", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2213506961763603, "ground_truth": 0}, {"key": "33987664", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406968812921, "ground_truth": 0}, {"key": "33987664", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13939638604303248, "ground_truth": 0}, {"key": "35203721", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24220563694196273, "ground_truth": 0}, {"key": "35203721", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23091975663582676, "ground_truth": 0}, {"key": "35203721", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1721718460839445, "ground_truth": 0}, {"key": "35203721", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988456961285, "ground_truth": 0}, {"key": "35203721", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328819225182304, "ground_truth": 0}, {"key": "39028348", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35936411825574216, "ground_truth": 0}, {"key": "39028348", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3174262366202732, "ground_truth": 0}, {"key": "39028348", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42441201206544743, "ground_truth": 0}, {"key": "39028348", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406761594364, "ground_truth": 0}, {"key": "39028348", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073333855498242, "ground_truth": 0}, {"key": "37459383", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262826872694, "ground_truth": 0}, {"key": "37459383", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35398629268794335, "ground_truth": 0}, {"key": "37459383", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5774953598429825, "ground_truth": 0}, {"key": "37459383", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681595872549, "ground_truth": 0}, {"key": "37459383", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.362969212613893, "ground_truth": 0}, {"key": "34020070", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5506073837973717, "ground_truth": 0}, {"key": "34020070", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033506690725, "ground_truth": 0}, {"key": "34020070", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5331543966644415, "ground_truth": 0}, {"key": "34020070", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220178898840826, "ground_truth": 0}, {"key": "34020070", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420094734114247, "ground_truth": 0}, {"key": "35176615", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44167300886803, "ground_truth": 0}, {"key": "35176615", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5350984336926367, "ground_truth": 0}, {"key": "35176615", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16344542660251155, "ground_truth": 0}, {"key": "35176615", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469141384610366, "ground_truth": 0}, {"key": "35176615", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16995623039892338, "ground_truth": 0}, {"key": "33296389", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48242910805383127, "ground_truth": 0}, {"key": "33296389", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45907612446870694, "ground_truth": 0}, {"key": "33296389", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6242935354337507, "ground_truth": 0}, {"key": "33296389", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206341514149366, "ground_truth": 0}, {"key": "33296389", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679665981741776, "ground_truth": 0}, {"key": "35399504", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.682573740014437, "ground_truth": 0}, {"key": "35399504", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6601723643384557, "ground_truth": 0}, {"key": "35399504", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8606036194342047, "ground_truth": 0}, {"key": "35399504", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786125184533, "ground_truth": 0}, {"key": "35399504", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324724520927, "ground_truth": 0}, {"key": "34807886", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4416729764970948, "ground_truth": 0}, {"key": "34807886", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37022539433791174, "ground_truth": 0}, {"key": "34807886", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30074557298551574, "ground_truth": 0}, {"key": "34807886", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633874625331, "ground_truth": 0}, {"key": "34807886", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26133094030197446, "ground_truth": 0}, {"key": "37629813", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19930801018013425, "ground_truth": 0}, {"key": "37629813", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2845759926460193, "ground_truth": 0}, {"key": "37629813", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22270013746149103, "ground_truth": 0}, {"key": "37629813", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06705629160613445, "ground_truth": 0}, {"key": "37629813", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14804719055808319, "ground_truth": 0}, {"key": "28084389", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22270015819430272, "ground_truth": 0}, {"key": "28084389", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5234203517539018, "ground_truth": 0}, {"key": "28084389", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4629586265382548, "ground_truth": 0}, {"key": "28084389", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723749196676, "ground_truth": 0}, {"key": "28084389", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358360518933, "ground_truth": 0}, {"key": "35391734", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20946968922553694, "ground_truth": 0}, {"key": "35391734", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3486451526003269, "ground_truth": 0}, {"key": "35391734", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14414884833470912, "ground_truth": 0}, {"key": "35391734", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1993080030049695, "ground_truth": 0}, {"key": "35391734", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462822469363, "ground_truth": 0}, {"key": "40214591", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.135689550394736, "ground_truth": 0}, {"key": "40214591", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30902369589841455, "ground_truth": 0}, {"key": "40214591", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606816860823535, "ground_truth": 0}, {"key": "40214591", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667161170071133, "ground_truth": 0}, {"key": "40214591", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19806417398208123, "ground_truth": 0}, {"key": "26283171", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4902356049054261, "ground_truth": 0}, {"key": "26283171", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5331543959455795, "ground_truth": 0}, {"key": "26283171", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2893717037729215, "ground_truth": 0}, {"key": "26283171", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539241802113, "ground_truth": 0}, {"key": "26283171", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881404122418, "ground_truth": 0}, {"key": "37084030", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2337063359964009, "ground_truth": 0}, {"key": "37084030", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733751238559526, "ground_truth": 0}, {"key": "37084030", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378235023585008, "ground_truth": 0}, {"key": "37084030", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.364777556822413, "ground_truth": 0}, {"key": "37084030", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18010665798722028, "ground_truth": 0}, {"key": "39027295", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10594828003397257, "ground_truth": 0}, {"key": "39027295", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1835936112611595, "ground_truth": 0}, {"key": "39027295", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2735744081112747, "ground_truth": 0}, {"key": "39027295", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2351083832439581, "ground_truth": 0}, {"key": "39027295", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.08694165879398075, "ground_truth": 0}, {"key": "14018647", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14318770968418043, "ground_truth": 0}, {"key": "14018647", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510838897929323, "ground_truth": 0}, {"key": "14018647", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23231015817122436, "ground_truth": 0}, {"key": "14018647", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506537793247596, "ground_truth": 0}, {"key": "14018647", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563398211467, "ground_truth": 0}, {"key": "37424289", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7476159451334347, "ground_truth": 0}, {"key": "37424289", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8233284047382128, "ground_truth": 0}, {"key": "37424289", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8116760273350345, "ground_truth": 0}, {"key": "37424289", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867819878566, "ground_truth": 0}, {"key": "37424289", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640357414252, "ground_truth": 0}, {"key": "37498031", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31912138821999303, "ground_truth": 0}, {"key": "37498031", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202456645148687, "ground_truth": 0}, {"key": "37498031", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31237000132891757, "ground_truth": 0}, {"key": "37498031", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.69264197989687, "ground_truth": 0}, {"key": "37498031", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44552953407295065, "ground_truth": 0}, {"key": "30104095", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7745833900341931, "ground_truth": 0}, {"key": "30104095", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8529354709958118, "ground_truth": 0}, {"key": "30104095", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.626124190568759, "ground_truth": 0}, {"key": "30104095", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216505729809, "ground_truth": 0}, {"key": "30104095", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.455198622246151, "ground_truth": 0}, {"key": "37911407", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5428632801297112, "ground_truth": 0}, {"key": "37911407", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5370413804717861, "ground_truth": 0}, {"key": "37911407", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7233094751880115, "ground_truth": 0}, {"key": "37911407", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.602061583471617, "ground_truth": 0}, {"key": "37911407", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964379655916, "ground_truth": 0}, {"key": "39177472", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5964331840287637, "ground_truth": 0}, {"key": "39177472", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.509764336158117, "ground_truth": 0}, {"key": "39177472", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3998116270900258, "ground_truth": 0}, {"key": "39177472", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310692258961, "ground_truth": 0}, {"key": "39177472", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366157305226, "ground_truth": 0}, {"key": "32325454", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24364245040953048, "ground_truth": 0}, {"key": "32325454", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07864237796839313, "ground_truth": 0}, {"key": "32325454", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11201595462764949, "ground_truth": 0}, {"key": "32325454", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364243147838738, "ground_truth": 0}, {"key": "32325454", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10230470487236226, "ground_truth": 0}, {"key": "38395319", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48047867548498047, "ground_truth": 0}, {"key": "38395319", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4824291233752773, "ground_truth": 0}, {"key": "38395319", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.315735981010308, "ground_truth": 0}, {"key": "38395319", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220178210503594, "ground_truth": 0}, {"key": "38395319", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832361425719, "ground_truth": 0}, {"key": "38235895", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.240774592571533, "ground_truth": 0}, {"key": "38235895", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.437823484942561, "ground_truth": 0}, {"key": "38235895", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38491215121384154, "ground_truth": 0}, {"key": "38235895", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513230182326, "ground_truth": 0}, {"key": "38235895", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234884248186, "ground_truth": 0}, {"key": "26543267", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33633105568267885, "ground_truth": 0}, {"key": "26543267", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2643583628071652, "ground_truth": 0}, {"key": "26543267", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40356686307291884, "ground_truth": 0}, {"key": "26543267", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912138349231745, "ground_truth": 0}, {"key": "26543267", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436409610011, "ground_truth": 0}, {"key": "39054728", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9304582548231362, "ground_truth": 0}, {"key": "39054728", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.967163045698854, "ground_truth": 0}, {"key": "39054728", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9465966673216023, "ground_truth": 0}, {"key": "39054728", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9539660977429586, "ground_truth": 0}, {"key": "39054728", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9829546824196874, "ground_truth": 0}, {"key": "39158443", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.261330903841878, "ground_truth": 0}, {"key": "39158443", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2568319911017332, "ground_truth": 0}, {"key": "39158443", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43974737862267854, "ground_truth": 0}, {"key": "39158443", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1550784853546433, "ground_truth": 0}, {"key": "39158443", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825678080956645, "ground_truth": 0}, {"key": "36254201", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49609385600037215, "ground_truth": 0}, {"key": "36254201", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30569732590452675, "ground_truth": 0}, {"key": "36254201", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3830641729133447, "ground_truth": 0}, {"key": "36254201", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1561049027631702, "ground_truth": 0}, {"key": "36254201", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.368405700890763, "ground_truth": 0}, {"key": "23434347", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262548138218, "ground_truth": 0}, {"key": "23434347", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12002562195535188, "ground_truth": 0}, {"key": "23434347", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3522017800627405, "ground_truth": 0}, {"key": "23434347", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37754066316816853, "ground_truth": 0}, {"key": "23434347", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3647775345900174, "ground_truth": 0}, {"key": "34397620", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22678362937660293, "ground_truth": 0}, {"key": "34397620", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13028542471661053, "ground_truth": 0}, {"key": "34397620", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3557748874762544, "ground_truth": 0}, {"key": "34397620", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667539765934655, "ground_truth": 0}, {"key": "34397620", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510837665024859, "ground_truth": 0}, {"key": "34340916", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21206879890296396, "ground_truth": 0}, {"key": "34340916", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733752657276525, "ground_truth": 0}, {"key": "34340916", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1460872413296205, "ground_truth": 0}, {"key": "34340916", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583468398658, "ground_truth": 0}, {"key": "34340916", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880711363185, "ground_truth": 0}, {"key": "30375089", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21733751825227668, "ground_truth": 0}, {"key": "30375089", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202456238241074, "ground_truth": 0}, {"key": "30375089", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1766716068638801, "ground_truth": 0}, {"key": "30375089", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832398985791624, "ground_truth": 0}, {"key": "30375089", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416860974727, "ground_truth": 0}, {"key": "35807797", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5755879881828128, "ground_truth": 0}, {"key": "35807797", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4073334172428848, "ground_truth": 0}, {"key": "35807797", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5983122065601758, "ground_truth": 0}, {"key": "35807797", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601553511604, "ground_truth": 0}, {"key": "35807797", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580908577815, "ground_truth": 0}, {"key": "34188172", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17441026751556726, "ground_truth": 0}, {"key": "34188172", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.165593115510929, "ground_truth": 0}, {"key": "34188172", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10521053681613174, "ground_truth": 0}, {"key": "34188172", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1520322390097324, "ground_truth": 0}, {"key": "34188172", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284183835309216, "ground_truth": 0}, {"key": "37075567", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6095241694626371, "ground_truth": 0}, {"key": "37075567", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5621765108863348, "ground_truth": 0}, {"key": "37075567", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8210441171104327, "ground_truth": 0}, {"key": "37075567", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634033060916, "ground_truth": 0}, {"key": "37075567", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.57749537328334, "ground_truth": 0}, {"key": "35559735", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2267836488487816, "ground_truth": 0}, {"key": "35559735", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8278281521350385, "ground_truth": 0}, {"key": "35559735", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32594951715568976, "ground_truth": 0}, {"key": "35559735", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.607663173866561, "ground_truth": 0}, {"key": "35559735", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491214356708153, "ground_truth": 0}, {"key": "33005019", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2379298885888646, "ground_truth": 0}, {"key": "33005019", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28776781450909333, "ground_truth": 0}, {"key": "33005019", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5117166131738535, "ground_truth": 0}, {"key": "33005019", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29746996117304075, "ground_truth": 0}, {"key": "33005019", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1871326917304428, "ground_truth": 0}, {"key": "30808252", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8749346158107614, "ground_truth": 0}, {"key": "30808252", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.873214828636071, "ground_truth": 0}, {"key": "30808252", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7981867761997584, "ground_truth": 0}, {"key": "30808252", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743532752191, "ground_truth": 0}, {"key": "30808252", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624792435446, "ground_truth": 0}, {"key": "15159017", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3486451457291661, "ground_truth": 0}, {"key": "15159017", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22678363558070264, "ground_truth": 0}, {"key": "15159017", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4244119927518303, "ground_truth": 0}, {"key": "15159017", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285233434630573, "ground_truth": 0}, {"key": "15159017", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819974206326, "ground_truth": 0}, {"key": "24493400", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1602660337755303, "ground_truth": 0}, {"key": "24493400", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5312093714787022, "ground_truth": 0}, {"key": "24493400", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3293917182671563, "ground_truth": 0}, {"key": "24493400", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315416113323, "ground_truth": 0}, {"key": "24493400", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.61508785507017, "ground_truth": 0}, {"key": "37791071", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4148988453182899, "ground_truth": 0}, {"key": "37791071", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7074046915485945, "ground_truth": 0}, {"key": "37791071", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4687905993414803, "ground_truth": 0}, {"key": "37791071", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073662693823, "ground_truth": 0}, {"key": "37791071", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291219638306, "ground_truth": 0}, {"key": "33528627", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.353986311227867, "ground_truth": 0}, {"key": "33528627", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36477756355014695, "ground_truth": 0}, {"key": "33528627", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4320634108293558, "ground_truth": 0}, {"key": "33528627", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495271527047, "ground_truth": 0}, {"key": "33528627", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384144656141, "ground_truth": 0}, {"key": "39925662", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6723317102871011, "ground_truth": 0}, {"key": "39925662", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7534666358944523, "ground_truth": 0}, {"key": "39925662", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238598140332, "ground_truth": 0}, {"key": "39925662", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408967853613, "ground_truth": 0}, {"key": "39925662", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645845439127, "ground_truth": 0}, {"key": "29213416", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2043419004506601, "ground_truth": 0}, {"key": "29213416", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7969253679537012, "ground_truth": 0}, {"key": "29213416", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4960938362373227, "ground_truth": 0}, {"key": "29213416", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030661897068, "ground_truth": 0}, {"key": "29213416", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398630811155474, "ground_truth": 0}, {"key": "34492745", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12852513214165903, "ground_truth": 0}, {"key": "34492745", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20434190088537893, "ground_truth": 0}, {"key": "34492745", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22678363008715546, "ground_truth": 0}, {"key": "34492745", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746030490494515, "ground_truth": 0}, {"key": "34492745", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910519049022327, "ground_truth": 0}, {"key": "34191937", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27669052435126007, "ground_truth": 0}, {"key": "34191937", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16026603214788468, "ground_truth": 0}, {"key": "34191937", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135069860126705, "ground_truth": 0}, {"key": "34191937", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071645079241, "ground_truth": 0}, {"key": "34191937", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25386099613674473, "ground_truth": 0}, {"key": "34933372", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49414090965276775, "ground_truth": 0}, {"key": "34933372", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4073333858081176, "ground_truth": 0}, {"key": "34933372", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2553436378628607, "ground_truth": 0}, {"key": "34933372", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573597497564193, "ground_truth": 0}, {"key": "34933372", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668527561004, "ground_truth": 0}, {"key": "38714379", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8670357596272695, "ground_truth": 0}, {"key": "38714379", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6926419736539594, "ground_truth": 0}, {"key": "38714379", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.732591836457916, "ground_truth": 0}, {"key": "38714379", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419625846649, "ground_truth": 0}, {"key": "38714379", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891328872506, "ground_truth": 0}, {"key": "39220660", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6001883633817854, "ground_truth": 0}, {"key": "39220660", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5136684847285136, "ground_truth": 0}, {"key": "39220660", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5214711919508372, "ground_truth": 0}, {"key": "39220660", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684729179296, "ground_truth": 0}, {"key": "39220660", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49023560149535766, "ground_truth": 0}, {"key": "41028780", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817892587171544, "ground_truth": 0}, {"key": "41028780", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3191213689042299, "ground_truth": 0}, {"key": "41028780", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21337716622514538, "ground_truth": 0}, {"key": "41028780", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623983124283, "ground_truth": 0}, {"key": "41028780", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23231014512024722, "ground_truth": 0}, {"key": "39457108", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6531269139601434, "ground_truth": 0}, {"key": "39457108", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3998116316363904, "ground_truth": 0}, {"key": "39457108", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32423539966492376, "ground_truth": 0}, {"key": "39457108", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238811741952, "ground_truth": 0}, {"key": "39457108", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300356278707445, "ground_truth": 0}, {"key": "38288018", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5563995824889884, "ground_truth": 0}, {"key": "38288018", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3757064723737794, "ground_truth": 0}, {"key": "38288018", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4532618670970829, "ground_truth": 0}, {"key": "38288018", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29910519957959986, "ground_truth": 0}, {"key": "38288018", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934934297030286, "ground_truth": 0}, {"key": "40106293", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11516223315974365, "ground_truth": 0}, {"key": "40106293", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19682620759872602, "ground_truth": 0}, {"key": "40106293", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11357958672021526, "ground_truth": 0}, {"key": "40106293", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1422318873818861, "ground_truth": 0}, {"key": "40106293", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1530421550115668, "ground_truth": 0}, {"key": "39948797", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21469142042404737, "ground_truth": 0}, {"key": "39948797", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6150878537819549, "ground_truth": 0}, {"key": "39948797", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4148988403294685, "ground_truth": 0}, {"key": "39948797", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687308938234657, "ground_truth": 0}, {"key": "39948797", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101674938329756, "ground_truth": 0}, {"key": "31853399", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7295197723554757, "ground_truth": 0}, {"key": "31853399", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40922078862253775, "ground_truth": 0}, {"key": "31853399", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7956581162679713, "ground_truth": 0}, {"key": "31853399", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926420018491163, "ground_truth": 0}, {"key": "31853399", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837594808773, "ground_truth": 0}, {"key": "35273252", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2081789356099549, "ground_truth": 0}, {"key": "35273252", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953521361264334, "ground_truth": 0}, {"key": "35273252", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782567898858855, "ground_truth": 0}, {"key": "35273252", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713267743280143, "ground_truth": 0}, {"key": "35273252", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766716062719599, "ground_truth": 0}, {"key": "37130459", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7431680197609296, "ground_truth": 0}, {"key": "37130459", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9246876913587171, "ground_truth": 0}, {"key": "37130459", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9032942103198928, "ground_truth": 0}, {"key": "37130459", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869881585326, "ground_truth": 0}, {"key": "37130459", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218294567625, "ground_truth": 0}, {"key": "21734003", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18952107026715692, "ground_truth": 0}, {"key": "21734003", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6513548642445754, "ground_truth": 0}, {"key": "21734003", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6150878691327327, "ground_truth": 0}, {"key": "21734003", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937837030275356, "ground_truth": 0}, {"key": "21734003", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569735582549973, "ground_truth": 0}, {"key": "33990737", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47268347374367026, "ground_truth": 0}, {"key": "33990737", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21206881185630727, "ground_truth": 0}, {"key": "33990737", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25534367625976484, "ground_truth": 0}, {"key": "33990737", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1470645299214472, "ground_truth": 0}, {"key": "33990737", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519858911687316, "ground_truth": 0}, {"key": "34559912", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5964331686408507, "ground_truth": 0}, {"key": "34559912", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6076631701564486, "ground_truth": 0}, {"key": "34559912", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5888891197682854, "ground_truth": 0}, {"key": "34559912", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217431973437023, "ground_truth": 0}, {"key": "34559912", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601352327869, "ground_truth": 0}, {"key": "39820439", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09073548494367512, "ground_truth": 0}, {"key": "39820439", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21601153627896513, "ground_truth": 0}, {"key": "39820439", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825679574024287, "ground_truth": 0}, {"key": "39820439", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669053482583766, "ground_truth": 0}, {"key": "39820439", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651622662678437, "ground_truth": 0}, {"key": "34759328", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891416140757, "ground_truth": 0}, {"key": "34759328", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5214711475690124, "ground_truth": 0}, {"key": "34759328", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6791786943817542, "ground_truth": 0}, {"key": "34759328", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089219117432, "ground_truth": 0}, {"key": "34759328", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191399002364, "ground_truth": 0}, {"key": "36939137", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31236999750875094, "ground_truth": 0}, {"key": "36939137", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7476159563981446, "ground_truth": 0}, {"key": "36939137", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6808786278624539, "ground_truth": 0}, {"key": "36939137", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745834059374698, "ground_truth": 0}, {"key": "36939137", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159523195026, "ground_truth": 0}, {"key": "35851522", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34510529201136975, "ground_truth": 0}, {"key": "35851522", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47657966703122134, "ground_truth": 0}, {"key": "35851522", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2643583581919838, "ground_truth": 0}, {"key": "35851522", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982763560954105, "ground_truth": 0}, {"key": "35851522", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743759094965, "ground_truth": 0}, {"key": "22412782", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24944722896927213, "ground_truth": 0}, {"key": "22412782", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510837430000237, "ground_truth": 0}, {"key": "22412782", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2281565111544026, "ground_truth": 0}, {"key": "22412782", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2005576834126096, "ground_truth": 0}, {"key": "22412782", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197362299733, "ground_truth": 0}, {"key": "38579227", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41679665509827124, "ground_truth": 0}, {"key": "38579227", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4980468974889623, "ground_truth": 0}, {"key": "38579227", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.325949530519114, "ground_truth": 0}, {"key": "38579227", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268346470866124, "ground_truth": 0}, {"key": "38579227", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711589210185, "ground_truth": 0}, {"key": "37206995", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1744102823904927, "ground_truth": 0}, {"key": "37206995", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27982849452923614, "ground_truth": 0}, {"key": "37206995", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17895590544169468, "ground_truth": 0}, {"key": "37206995", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610173706875, "ground_truth": 0}, {"key": "37206995", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26740816185448396, "ground_truth": 0}, {"key": "38700847", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6460137196391789, "ground_truth": 0}, {"key": "38700847", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40544870278416906, "ground_truth": 0}, {"key": "38700847", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40544872731006487, "ground_truth": 0}, {"key": "38700847", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238797441077, "ground_truth": 0}, {"key": "38700847", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054487507239927, "ground_truth": 0}, {"key": "20246590", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9664104920400698, "ground_truth": 0}, {"key": "20246590", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9750122062427312, "ground_truth": 0}, {"key": "20246590", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9669140215039718, "ground_truth": 0}, {"key": "20246590", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067244432498, "ground_truth": 0}, {"key": "20246590", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9775429458526699, "ground_truth": 0}, {"key": "39141360", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6206216168812819, "ground_truth": 0}, {"key": "39141360", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5370414177788468, "ground_truth": 0}, {"key": "39141360", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6352224413713565, "ground_truth": 0}, {"key": "39141360", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241830842795, "ground_truth": 0}, {"key": "39141360", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512161299013, "ground_truth": 0}, {"key": "37906226", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1294027232420813, "ground_truth": 0}, {"key": "37906226", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08035746959747248, "ground_truth": 0}, {"key": "37906226", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10017222262360513, "ground_truth": 0}, {"key": "37906226", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608725086626598, "ground_truth": 0}, {"key": "37906226", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2160115342743026, "ground_truth": 0}, {"key": "16201033", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11436852626788588, "ground_truth": 0}, {"key": "16201033", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1812631914293823, "ground_truth": 0}, {"key": "16201033", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17328820664636355, "ground_truth": 0}, {"key": "16201033", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0758581773435598, "ground_truth": 0}, {"key": "16201033", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091975632603223, "ground_truth": 0}, {"key": "36469022", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.517570895436829, "ground_truth": 0}, {"key": "36469022", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4054487340332283, "ground_truth": 0}, {"key": "36469022", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3522017772427734, "ground_truth": 0}, {"key": "36469022", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618602199498, "ground_truth": 0}, {"key": "36469022", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.498046879731853, "ground_truth": 0}, {"key": "31295270", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.041462274120198976, "ground_truth": 0}, {"key": "31295270", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.386763445670185, "ground_truth": 0}, {"key": "31295270", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1066905942397827, "ground_truth": 0}, {"key": "31295270", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541661019478126, "ground_truth": 0}, {"key": "31295270", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421301083350941, "ground_truth": 0}, {"key": "35360689", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26588047910388196, "ground_truth": 0}, {"key": "35360689", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12002563258374502, "ground_truth": 0}, {"key": "35360689", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09467770028223414, "ground_truth": 0}, {"key": "35360689", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09268777870613344, "ground_truth": 0}, {"key": "35360689", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1721718617045923, "ground_truth": 0}, {"key": "29202793", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23510839194440433, "ground_truth": 0}, {"key": "29202793", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31237001282513627, "ground_truth": 0}, {"key": "29202793", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31573598770592687, "ground_truth": 0}, {"key": "29202793", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771405287409, "ground_truth": 0}, {"key": "29202793", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202455869909353, "ground_truth": 0}, {"key": "35999008", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23792988905092763, "ground_truth": 0}, {"key": "35999008", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13117322190501132, "ground_truth": 0}, {"key": "35999008", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07921031840133576, "ground_truth": 0}, {"key": "35999008", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09268777247523383, "ground_truth": 0}, {"key": "35999008", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220561894771395, "ground_truth": 0}, {"key": "31797119", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6150878573700234, "ground_truth": 0}, {"key": "31797119", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3522017673477863, "ground_truth": 0}, {"key": "31797119", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3738758299980323, "ground_truth": 0}, {"key": "31797119", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.538983229870986, "ground_truth": 0}, {"key": "31797119", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762877403329, "ground_truth": 0}, {"key": "26711893", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24077460593895852, "ground_truth": 0}, {"key": "26711893", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24364241985311255, "ground_truth": 0}, {"key": "26711893", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3575675283427977, "ground_truth": 0}, {"key": "26711893", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751525864242, "ground_truth": 0}, {"key": "26711893", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242551430035536, "ground_truth": 0}, {"key": "35348288", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17328820262347347, "ground_truth": 0}, {"key": "35348288", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19930801374272722, "ground_truth": 0}, {"key": "35348288", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2658804895580239, "ground_truth": 0}, {"key": "35348288", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09138210750968878, "ground_truth": 0}, {"key": "35348288", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766715957726704, "ground_truth": 0}, {"key": "38124131", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10818895209520663, "ground_truth": 0}, {"key": "38124131", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14318770695371283, "ground_truth": 0}, {"key": "38124131", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16559310918861345, "ground_truth": 0}, {"key": "38124131", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689406446445355, "ground_truth": 0}, {"key": "38124131", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077460015435745, "ground_truth": 0}, {"key": "20285901", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3140505326155334, "ground_truth": 0}, {"key": "20285901", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26740816592633465, "ground_truth": 0}, {"key": "20285901", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24077460259384031, "ground_truth": 0}, {"key": "20285901", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051743790242, "ground_truth": 0}, {"key": "20285901", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29583988124135496, "ground_truth": 0}, {"key": "35633632", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344543036514647, "ground_truth": 0}, {"key": "35633632", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2465333291765954, "ground_truth": 0}, {"key": "35633632", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2735743951479992, "ground_truth": 0}, {"key": "35633632", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25534365673728715, "ground_truth": 0}, {"key": "35633632", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469140562132316, "ground_truth": 0}, {"key": "10741274", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.753466653232155, "ground_truth": 0}, {"key": "10741274", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4726834649622768, "ground_truth": 0}, {"key": "10741274", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7866228195899041, "ground_truth": 0}, {"key": "10741274", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948153437656, "ground_truth": 0}, {"key": "10741274", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804325514952, "ground_truth": 0}, {"key": "30605795", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4551986150578422, "ground_truth": 0}, {"key": "30605795", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5486734858113623, "ground_truth": 0}, {"key": "30605795", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4610167921156511, "ground_truth": 0}, {"key": "30605795", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633840014507, "ground_truth": 0}, {"key": "30605795", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969081810035, "ground_truth": 0}, {"key": "30539722", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10970577210819853, "ground_truth": 0}, {"key": "30539722", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2094696884949089, "ground_truth": 0}, {"key": "30539722", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12168574688817363, "ground_truth": 0}, {"key": "30539722", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276111010291, "ground_truth": 0}, {"key": "30539722", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193279513372172, "ground_truth": 0}, {"key": "18639299", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4436004268531385, "ground_truth": 0}, {"key": "18639299", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07055959468072383, "ground_truth": 0}, {"key": "18639299", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1623800344243862, "ground_truth": 0}, {"key": "18639299", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1710611931705537, "ground_truth": 0}, {"key": "18639299", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1540575708312296, "ground_truth": 0}, {"key": "39773552", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3040416771079541, "ground_truth": 0}, {"key": "39773552", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2227001376844698, "ground_truth": 0}, {"key": "39773552", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.261330933489469, "ground_truth": 0}, {"key": "39773552", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815650790404768, "ground_truth": 0}, {"key": "39773552", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676401253830433, "ground_truth": 0}, {"key": "34086410", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3208212933114551, "ground_truth": 0}, {"key": "34086410", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733751357589415, "ground_truth": 0}, {"key": "34086410", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13117322356947753, "ground_truth": 0}, {"key": "34086410", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.05877655740354348, "ground_truth": 0}, {"key": "34086410", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059552605525, "ground_truth": 0}, {"key": "35454652", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2674081530711193, "ground_truth": 0}, {"key": "35454652", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.392336836772976, "ground_truth": 0}, {"key": "35454652", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936413919500193, "ground_truth": 0}, {"key": "35454652", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2958398847748651, "ground_truth": 0}, {"key": "35454652", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387581635071404, "ground_truth": 0}, {"key": "36158310", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4282333603658057, "ground_truth": 0}, {"key": "36158310", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10743747119122533, "ground_truth": 0}, {"key": "36158310", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6619228607044215, "ground_truth": 0}, {"key": "36158310", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557749019100507, "ground_truth": 0}, {"key": "36158310", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384197617736, "ground_truth": 0}, {"key": "35688387", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16559311754856812, "ground_truth": 0}, {"key": "35688387", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42632158283629534, "ground_truth": 0}, {"key": "35688387", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08093670912318168, "ground_truth": 0}, {"key": "35688387", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07921032004659159, "ground_truth": 0}, {"key": "35688387", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12085323604337032, "ground_truth": 0}, {"key": "34209292", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486734564765912, "ground_truth": 0}, {"key": "34209292", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34864513725509116, "ground_truth": 0}, {"key": "34209292", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29910518846183937, "ground_truth": 0}, {"key": "34209292", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907610200254473, "ground_truth": 0}, {"key": "34209292", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930799371444596, "ground_truth": 0}, {"key": "25037859", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2200071011250414, "ground_truth": 0}, {"key": "25037859", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925952861338625, "ground_truth": 0}, {"key": "25037859", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2018132110222854, "ground_truth": 0}, {"key": "25037859", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595207457313, "ground_truth": 0}, {"key": "25037859", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817436119991102, "ground_truth": 0}, {"key": "36412121", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324658854058, "ground_truth": 0}, {"key": "36412121", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6315943177153548, "ground_truth": 0}, {"key": "36412121", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5717665724480221, "ground_truth": 0}, {"key": "36412121", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943691784176, "ground_truth": 0}, {"key": "36412121", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102583008878, "ground_truth": 0}, {"key": "34909172", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47657966849595024, "ground_truth": 0}, {"key": "34909172", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3611647258474466, "ground_truth": 0}, {"key": "34909172", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37022538667511407, "ground_truth": 0}, {"key": "34909172", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022539503573, "ground_truth": 0}, {"key": "34909172", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172746082107, "ground_truth": 0}, {"key": "39011806", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3942009365504647, "ground_truth": 0}, {"key": "39011806", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26740815384910616, "ground_truth": 0}, {"key": "39011806", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36296919822116674, "ground_truth": 0}, {"key": "39011806", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937835147062593, "ground_truth": 0}, {"key": "39011806", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36840568852533345, "ground_truth": 0}, {"key": "33096163", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5136684579309467, "ground_truth": 0}, {"key": "33096163", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381557360088, "ground_truth": 0}, {"key": "33096163", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.709019144705245, "ground_truth": 0}, {"key": "33096163", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926550736666, "ground_truth": 0}, {"key": "33096163", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593168902435, "ground_truth": 0}, {"key": "38762205", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4035668505875668, "ground_truth": 0}, {"key": "38762205", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.796925382438874, "ground_truth": 0}, {"key": "38762205", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952110107501027, "ground_truth": 0}, {"key": "38762205", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717665852055841, "ground_truth": 0}, {"key": "38762205", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641409930508, "ground_truth": 0}, {"key": "35519177", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33458943839734534, "ground_truth": 0}, {"key": "35519177", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771159087978, "ground_truth": 0}, {"key": "35519177", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40356683522137987, "ground_truth": 0}, {"key": "35519177", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295130277047, "ground_truth": 0}, {"key": "35519177", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640985272586917, "ground_truth": 0}, {"key": "36192531", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758625217585, "ground_truth": 0}, {"key": "36192531", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061666237084, "ground_truth": 0}, {"key": "36192531", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4244119954346047, "ground_truth": 0}, {"key": "36192531", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441199045611505, "ground_truth": 0}, {"key": "36192531", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526543328172, "ground_truth": 0}, {"key": "33160852", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9539661007821996, "ground_truth": 0}, {"key": "33160852", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9515039978006269, "ground_truth": 0}, {"key": "33160852", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8856314787686612, "ground_truth": 0}, {"key": "33160852", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951033774418, "ground_truth": 0}, {"key": "33160852", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210675049966, "ground_truth": 0}, {"key": "36312304", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22000710253265368, "ground_truth": 0}, {"key": "36312304", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.281405586192467, "ground_truth": 0}, {"key": "36312304", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2509127699025064, "ground_truth": 0}, {"key": "36312304", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2704802309005931, "ground_truth": 0}, {"key": "36312304", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217184228503835, "ground_truth": 0}, {"key": "33773343", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667160839916715, "ground_truth": 0}, {"key": "33773343", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4092207964768481, "ground_truth": 0}, {"key": "33773343", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910713123803, "ground_truth": 0}, {"key": "33773343", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633103647404466, "ground_truth": 0}, {"key": "33773343", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364246472553025, "ground_truth": 0}, {"key": "34913320", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5679366147912228, "ground_truth": 0}, {"key": "34913320", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.554470484832233, "ground_truth": 0}, {"key": "34913320", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606815954077035, "ground_truth": 0}, {"key": "34913320", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397003653857, "ground_truth": 0}, {"key": "34913320", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.726425593190198, "ground_truth": 0}, {"key": "33784155", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22135069102218125, "ground_truth": 0}, {"key": "33784155", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990363904053, "ground_truth": 0}, {"key": "33784155", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17895589818768434, "ground_truth": 0}, {"key": "33784155", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595132472009, "ground_truth": 0}, {"key": "33784155", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3123700036102772, "ground_truth": 0}, {"key": "24085062", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.987472066667625, "ground_truth": 0}, {"key": "24085062", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9585377244171418, "ground_truth": 0}, {"key": "24085062", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9676556689179019, "ground_truth": 0}, {"key": "24085062", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.989347488159456, "ground_truth": 0}, {"key": "24085062", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9833429602000442, "ground_truth": 0}, {"key": "33893487", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1338674955755659, "ground_truth": 0}, {"key": "33893487", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12852514186566144, "ground_truth": 0}, {"key": "33893487", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36477756864056293, "ground_truth": 0}, {"key": "33893487", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252321283804177, "ground_truth": 0}, {"key": "33893487", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055769305775442, "ground_truth": 0}, {"key": "40913011", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7074047170421777, "ground_truth": 0}, {"key": "40913011", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8092759647196562, "ground_truth": 0}, {"key": "40913011", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7772998749799356, "ground_truth": 0}, {"key": "40913011", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.73259183974943, "ground_truth": 0}, {"key": "40913011", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673209199215, "ground_truth": 0}, {"key": "29642545", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2845760056538465, "ground_truth": 0}, {"key": "29642545", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1847675181572364, "ground_truth": 0}, {"key": "29642545", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28298811942340013, "ground_truth": 0}, {"key": "29642545", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808694234156, "ground_truth": 0}, {"key": "29642545", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683200679969675, "ground_truth": 0}, {"key": "35969159", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2160115435592947, "ground_truth": 0}, {"key": "35969159", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2751297272140494, "ground_truth": 0}, {"key": "35969159", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.194367820034857, "ground_truth": 0}, {"key": "35969159", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2005576831276532, "ground_truth": 0}, {"key": "35969159", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825676624885853, "ground_truth": 0}, {"key": "37081669", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3208213071402758, "ground_truth": 0}, {"key": "37081669", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6095241572713913, "ground_truth": 0}, {"key": "37081669", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4320634068038252, "ground_truth": 0}, {"key": "37081669", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434190636451482, "ground_truth": 0}, {"key": "37081669", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2337063509154816, "ground_truth": 0}, {"key": "40048022", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46490156430965895, "ground_truth": 0}, {"key": "40048022", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41300355064315086, "ground_truth": 0}, {"key": "40048022", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.352201809253835, "ground_truth": 0}, {"key": "40048022", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922078017877656, "ground_truth": 0}, {"key": "40048022", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3259495330653621, "ground_truth": 0}, {"key": "32884004", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4649015923201741, "ground_truth": 0}, {"key": "32884004", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7386690720308832, "ground_truth": 0}, {"key": "32884004", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.433981490673738, "ground_truth": 0}, {"key": "32884004", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406706532394, "ground_truth": 0}, {"key": "32884004", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30735798229323946, "ground_truth": 0}, {"key": "39022490", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168783450620604, "ground_truth": 0}, {"key": "39022490", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37570644174153506, "ground_truth": 0}, {"key": "39022490", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48438006312748044, "ground_truth": 0}, {"key": "39022490", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116472829445884, "ground_truth": 0}, {"key": "39022490", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974733179956466, "ground_truth": 0}, {"key": "35159385", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5813030813531824, "ground_truth": 0}, {"key": "35159385", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7943849558099197, "ground_truth": 0}, {"key": "35159385", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47268350131639497, "ground_truth": 0}, {"key": "35159385", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165052794836, "ground_truth": 0}, {"key": "35159385", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943857819249, "ground_truth": 0}, {"key": "34363669", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.525368820897519, "ground_truth": 0}, {"key": "34363669", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43590151927176507, "ground_truth": 0}, {"key": "34363669", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823336927855843, "ground_truth": 0}, {"key": "34363669", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583985826527115, "ground_truth": 0}, {"key": "34363669", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126319613313205, "ground_truth": 0}, {"key": "36119687", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7718434983657669, "ground_truth": 0}, {"key": "36119687", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4339814626397668, "ground_truth": 0}, {"key": "36119687", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7745833980220741, "ground_truth": 0}, {"key": "36119687", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303129222002, "ground_truth": 0}, {"key": "36119687", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714927287762, "ground_truth": 0}, {"key": "35217446", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5058591259160846, "ground_truth": 0}, {"key": "35217446", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43974736422270155, "ground_truth": 0}, {"key": "35217446", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5292633865522332, "ground_truth": 0}, {"key": "35217446", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653335149586594, "ground_truth": 0}, {"key": "35217446", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118474748715, "ground_truth": 0}, {"key": "39049331", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13660839317837445, "ground_truth": 0}, {"key": "39049331", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12002562758121925, "ground_truth": 0}, {"key": "39049331", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13846178485265115, "ground_truth": 0}, {"key": "39049331", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07921031774994448, "ground_truth": 0}, {"key": "39049331", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660839537871478, "ground_truth": 0}, {"key": "36472242", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6334102375698076, "ground_truth": 0}, {"key": "36472242", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6406358662658364, "ground_truth": 0}, {"key": "36472242", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5679366044764398, "ground_truth": 0}, {"key": "36472242", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689278484277, "ground_truth": 0}, {"key": "36472242", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935424778004, "ground_truth": 0}, {"key": "31854721", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6388352862929731, "ground_truth": 0}, {"key": "31854721", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.611381980698616, "ground_truth": 0}, {"key": "31854721", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6132365979689963, "ground_truth": 0}, {"key": "31854721", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688808624563, "ground_truth": 0}, {"key": "31854721", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195286271366, "ground_truth": 0}, {"key": "18725849", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26740815751907626, "ground_truth": 0}, {"key": "18725849", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953520891966556, "ground_truth": 0}, {"key": "18725849", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3398276433362575, "ground_truth": 0}, {"key": "18725849", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666190881197, "ground_truth": 0}, {"key": "18725849", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242911184383713, "ground_truth": 0}, {"key": "36883179", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2146914134167552, "ground_truth": 0}, {"key": "36883179", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15002882407842807, "ground_truth": 0}, {"key": "36883179", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.047780069375313004, "ground_truth": 0}, {"key": "36883179", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08694166178950437, "ground_truth": 0}, {"key": "36883179", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895302952389, "ground_truth": 0}, {"key": "34266359", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3886180498918802, "ground_truth": 0}, {"key": "34266359", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4263215928313584, "ground_truth": 0}, {"key": "34266359", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.418696894705654, "ground_truth": 0}, {"key": "34266359", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311937857935, "ground_truth": 0}, {"key": "34266359", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455670529814, "ground_truth": 0}, {"key": "31920289", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14706453464957525, "ground_truth": 0}, {"key": "31920289", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3140505501846975, "ground_truth": 0}, {"key": "31920289", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31069439548362277, "ground_truth": 0}, {"key": "31920289", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307463649010957, "ground_truth": 0}, {"key": "31920289", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270014386663173, "ground_truth": 0}, {"key": "36292997", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2877677828807758, "ground_truth": 0}, {"key": "36292997", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31573598188382224, "ground_truth": 0}, {"key": "36292997", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43014734209080957, "ground_truth": 0}, {"key": "36292997", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917124556925, "ground_truth": 0}, {"key": "36292997", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.426321585563261, "ground_truth": 0}, {"key": "30412533", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834715033224, "ground_truth": 0}, {"key": "30412533", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5888891324069936, "ground_truth": 0}, {"key": "30412533", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5602526227909905, "ground_truth": 0}, {"key": "30412533", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082754713474, "ground_truth": 0}, {"key": "30412533", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358408780316, "ground_truth": 0}, {"key": "40433191", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074558750060604, "ground_truth": 0}, {"key": "40433191", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3090237109234121, "ground_truth": 0}, {"key": "40433191", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5234203358578825, "ground_truth": 0}, {"key": "40433191", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786297971015, "ground_truth": 0}, {"key": "40433191", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295863429302836, "ground_truth": 0}, {"key": "34565591", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5583269799847649, "ground_truth": 0}, {"key": "34565591", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18010667158139487, "ground_truth": 0}, {"key": "34565591", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2942149641128936, "ground_truth": 0}, {"key": "34565591", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982565149093184, "ground_truth": 0}, {"key": "34565591", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839822263402, "ground_truth": 0}, {"key": "36062480", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39233684690430365, "ground_truth": 0}, {"key": "36062480", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7138307479440443, "ground_truth": 0}, {"key": "36062480", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.73411952046414, "ground_truth": 0}, {"key": "36062480", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.583203354869529, "ground_truth": 0}, {"key": "36062480", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526739840649, "ground_truth": 0}, {"key": "37276883", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32939171005137197, "ground_truth": 0}, {"key": "37276883", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43014734819625616, "ground_truth": 0}, {"key": "37276883", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3468730912649313, "ground_truth": 0}, {"key": "37276883", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708629104052, "ground_truth": 0}, {"key": "37276883", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879064976353235, "ground_truth": 0}, {"key": "38509260", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4035668562551522, "ground_truth": 0}, {"key": "38509260", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7122322032053227, "ground_truth": 0}, {"key": "38509260", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8187368054516271, "ground_truth": 0}, {"key": "38509260", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832187956305, "ground_truth": 0}, {"key": "38509260", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233679734036186, "ground_truth": 0}, {"key": "37139607", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.507811875282659, "ground_truth": 0}, {"key": "37139607", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5640984666040512, "ground_truth": 0}, {"key": "37139607", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5964331268707622, "ground_truth": 0}, {"key": "37139607", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.61693582461017, "ground_truth": 0}, {"key": "37139607", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331281357098, "ground_truth": 0}, {"key": "37092824", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.970687768178597, "ground_truth": 0}, {"key": "37092824", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9268352857472865, "ground_truth": 0}, {"key": "37092824", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9343951675854341, "ground_truth": 0}, {"key": "37092824", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9437636519537422, "ground_truth": 0}, {"key": "37092824", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898223514624, "ground_truth": 0}, {"key": "32191802", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8031738127978822, "ground_truth": 0}, {"key": "32191802", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953779011528, "ground_truth": 0}, {"key": "32191802", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7826624499770071, "ground_truth": 0}, {"key": "32191802", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919896402851, "ground_truth": 0}, {"key": "32191802", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307396123414, "ground_truth": 0}, {"key": "39396038", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7577943825322929, "ground_truth": 0}, {"key": "39396038", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033698257035, "ground_truth": 0}, {"key": "39396038", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6315943101175082, "ground_truth": 0}, {"key": "39396038", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456180769237, "ground_truth": 0}, {"key": "39396038", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476658050298, "ground_truth": 0}, {"key": "39076884", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2829881159926504, "ground_truth": 0}, {"key": "39076884", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31237002111431095, "ground_truth": 0}, {"key": "39076884", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38306415554858086, "ground_truth": 0}, {"key": "39076884", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2583259682634102, "ground_truth": 0}, {"key": "39076884", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.332852345859696, "ground_truth": 0}, {"key": "27763432", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2689414124582041, "ground_truth": 0}, {"key": "27763432", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3090237159745722, "ground_truth": 0}, {"key": "27763432", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3665897236214435, "ground_truth": 0}, {"key": "27763432", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469142434040786, "ground_truth": 0}, {"key": "27763432", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568955606919197, "ground_truth": 0}, {"key": "37806929", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40356684785435526, "ground_truth": 0}, {"key": "37806929", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.416796628120943, "ground_truth": 0}, {"key": "37806929", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31237000366332396, "ground_truth": 0}, {"key": "37806929", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061540513425, "ground_truth": 0}, {"key": "37806929", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684559534454456, "ground_truth": 0}, {"key": "32334186", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4882834112965825, "ground_truth": 0}, {"key": "32334186", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3276683194615688, "ground_truth": 0}, {"key": "32334186", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845760103654155, "ground_truth": 0}, {"key": "32334186", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092208318245251, "ground_truth": 0}, {"key": "32334186", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880177093532, "ground_truth": 0}, {"key": "36187324", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5602526549869865, "ground_truth": 0}, {"key": "36187324", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33458945001149304, "ground_truth": 0}, {"key": "36187324", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629692019520935, "ground_truth": 0}, {"key": "36187324", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406775013422, "ground_truth": 0}, {"key": "36187324", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203485092886, "ground_truth": 0}, {"key": "35306009", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9213576126326007, "ground_truth": 0}, {"key": "35306009", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7185943760722731, "ground_truth": 0}, {"key": "35306009", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8397339776383536, "ground_truth": 0}, {"key": "35306009", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.903974518267456, "ground_truth": 0}, {"key": "35306009", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110467565862, "ground_truth": 0}, {"key": "39490050", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24653334015830658, "ground_truth": 0}, {"key": "39490050", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4882834102656266, "ground_truth": 0}, {"key": "39490050", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15817435749215775, "ground_truth": 0}, {"key": "39490050", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757212829786758, "ground_truth": 0}, {"key": "39490050", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09670578543326588, "ground_truth": 0}, {"key": "38072149", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.521471162020811, "ground_truth": 0}, {"key": "38072149", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3073580251763551, "ground_truth": 0}, {"key": "38072149", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2829881053072786, "ground_truth": 0}, {"key": "38072149", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237285255085, "ground_truth": 0}, {"key": "38072149", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082130671993736, "ground_truth": 0}, {"key": "35899689", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31742624890995147, "ground_truth": 0}, {"key": "35899689", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14223188863773722, "ground_truth": 0}, {"key": "35899689", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20307461202775426, "ground_truth": 0}, {"key": "35899689", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902369432857923, "ground_truth": 0}, {"key": "35899689", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149770947102, "ground_truth": 0}, {"key": "27994518", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0726367045572253, "ground_truth": 0}, {"key": "27994518", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18010666641788453, "ground_truth": 0}, {"key": "27994518", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12506538347413118, "ground_truth": 0}, {"key": "27994518", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09602549483457638, "ground_truth": 0}, {"key": "27994518", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920291210541722, "ground_truth": 0}, {"key": "10615479", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23651623564100643, "ground_truth": 0}, {"key": "10615479", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29746994148648076, "ground_truth": 0}, {"key": "10615479", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3486451452374829, "ground_truth": 0}, {"key": "10615479", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700077218794, "ground_truth": 0}, {"key": "10615479", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523405171619, "ground_truth": 0}, {"key": "40186667", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4263215867460708, "ground_truth": 0}, {"key": "40186667", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22000710900229384, "ground_truth": 0}, {"key": "40186667", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30735804123741134, "ground_truth": 0}, {"key": "40186667", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259529071946216, "ground_truth": 0}, {"key": "40186667", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1993079976000795, "ground_truth": 0}, {"key": "38622886", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4668456025840359, "ground_truth": 0}, {"key": "38622886", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5717666155501993, "ground_truth": 0}, {"key": "38622886", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42632160343865916, "ground_truth": 0}, {"key": "38622886", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984953910164, "ground_truth": 0}, {"key": "38622886", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984226776238, "ground_truth": 0}, {"key": "40686943", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3468730831810444, "ground_truth": 0}, {"key": "40686943", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3276682968107813, "ground_truth": 0}, {"key": "40686943", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.443600416396629, "ground_truth": 0}, {"key": "40686943", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609381811763037, "ground_truth": 0}, {"key": "40686943", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798742492241904, "ground_truth": 0}, {"key": "30604567", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.857768107650605, "ground_truth": 0}, {"key": "30604567", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7826625014167516, "ground_truth": 0}, {"key": "30604567", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7931059343806955, "ground_truth": 0}, {"key": "30604567", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786113761013, "ground_truth": 0}, {"key": "30604567", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.886420413155823, "ground_truth": 0}, {"key": "35440903", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6297746088483529, "ground_truth": 0}, {"key": "35440903", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3174262812409558, "ground_truth": 0}, {"key": "35440903", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5097643812481443, "ground_truth": 0}, {"key": "35440903", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047580603616966, "ground_truth": 0}, {"key": "35440903", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051777535023, "ground_truth": 0}, {"key": "37219533", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13296424636642912, "ground_truth": 0}, {"key": "37219533", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510837333653306, "ground_truth": 0}, {"key": "37219533", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24508500517697746, "ground_truth": 0}, {"key": "37219533", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1801066571734442, "ground_truth": 0}, {"key": "37219533", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13477591875948727, "ground_truth": 0}, {"key": "40178965", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5409238686460073, "ground_truth": 0}, {"key": "40178965", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5698526488966821, "ground_truth": 0}, {"key": "40178965", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6442250964011569, "ground_truth": 0}, {"key": "40178965", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251190779794, "ground_truth": 0}, {"key": "40178965", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864516126711215, "ground_truth": 0}, {"key": "13750468", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23792989608941031, "ground_truth": 0}, {"key": "13750468", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24220563848772364, "ground_truth": 0}, {"key": "13750468", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25238404973495054, "ground_truth": 0}, {"key": "13750468", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364244819651915, "ground_truth": 0}, {"key": "13750468", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297272484276, "ground_truth": 0}, {"key": "17754949", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46101679195371426, "ground_truth": 0}, {"key": "17754949", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3208213058267375, "ground_truth": 0}, {"key": "17754949", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45326184424561394, "ground_truth": 0}, {"key": "17754949", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761562863959, "ground_truth": 0}, {"key": "17754949", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407826045581689, "ground_truth": 0}, {"key": "36675623", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7662936415886397, "ground_truth": 0}, {"key": "36675623", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8187368093189156, "ground_truth": 0}, {"key": "36675623", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6206216031236028, "ground_truth": 0}, {"key": "36675623", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867594796446, "ground_truth": 0}, {"key": "36675623", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620700989734006, "ground_truth": 0}, {"key": "40035440", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9289263317369627, "ground_truth": 0}, {"key": "40035440", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7295197824558415, "ground_truth": 0}, {"key": "40035440", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46295861217329976, "ground_truth": 0}, {"key": "40035440", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762845694231, "ground_truth": 0}, {"key": "40035440", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754547614431, "ground_truth": 0}, {"key": "37685909", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.175538065035743, "ground_truth": 0}, {"key": "37685909", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14903530368518664, "ground_truth": 0}, {"key": "37685909", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6057990710051688, "ground_truth": 0}, {"key": "37685909", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159119682697974, "ground_truth": 0}, {"key": "37685909", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421300761395153, "ground_truth": 0}, {"key": "36938787", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8799743753433952, "ground_truth": 0}, {"key": "36938787", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9343951648765905, "ground_truth": 0}, {"key": "36938787", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7648916012980654, "ground_truth": 0}, {"key": "36938787", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738209675917, "ground_truth": 0}, {"key": "36938787", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.895522669030714, "ground_truth": 0}, {"key": "39398068", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18126321269040416, "ground_truth": 0}, {"key": "39398068", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12592276754876555, "ground_truth": 0}, {"key": "39398068", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2598256397443263, "ground_truth": 0}, {"key": "39398068", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610490080790856, "ground_truth": 0}, {"key": "39398068", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667159294627954, "ground_truth": 0}, {"key": "39926408", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0960254894274912, "ground_truth": 0}, {"key": "39926408", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21076629386095078, "ground_truth": 0}, {"key": "39926408", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952108540481427, "ground_truth": 0}, {"key": "39926408", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624422639646, "ground_truth": 0}, {"key": "39926408", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629822231718, "ground_truth": 0}, {"key": "40465336", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2613309241289076, "ground_truth": 0}, {"key": "40465336", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733751974998194, "ground_truth": 0}, {"key": "40465336", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17667162108581488, "ground_truth": 0}, {"key": "40465336", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629691895564944, "ground_truth": 0}, {"key": "40465336", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.384912156847663, "ground_truth": 0}, {"key": "34173549", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8688267790633595, "ground_truth": 0}, {"key": "34173549", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.509764391528863, "ground_truth": 0}, {"key": "34173549", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8848377733638215, "ground_truth": 0}, {"key": "34173549", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.953966097258232, "ground_truth": 0}, {"key": "34173549", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425316667658, "ground_truth": 0}, {"key": "33541535", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38306413897966923, "ground_truth": 0}, {"key": "33541535", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3157359666246557, "ground_truth": 0}, {"key": "33541535", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4902356093389556, "ground_truth": 0}, {"key": "33541535", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704552267261, "ground_truth": 0}, {"key": "33541535", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666157197325, "ground_truth": 0}, {"key": "35685195", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6619228670397265, "ground_truth": 0}, {"key": "35685195", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4054487455173802, "ground_truth": 0}, {"key": "35685195", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5888891308226922, "ground_truth": 0}, {"key": "35685195", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224267587926, "ground_truth": 0}, {"key": "35685195", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019530841651425, "ground_truth": 0}, {"key": "28440730", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.071073667037813, "ground_truth": 0}, {"key": "28440730", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22135069676365116, "ground_truth": 0}, {"key": "28440730", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3208213067229233, "ground_truth": 0}, {"key": "28440730", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0933468783330944, "ground_truth": 0}, {"key": "28440730", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334210136323, "ground_truth": 0}, {"key": "38338714", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4551986130150454, "ground_truth": 0}, {"key": "38338714", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381375910114, "ground_truth": 0}, {"key": "38338714", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6132365406972932, "ground_truth": 0}, {"key": "38338714", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990476656154, "ground_truth": 0}, {"key": "38338714", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689543116518, "ground_truth": 0}, {"key": "32191881", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19072402281880435, "ground_truth": 0}, {"key": "32191881", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32939172699455677, "ground_truth": 0}, {"key": "32191881", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1755380731890182, "ground_truth": 0}, {"key": "32191881", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601154212706833, "ground_truth": 0}, {"key": "32191881", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.594551278707869, "ground_truth": 0}, {"key": "37707251", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13296425312977786, "ground_truth": 0}, {"key": "37707251", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531457831637, "ground_truth": 0}, {"key": "37707251", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378235128375412, "ground_truth": 0}, {"key": "37707251", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309345053052, "ground_truth": 0}, {"key": "37707251", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285231818629085, "ground_truth": 0}, {"key": "40172567", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1311732249494789, "ground_truth": 0}, {"key": "40172567", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14128141941944894, "ground_truth": 0}, {"key": "40172567", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1384617969263257, "ground_truth": 0}, {"key": "40172567", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203225585483, "ground_truth": 0}, {"key": "40172567", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561504256503188, "ground_truth": 0}, {"key": "33113255", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5813030951666388, "ground_truth": 0}, {"key": "33113255", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5755879905256874, "ground_truth": 0}, {"key": "33113255", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40168783505669986, "ground_truth": 0}, {"key": "33113255", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.552539728873186, "ground_truth": 0}, {"key": "33113255", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.55639957040388, "ground_truth": 0}, {"key": "33022143", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344543267625425, "ground_truth": 0}, {"key": "33022143", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.276690513078513, "ground_truth": 0}, {"key": "33022143", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2942149332750446, "ground_truth": 0}, {"key": "33022143", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.399811621861646, "ground_truth": 0}, {"key": "33022143", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207958297899, "ground_truth": 0}, {"key": "32084473", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6688802686991506, "ground_truth": 0}, {"key": "32084473", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5851011510083578, "ground_truth": 0}, {"key": "32084473", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4980468467774176, "ground_truth": 0}, {"key": "32084473", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.420599570468816, "ground_truth": 0}, {"key": "32084473", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.618780435382524, "ground_truth": 0}, {"key": "40564245", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5117166199707288, "ground_truth": 0}, {"key": "40564245", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7648916254624812, "ground_truth": 0}, {"key": "40564245", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7813306252158545, "ground_truth": 0}, {"key": "40564245", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013948892396, "ground_truth": 0}, {"key": "40564245", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723832465755, "ground_truth": 0}, {"key": "31717213", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2337063523076723, "ground_truth": 0}, {"key": "31717213", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27512973054246087, "ground_truth": 0}, {"key": "31717213", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24364246272740978, "ground_truth": 0}, {"key": "31717213", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.346873090320459, "ground_truth": 0}, {"key": "31717213", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897592685914, "ground_truth": 0}, {"key": "34861894", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168779586514414, "ground_truth": 0}, {"key": "34861894", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23651623485774576, "ground_truth": 0}, {"key": "34861894", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4301473504943914, "ground_truth": 0}, {"key": "34861894", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2133771695461637, "ground_truth": 0}, {"key": "34861894", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861805229232615, "ground_truth": 0}, {"key": "40838760", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.684264035157422, "ground_truth": 0}, {"key": "40838760", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5717665853800291, "ground_truth": 0}, {"key": "40838760", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6020616083408705, "ground_truth": 0}, {"key": "40838760", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730023517498, "ground_truth": 0}, {"key": "40838760", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526424206941, "ground_truth": 0}, {"key": "40044849", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4301473438549968, "ground_truth": 0}, {"key": "40044849", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.660172401803472, "ground_truth": 0}, {"key": "40044849", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5078118649462046, "ground_truth": 0}, {"key": "40044849", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413821690107, "ground_truth": 0}, {"key": "40044849", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004310354137, "ground_truth": 0}, {"key": "30296116", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344543845709372, "ground_truth": 0}, {"key": "30296116", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37570647344646185, "ground_truth": 0}, {"key": "30296116", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19436781906972544, "ground_truth": 0}, {"key": "30296116", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925952945744101, "ground_truth": 0}, {"key": "30296116", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667160227986034, "ground_truth": 0}, {"key": "34931360", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5544704559266301, "ground_truth": 0}, {"key": "34931360", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381111106041, "ground_truth": 0}, {"key": "34931360", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3123700147688873, "ground_truth": 0}, {"key": "34931360", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815648018707177, "ground_truth": 0}, {"key": "34931360", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091976815706572, "ground_truth": 0}, {"key": "18862422", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2094696995527866, "ground_truth": 0}, {"key": "18862422", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4378234946775034, "ground_truth": 0}, {"key": "18862422", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25386101519375576, "ground_truth": 0}, {"key": "18862422", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320633794462445, "ground_truth": 0}, {"key": "18862422", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357438903458375, "ground_truth": 0}, {"key": "36361140", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4339814622018486, "ground_truth": 0}, {"key": "36361140", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36477756286860713, "ground_truth": 0}, {"key": "36361140", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44360042112012094, "ground_truth": 0}, {"key": "36361140", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195814825894, "ground_truth": 0}, {"key": "36361140", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398630638324186, "ground_truth": 0}, {"key": "39703329", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2146914303590881, "ground_truth": 0}, {"key": "39703329", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25534363825340745, "ground_truth": 0}, {"key": "39703329", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1721718485735907, "ground_truth": 0}, {"key": "39703329", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539863149923208, "ground_truth": 0}, {"key": "39703329", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520684496018, "ground_truth": 0}, {"key": "34033324", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8774767827676607, "ground_truth": 0}, {"key": "34033324", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7866228185896871, "ground_truth": 0}, {"key": "34033324", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6406358687603745, "ground_truth": 0}, {"key": "34033324", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9304582585028164, "ground_truth": 0}, {"key": "34033324", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195373804842, "ground_truth": 0}, {"key": "35658862", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3259495095606008, "ground_truth": 0}, {"key": "35658862", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6688802663360669, "ground_truth": 0}, {"key": "35658862", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6406358837401704, "ground_truth": 0}, {"key": "35658862", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700261515942, "ground_truth": 0}, {"key": "35658862", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2494472298861753, "ground_truth": 0}, {"key": "36092657", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6039318618172267, "ground_truth": 0}, {"key": "36092657", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5794004166200226, "ground_truth": 0}, {"key": "36092657", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4532618416575376, "ground_truth": 0}, {"key": "36092657", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132649276652725, "ground_truth": 0}, {"key": "36092657", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.699254436217917, "ground_truth": 0}, {"key": "26333438", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14414885732765137, "ground_truth": 0}, {"key": "26333438", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19436781700606104, "ground_truth": 0}, {"key": "26333438", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12678516859176758, "ground_truth": 0}, {"key": "26333438", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678517373148462, "ground_truth": 0}, {"key": "26333438", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594720022651923, "ground_truth": 0}, {"key": "34184963", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17553806718365653, "ground_truth": 0}, {"key": "34184963", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39606817367239994, "ground_truth": 0}, {"key": "34184963", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15304215973792157, "ground_truth": 0}, {"key": "34184963", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31742625484841747, "ground_truth": 0}, {"key": "34184963", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435834901523325, "ground_truth": 0}, {"key": "35069975", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2782567982640192, "ground_truth": 0}, {"key": "35069975", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3123700328108862, "ground_truth": 0}, {"key": "35069975", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15921740259471484, "ground_truth": 0}, {"key": "35069975", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937167588554713, "ground_truth": 0}, {"key": "35069975", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629691876608766, "ground_truth": 0}, {"key": "36443950", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1812632010687145, "ground_truth": 0}, {"key": "36443950", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21469140351836413, "ground_truth": 0}, {"key": "36443950", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16344543016155935, "ground_truth": 0}, {"key": "36443950", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685106187816, "ground_truth": 0}, {"key": "36443950", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2628418477432571, "ground_truth": 0}, {"key": "29460858", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14414885653636003, "ground_truth": 0}, {"key": "29460858", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.289371705490539, "ground_truth": 0}, {"key": "29460858", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19193278882165524, "ground_truth": 0}, {"key": "29460858", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436853000409926, "ground_truth": 0}, {"key": "29460858", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451398332456, "ground_truth": 0}, {"key": "36155704", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13939638495268916, "ground_truth": 0}, {"key": "36155704", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1835936312911927, "ground_truth": 0}, {"key": "36155704", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.083291926997078, "ground_truth": 0}, {"key": "36155704", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12852513474161578, "ground_truth": 0}, {"key": "36155704", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.130285421102623, "ground_truth": 0}, {"key": "37185211", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "37185211", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7476159629600155, "ground_truth": 0}, {"key": "37185211", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5078118632426551, "ground_truth": 0}, {"key": "37185211", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136775717853, "ground_truth": 0}, {"key": "37185211", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878434504706, "ground_truth": 0}, {"key": "36454885", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2942149533532468, "ground_truth": 0}, {"key": "36454885", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2814056187097123, "ground_truth": 0}, {"key": "36454885", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24508499341683718, "ground_truth": 0}, {"key": "36454885", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2323101567550966, "ground_truth": 0}, {"key": "36454885", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197309837715, "ground_truth": 0}, {"key": "33148906", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11676401203432565, "ground_truth": 0}, {"key": "33148906", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15304215804095686, "ground_truth": 0}, {"key": "33148906", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16451645254780603, "ground_truth": 0}, {"key": "33148906", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239108809897236, "ground_truth": 0}, {"key": "33148906", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944723121261456, "ground_truth": 0}, {"key": "18086604", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24364246376488033, "ground_truth": 0}, {"key": "18086604", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24944723161720092, "ground_truth": 0}, {"key": "18086604", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135069513675468, "ground_truth": 0}, {"key": "18086604", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436782776613268, "ground_truth": 0}, {"key": "18086604", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11436853144196252, "ground_truth": 0}, {"key": "33693397", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3557748978100918, "ground_truth": 0}, {"key": "33693397", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2782567607176317, "ground_truth": 0}, {"key": "33693397", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20689406243364436, "ground_truth": 0}, {"key": "33693397", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925952887842257, "ground_truth": 0}, {"key": "33693397", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641767700103, "ground_truth": 0}, {"key": "39501530", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22405545737183086, "ground_truth": 0}, {"key": "39501530", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2658804710474441, "ground_truth": 0}, {"key": "39501530", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132024035190537, "ground_truth": 0}, {"key": "39501530", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894452428416, "ground_truth": 0}, {"key": "39501530", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43590152749110284, "ground_truth": 0}, {"key": "30948874", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45326185088512, "ground_truth": 0}, {"key": "30948874", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2766905385106711, "ground_truth": 0}, {"key": "30948874", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4649015865958583, "ground_truth": 0}, {"key": "30948874", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906214643474, "ground_truth": 0}, {"key": "30948874", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990625802573, "ground_truth": 0}, {"key": "39410675", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4746312060843423, "ground_truth": 0}, {"key": "39410675", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7549149790006224, "ground_truth": 0}, {"key": "39410675", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7826625004866264, "ground_truth": 0}, {"key": "39410675", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948330413616, "ground_truth": 0}, {"key": "39410675", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926420009113121, "ground_truth": 0}, {"key": "32903337", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15817436003916915, "ground_truth": 0}, {"key": "32903337", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20946968892482154, "ground_truth": 0}, {"key": "32903337", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20181320417807727, "ground_truth": 0}, {"key": "32903337", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043418826659327, "ground_truth": 0}, {"key": "32903337", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386748761004347, "ground_truth": 0}, {"key": "27685132", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238003185489108, "ground_truth": 0}, {"key": "27685132", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817893506339427, "ground_truth": 0}, {"key": "27685132", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2227001424225576, "ground_truth": 0}, {"key": "27685132", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13939638125039994, "ground_truth": 0}, {"key": "27685132", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09401018289053656, "ground_truth": 0}, {"key": "22791471", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20946968149743975, "ground_truth": 0}, {"key": "22791471", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26284184673260763, "ground_truth": 0}, {"key": "22791471", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41489885443576674, "ground_truth": 0}, {"key": "22791471", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.437823472726557, "ground_truth": 0}, {"key": "22791471", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709599884266, "ground_truth": 0}, {"key": "32292348", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27669051156351737, "ground_truth": 0}, {"key": "32292348", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733751457831332, "ground_truth": 0}, {"key": "32292348", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25982564439622513, "ground_truth": 0}, {"key": "32292348", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26894141134110383, "ground_truth": 0}, {"key": "32292348", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.289371689824906, "ground_truth": 0}, {"key": "20482930", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3415824931316201, "ground_truth": 0}, {"key": "20482930", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813031074657933, "ground_truth": 0}, {"key": "20482930", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3056973249009723, "ground_truth": 0}, {"key": "20482930", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44167300530120657, "ground_truth": 0}, {"key": "20482930", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523087624619, "ground_truth": 0}, {"key": "11635754", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39606816213258333, "ground_truth": 0}, {"key": "11635754", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2704802281547997, "ground_truth": 0}, {"key": "11635754", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37937840837189574, "ground_truth": 0}, {"key": "11635754", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953531823813, "ground_truth": 0}, {"key": "11635754", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.519521307506699, "ground_truth": 0}, {"key": "40029096", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4148988630981601, "ground_truth": 0}, {"key": "40029096", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16451644453290806, "ground_truth": 0}, {"key": "40029096", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2407745962878613, "ground_truth": 0}, {"key": "40029096", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26894144377031265, "ground_truth": 0}, {"key": "40029096", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276682883193823, "ground_truth": 0}, {"key": "40414719", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8152324955397636, "ground_truth": 0}, {"key": "40414719", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813030809872527, "ground_truth": 0}, {"key": "40414719", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7154239947124008, "ground_truth": 0}, {"key": "40414719", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563557725289, "ground_truth": 0}, {"key": "40414719", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740203367157, "ground_truth": 0}, {"key": "39537616", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40733339138097346, "ground_truth": 0}, {"key": "39537616", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3522017876287083, "ground_truth": 0}, {"key": "39537616", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40168779300401425, "ground_truth": 0}, {"key": "39537616", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552954319911336, "ground_truth": 0}, {"key": "39537616", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964338494744, "ground_truth": 0}, {"key": "33245830", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.533154400175327, "ground_truth": 0}, {"key": "33245830", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5350984360425493, "ground_truth": 0}, {"key": "33245830", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4130035634676838, "ground_truth": 0}, {"key": "33245830", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852882966131727, "ground_truth": 0}, {"key": "33245830", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906541374513, "ground_truth": 0}, {"key": "39243601", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.176671613238743, "ground_truth": 0}, {"key": "39243601", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06804042374789994, "ground_truth": 0}, {"key": "39243601", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24364245858653927, "ground_truth": 0}, {"key": "39243601", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706453219849192, "ground_truth": 0}, {"key": "39243601", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561505385098264, "ground_truth": 0}, {"key": "35815905", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1666754104825168, "ground_truth": 0}, {"key": "35815905", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2553436473917458, "ground_truth": 0}, {"key": "35815905", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.045352579929454545, "ground_truth": 0}, {"key": "35815905", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940273634030394, "ground_truth": 0}, {"key": "35815905", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733752808069862, "ground_truth": 0}, {"key": "35260212", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3056973241241178, "ground_truth": 0}, {"key": "35260212", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43974737409104786, "ground_truth": 0}, {"key": "35260212", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.299105191188145, "ground_truth": 0}, {"key": "35260212", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934934691525234, "ground_truth": 0}, {"key": "35260212", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761081112875, "ground_truth": 0}, {"key": "39193924", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17328822810365294, "ground_truth": 0}, {"key": "39193924", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26133090519272917, "ground_truth": 0}, {"key": "39193924", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09009299007117731, "ground_truth": 0}, {"key": "39193924", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713686108433506, "ground_truth": 0}, {"key": "39193924", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15203224483927671, "ground_truth": 0}, {"key": "40658569", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14414885405418568, "ground_truth": 0}, {"key": "40658569", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34864515809785906, "ground_truth": 0}, {"key": "40658569", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "40658569", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387580895075223, "ground_truth": 0}, {"key": "40658569", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1812632005323612, "ground_truth": 0}, {"key": "33497596", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24508501746899372, "ground_truth": 0}, {"key": "33497596", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15304215316264314, "ground_truth": 0}, {"key": "33497596", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12506537637872406, "ground_truth": 0}, {"key": "33497596", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685682631598, "ground_truth": 0}, {"key": "33497596", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678516749437663, "ground_truth": 0}, {"key": "40339241", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4785288065182387, "ground_truth": 0}, {"key": "40339241", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531030219025, "ground_truth": 0}, {"key": "40339241", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48242911877354927, "ground_truth": 0}, {"key": "40339241", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995901776887, "ground_truth": 0}, {"key": "40339241", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436439305801, "ground_truth": 0}, {"key": "31792608", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21337717992174404, "ground_truth": 0}, {"key": "31792608", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33458944532095414, "ground_truth": 0}, {"key": "31792608", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16667540013003082, "ground_truth": 0}, {"key": "31792608", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814056138607097, "ground_truth": 0}, {"key": "31792608", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2005576768088151, "ground_truth": 0}, {"key": "33132662", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25386099851797556, "ground_truth": 0}, {"key": "33132662", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46101681681531254, "ground_truth": 0}, {"key": "33132662", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35398629197694725, "ground_truth": 0}, {"key": "33132662", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121939350559, "ground_truth": 0}, {"key": "33132662", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667539309170512, "ground_truth": 0}, {"key": "37577457", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4649015622563882, "ground_truth": 0}, {"key": "37577457", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982292019342, "ground_truth": 0}, {"key": "37577457", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845759975074063, "ground_truth": 0}, {"key": "37577457", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350559255434, "ground_truth": 0}, {"key": "37577457", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387580299785866, "ground_truth": 0}, {"key": "38701278", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3702253845698538, "ground_truth": 0}, {"key": "38701278", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49023558901037617, "ground_truth": 0}, {"key": "38701278", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48633152024933907, "ground_truth": 0}, {"key": "38701278", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310453841703, "ground_truth": 0}, {"key": "38701278", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473232389843, "ground_truth": 0}, {"key": "34570783", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6757646081544939, "ground_truth": 0}, {"key": "34570783", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5214711686846143, "ground_truth": 0}, {"key": "34570783", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8386797759094149, "ground_truth": 0}, {"key": "34570783", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.779992881733728, "ground_truth": 0}, {"key": "34570783", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883413048212, "ground_truth": 0}, {"key": "39064526", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12421300952834317, "ground_truth": 0}, {"key": "39064526", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541659879335021, "ground_truth": 0}, {"key": "39064526", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1688569610671584, "ground_truth": 0}, {"key": "39064526", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135069492469264, "ground_truth": 0}, {"key": "39064526", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657966996061235, "ground_truth": 0}, {"key": "40741545", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5234203553375089, "ground_truth": 0}, {"key": "40741545", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8128673198999185, "ground_truth": 0}, {"key": "40741545", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6601723653119513, "ground_truth": 0}, {"key": "40741545", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740072511046, "ground_truth": 0}, {"key": "40741545", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666014035404, "ground_truth": 0}, {"key": "36929751", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8019358178654467, "ground_truth": 0}, {"key": "36929751", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6279512056719531, "ground_truth": 0}, {"key": "36929751", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7341195075376977, "ground_truth": 0}, {"key": "36929751", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511529724278, "ground_truth": 0}, {"key": "36929751", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898583390089, "ground_truth": 0}, {"key": "23984730", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.201813233281918, "ground_truth": 0}, {"key": "23984730", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48047867823795126, "ground_truth": 0}, {"key": "23984730", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24798744573032125, "ground_truth": 0}, {"key": "23984730", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793841524681894, "ground_truth": 0}, {"key": "23984730", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3023910875684759, "ground_truth": 0}, {"key": "36007415", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38861804099127334, "ground_truth": 0}, {"key": "36007415", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.744656335106034, "ground_truth": 0}, {"key": "36007415", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42441196173420465, "ground_truth": 0}, {"key": "36007415", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943710864128, "ground_truth": 0}, {"key": "36007415", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590760998392154, "ground_truth": 0}, {"key": "38875041", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23370637139437705, "ground_truth": 0}, {"key": "38875041", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47268348267942256, "ground_truth": 0}, {"key": "38875041", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3942009685670989, "ground_truth": 0}, {"key": "38875041", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986082171059, "ground_truth": 0}, {"key": "38875041", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438006947544576, "ground_truth": 0}]